Merge pull request #218 from azooKey/fix/dynamic_user_dictionary

fix: 動的ユーザ辞書が適切に読めていなかった問題を修正
This commit is contained in:
Miwa
2025-07-06 17:09:25 +09:00
committed by GitHub
2 changed files with 106 additions and 12 deletions

View File

@@ -256,8 +256,8 @@ public final class DicdataStore {
var generator = TypoCorrectionGenerator(inputs: inputs, leftIndex: leftIndex, rightIndexRange: rightIndexRange, needTypoCorrection: needTypoCorrection)
var targetLOUDS: [String: LOUDS.MovingTowardPrefixSearchHelper] = [:]
var stringToInfo: [([Character], (endIndex: Int, penalty: PValue))] = []
var temporaryMemoryDicdata: [Int: [DicdataElement]] = [:]
//
var dynamicDicdata: [Int: [DicdataElement]] = [:]
//
while let (characters, info) = generator.next() {
guard let firstCharacter = characters.first else {
@@ -291,7 +291,7 @@ public final class DicdataStore {
for (depth, dicdata) in result.dicdata {
for data in dicdata {
if info.penalty.isZero {
temporaryMemoryDicdata[depth, default: []].append(data)
dynamicDicdata[depth, default: []].append(data)
}
let ratio = Self.penaltyRatio[data.lcid]
let pUnit: PValue = Self.getPenalty(data: data) / 2 //
@@ -299,7 +299,29 @@ public final class DicdataStore {
if self.shouldBeRemoved(value: data.value() + adjust, wordCount: data.ruby.count) {
continue
}
temporaryMemoryDicdata[depth, default: []].append(data.adjustedData(adjust))
dynamicDicdata[depth, default: []].append(data.adjustedData(adjust))
}
}
if !self.dynamicUserDict.isEmpty {
//
let katakanaString = String(characters).toKatakana()
let dynamicUserDictResult = self.getMatchDynamicUserDict(katakanaString)
updated = updated || !dynamicUserDictResult.isEmpty
for data in dynamicUserDictResult {
let depth = characters.endIndex
if info.penalty.isZero {
dynamicDicdata[depth, default: []].append(data)
} else {
let ratio = Self.penaltyRatio[data.lcid]
let pUnit: PValue = Self.getPenalty(data: data) / 2 //
let adjust = pUnit * info.penalty * ratio
if self.shouldBeRemoved(value: data.value() + adjust, wordCount: Array(data.ruby).count) {
continue
}
dynamicDicdata[depth, default: []].append(data.adjustedData(adjust))
}
// Also register the entry's ruby in stringToInfo (cf. getLOUDSDataInRange)
stringToInfo.append((Array(data.ruby), (depth - 1, info.penalty)))
}
}
if availableMaxIndex < characters.endIndex - 1 {
@@ -314,7 +336,7 @@ public final class DicdataStore {
return (
Dictionary(stringToInfo, uniquingKeysWith: {$0.penalty < $1.penalty ? $1 : $0}),
targetLOUDS.map { ($0.key, $0.value.indicesInDepth(depth: minCount - 1 ..< .max) )},
temporaryMemoryDicdata.flatMap {
dynamicDicdata.flatMap {
minCount < $0.key + 1 ? $0.value : []
}
)
@@ -401,13 +423,6 @@ public final class DicdataStore {
}
dicdata.append(contentsOf: result)
}
do {
let result = self.getMatchDynamicUserDict(segments[i - fromIndex])
for item in result {
stringToInfo[Array(item.ruby)] = (i, 0)
}
dicdata.append(contentsOf: result)
}
}
if fromIndex == .zero {
let result: [LatticeNode] = dicdata.compactMap {