Class: CharDet::JapaneseContextAnalysis
- Inherits:
-
Object
- Object
- CharDet::JapaneseContextAnalysis
show all
- Defined in:
- lib/rchardet/jpcntx.rb
Instance Method Summary
collapse
Constructor Details
Returns a new instance of JapaneseContextAnalysis.
124
125
126
|
# File 'lib/rchardet/jpcntx.rb', line 124
# Builds a new analyser; all state setup is delegated to #reset.
def initialize
  reset
end
|
Instance Method Details
#feed(aBuf, aLen) ⇒ Object
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
|
# File 'lib/rchardet/jpcntx.rb', line 136
# Scans +aBuf+ character by character and tallies, for each pair of
# consecutive characters with a known order, the category given by
# JP2_CHAR_CONTEXT[previous_order][order].
#
# aBuf - buffer to analyse; sliced two elements at a time for #get_order.
# aLen - number of leading elements of aBuf to consider.
#
# Returns nothing meaningful. Does nothing once @_mDone has been set.
def feed(aBuf, aLen)
  return if @_mDone

  pos = @_mNeedToSkipCharNum
  # The pending skip applies to this buffer only. Consume it here and carry
  # over just the part a too-short buffer cannot absorb; otherwise every
  # later call would keep skipping leading bytes and lose character alignment.
  @_mNeedToSkipCharNum = pos > aLen ? pos - aLen : 0

  while pos < aLen
    order, char_len = get_order(aBuf[pos...pos + 2])
    pos += char_len

    if pos > aLen
      # The character runs past the end of this buffer: remember how many of
      # its units belong to the next buffer and drop the pairing context.
      @_mNeedToSkipCharNum = pos - aLen
      @_mLastCharOrder = -1
    else
      if order != -1 && @_mLastCharOrder != -1
        @_mTotalRel += 1
        if @_mTotalRel > MAX_REL_THRESHOLD
          # Enough pairs collected; later calls return immediately.
          @_mDone = true
          break
        end
        @_mRelSample[JP2_CHAR_CONTEXT[@_mLastCharOrder][order]] += 1
      end
      @_mLastCharOrder = order
    end
  end
end
|
#get_confidence ⇒ Object
170
171
172
173
174
175
176
177
|
# File 'lib/rchardet/jpcntx.rb', line 170
# Confidence derived from the pair statistics collected by #feed.
#
# Returns the fraction (Float) of counted pairs that did not fall into
# category 0 once more than MINIMUM_DATA_THRESHOLD pairs have been seen;
# otherwise returns DONT_KNOW.
def get_confidence
  return DONT_KNOW unless @_mTotalRel > MINIMUM_DATA_THRESHOLD

  # fdiv forces floating-point division; plain Integer#/ would truncate
  # the ratio to 0 or 1.
  (@_mTotalRel - @_mRelSample[0]).fdiv(@_mTotalRel)
end
|
#get_order(aStr) ⇒ Object
179
180
181
|
# File 'lib/rchardet/jpcntx.rb', line 179
# Default lookup: ignores +aStr+ and reports order -1 with a length of 1.
# #feed consumes the pair as (order, character length).
def get_order(aStr)
  [-1, 1]
end
|
#got_enough_data ⇒ Object
166
167
168
|
# File 'lib/rchardet/jpcntx.rb', line 166
# True once the number of counted pairs exceeds ENOUGH_REL_THRESHOLD.
def got_enough_data
  @_mTotalRel > ENOUGH_REL_THRESHOLD
end
|
#reset ⇒ Object
128
129
130
131
132
133
134
|
# File 'lib/rchardet/jpcntx.rb', line 128
# Restores the analyser to its initial state so it can be reused.
def reset
  @_mTotalRel = 0                                # pairs counted so far
  @_mRelSample = Array.new(NUM_OF_CATEGORY, 0)   # per-category pair tallies
  @_mNeedToSkipCharNum = 0                       # units to skip at the start of the next buffer
  @_mLastCharOrder = -1                          # -1 means there is no previous character to pair with
  @_mDone = false                                # set by #feed once MAX_REL_THRESHOLD is exceeded
end
|