28 from typing import Optional, Union
30 from .charsetprober import CharSetProber
31 from .enums import ProbingState
32 from .sbcharsetprober import SingleByteCharSetProber
149 MIN_FINAL_CHAR_DISTANCE = 5
154 MIN_MODEL_DISTANCE = 0.01
156 VISUAL_HEBREW_NAME = "ISO-8859-8"
157 LOGICAL_HEBREW_NAME = "windows-1255"
181 logical_prober: SingleByteCharSetProber,
182 visual_prober: SingleByteCharSetProber,
209 def feed(self, byte_str: Union[bytes, bytearray]) -> ProbingState:
243 if cur == self.SPACE:
260 and (cur != self.SPACE)
bytes filter_high_byte_only(Union[bytes, bytearray] buf)
float get_confidence(self)
General ideas of the Hebrew charset recognition.
_final_char_logical_score
bool is_non_final(self, int c)
bool is_final(self, int c)
int MIN_FINAL_CHAR_DISTANCE
None set_model_probers(self, SingleByteCharSetProber logical_prober, SingleByteCharSetProber visual_prober)
ProbingState feed(self, Union[bytes, bytearray] byte_str)