Class SingleByteCharsetProber
- java.lang.Object
-
- org.mozilla.universalchardet.prober.CharsetProber
-
- org.mozilla.universalchardet.prober.SingleByteCharsetProber
-
public class SingleByteCharsetProber extends CharsetProber
-
-
Nested Class Summary
-
Nested classes/interfaces inherited from class org.mozilla.universalchardet.prober.CharsetProber
CharsetProber.ProbingState
-
-
Field Summary
Fields
Modifier and Type | Field | Description
private int
freqChar
private short
lastOrder
private SequenceModel
model
private CharsetProber
nameProber
static int
NEGATIVE_CAT
static float
NEGATIVE_SHORTCUT_THRESHOLD
static int
NUMBER_OF_SEQ_CAT
static int
POSITIVE_CAT
static float
POSITIVE_SHORTCUT_THRESHOLD
private boolean
reversed
static int
SAMPLE_SIZE
static int
SB_ENOUGH_REL_THRESHOLD
private int[]
seqCounters
private CharsetProber.ProbingState
state
static int
SYMBOL_CAT_ORDER
private int
totalChar
private int
totalSeqs
-
Fields inherited from class org.mozilla.universalchardet.prober.CharsetProber
ASCII_A, ASCII_A_CAPITAL, ASCII_GT, ASCII_LT, ASCII_SP, ASCII_Z, ASCII_Z_CAPITAL, SHORTCUT_THRESHOLD
-
-
Constructor Summary
Constructors
Constructor | Description
SingleByteCharsetProber(SequenceModel model)
SingleByteCharsetProber(SequenceModel model, boolean reversed, CharsetProber nameProber)
-
Method Summary
All Methods | Instance Methods | Concrete Methods
Modifier and Type | Method | Description
java.lang.String
getCharSetName()
float
getConfidence()
CharsetProber.ProbingState
getState()
CharsetProber.ProbingState
handleData(byte[] buf, int offset, int length)
(package private) boolean
keepEnglishLetters()
void
reset()
void
setOption()
-
Methods inherited from class org.mozilla.universalchardet.prober.CharsetProber
filterWithEnglishLetters, filterWithoutEnglishLetters, isActive, setActive
-
-
-
-
Field Detail
-
SAMPLE_SIZE
public static final int SAMPLE_SIZE
- See Also:
- Constant Field Values
-
SB_ENOUGH_REL_THRESHOLD
public static final int SB_ENOUGH_REL_THRESHOLD
- See Also:
- Constant Field Values
-
POSITIVE_SHORTCUT_THRESHOLD
public static final float POSITIVE_SHORTCUT_THRESHOLD
- See Also:
- Constant Field Values
-
NEGATIVE_SHORTCUT_THRESHOLD
public static final float NEGATIVE_SHORTCUT_THRESHOLD
- See Also:
- Constant Field Values
-
SYMBOL_CAT_ORDER
public static final int SYMBOL_CAT_ORDER
- See Also:
- Constant Field Values
-
NUMBER_OF_SEQ_CAT
public static final int NUMBER_OF_SEQ_CAT
- See Also:
- Constant Field Values
-
POSITIVE_CAT
public static final int POSITIVE_CAT
- See Also:
- Constant Field Values
-
NEGATIVE_CAT
public static final int NEGATIVE_CAT
- See Also:
- Constant Field Values
-
state
private CharsetProber.ProbingState state
-
model
private SequenceModel model
-
reversed
private boolean reversed
-
lastOrder
private short lastOrder
-
totalSeqs
private int totalSeqs
-
seqCounters
private int[] seqCounters
-
totalChar
private int totalChar
-
freqChar
private int freqChar
-
nameProber
private CharsetProber nameProber
-
-
Constructor Detail
-
SingleByteCharsetProber
public SingleByteCharsetProber(SequenceModel model)
-
SingleByteCharsetProber
public SingleByteCharsetProber(SequenceModel model, boolean reversed, CharsetProber nameProber)
-
-
Method Detail
-
keepEnglishLetters
boolean keepEnglishLetters()
-
getCharSetName
public java.lang.String getCharSetName()
- Specified by: getCharSetName in class CharsetProber
-
getConfidence
public float getConfidence()
- Specified by: getConfidence in class CharsetProber
-
getState
public CharsetProber.ProbingState getState()
- Specified by: getState in class CharsetProber
-
handleData
public CharsetProber.ProbingState handleData(byte[] buf, int offset, int length)
- Specified by: handleData in class CharsetProber
-
reset
public final void reset()
- Specified by: reset in class CharsetProber
-
setOption
public void setOption()
- Specified by: setOption in class CharsetProber
-
-