zmc
2023-12-22 9fdbf60165db0400c2e8e6be2dc6e88138ac719a
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
U
L±dã@s`ddlmZmZmZmZmZddlmZddlm    Z    m
Z
m Z Gdd„deƒZ Gdd„deƒZ d    S)
é)ÚDictÚListÚ
NamedTupleÚOptionalÚUnioné)Ú CharSetProber)ÚCharacterCategoryÚ ProbingStateÚSequenceLikelihoodc@s^eZdZUeed<eed<eeefed<eeeeeffed<eed<eed<eed<dS)    ÚSingleByteCharSetModelÚ charset_nameÚlanguageÚchar_to_order_mapÚlanguage_modelÚtypical_positive_ratioÚkeep_ascii_lettersÚalphabetN)    Ú__name__Ú
__module__Ú __qualname__ÚstrÚ__annotations__rÚintÚfloatÚbool©rrúNd:\z\workplace\vscode\pyvenv\venv\Lib\site-packages\chardet/sbcharsetprober.pyr #s
r cs¢eZdZdZdZdZdZdeee    e
ddœ‡fdd    „ Z dd
œ‡fd d „ Z e e    ed
œd d„ƒZe e    ed
œdd„ƒZeeefedœdd„Zed
œdd„Z‡ZS)ÚSingleByteCharSetProberé@igffffffî?gš™™™™™©?FN)ÚmodelÚ is_reversedÚ name_proberÚreturncsLtƒ ¡||_||_||_d|_g|_d|_d|_d|_    d|_
|  ¡dS©Néÿr) ÚsuperÚ__init__Ú_modelÚ    _reversedÚ _name_proberÚ _last_orderÚ _seq_countersÚ _total_seqsÚ _total_charÚ _control_charÚ
_freq_charÚreset)Úselfr r!r"©Ú    __class__rrr'3s
z SingleByteCharSetProber.__init__)r#cs<tƒ ¡d|_dgt ¡|_d|_d|_d|_d|_    dSr$)
r&r1r+r Úget_num_categoriesr,r-r.r/r0©r2r3rrr1Gs
zSingleByteCharSetProber.resetcCs|jr|jjS|jjS©N)r*r r(r6rrrr Rsz$SingleByteCharSetProber.charset_namecCs|jr|jjS|jjSr7)r*rr(r6rrrrXsz SingleByteCharSetProber.language)Úbyte_strr#c    CsV|jjs| |¡}n
| |¡}|s(|jS|jj}|jj}|D]˜}| |tj    ¡}|tj
krf|j d7_ ||j krÎ|j d7_ |j|j krÎ|jd7_|js®||j|}n|||j}|j|d7<||_q<|jj}|jtjkrP|j|jkrP| ¡}||jkr(|j d||¡tj|_n(||jkrP|j d|||j¡tj|_|jS)Nrz$%s confidence = %s, we have a winnerz8%s confidence = %s, below negative shortcut threshold %s)r(rÚfilter_international_wordsZremove_xml_tagsÚstaterrÚgetr    Ú    UNDEFINEDÚCONTROLr.Ú SAMPLE_SIZEr0r+r-r)r,r r
Ú    DETECTINGÚSB_ENOUGH_REL_THRESHOLDÚget_confidenceÚPOSITIVE_SHORTCUT_THRESHOLDÚloggerÚdebugÚFOUND_ITÚ_stateÚNEGATIVE_SHORTCUT_THRESHOLDÚNOT_ME)    r2r8rrÚcharÚorderZlm_catr Ú
confidencerrrÚfeed^sP 
 
 
  ÿ
 üzSingleByteCharSetProber.feedcCsnd}|jdkrj|jtjd|jtj|j|jj}||j|j|j}||j    |j}|dkrjd}|S)Ng{®Gáz„?rgÐ?gð?g®Gáz®ï?)
r-r,r ÚPOSITIVEÚLIKELYr(rr.r/r0)r2ÚrrrrrAs
 
ÿüûÿ z&SingleByteCharSetProber.get_confidence)FN)rrrr>r@rBrGr rrrr'r1Úpropertyrr rrÚbytesÚ    bytearrayr
rLrrAÚ __classcell__rrr3rr-s&üû 2rN)ÚtypingrrrrrÚ charsetproberrÚenumsr    r
r r rrrrrÚ<module>s