diff options
Diffstat (limited to 'libtextcat/data/new_fingerprints/lm/italian.lm')
-rw-r--r-- | libtextcat/data/new_fingerprints/lm/italian.lm | 400 |
1 files changed, 400 insertions, 0 deletions
diff --git a/libtextcat/data/new_fingerprints/lm/italian.lm b/libtextcat/data/new_fingerprints/lm/italian.lm new file mode 100644 index 000000000000..543cadcfa88e --- /dev/null +++ b/libtextcat/data/new_fingerprints/lm/italian.lm @@ -0,0 +1,400 @@ +_ 25028 +a 7570 +e 6477 +i 5481 +o 5104 +l 3905 +n 3866 +r 3502 +t 2934 +c 2862 +s 2862 +a_ 2504 +e_ 2404 +d 2004 +i_ 1749 +o_ 1679 +u 1650 +v 1611 +p 1561 +m 1414 +_c 1325 +, 1192 +,_ 1192 +_s 1190 +_d 1094 +g 1067 +an 925 +er 915 +_a 914 +_p 895 +la 858 +_l 830 +re 799 +ar 769 +h 762 +no 753 +co 726 +va 698 +_e 657 +n_ 656 +on 656 +ra 653 +to 651 +f 638 +di 638 +_i 634 +ch 634 +ll 633 +l_ 624 +la_ 598 +ta 593 +el 576 +in 567 +_m 558 +en 529 +b 528 +ri 525 +_co 523 +_n 523 +_di 522 +li 513 +av 507 +al 501 +le 494 +ia 492 +se 484 +ol 479 +_f 477 +or 477 +te 469 +_e_ 467 +ve 454 +at 449 +de 447 +. 443 +ne 429 +va_ 428 +ca 426 +._ 422 +tt 422 +re_ 415 +nt 415 +io 411 +_v 407 +pe 405 +z 392 +to_ 391 +_ch 389 +na 384 +si 384 +' 383 +he 382 +no_ 379 +ci 374 +_la 373 +ro 371 +_g 370 +st 368 +cc 366 +he_ 362 +di_ 362 +ma 358 +ev 354 +che 354 +es 352 +me 352 +pa 351 +_t 349 +ti 348 +_di_ 347 +ss 345 +che_ 344 +a,_ 337 +a, 337 +nd 335 +o, 333 +o,_ 333 +ell 330 +gl 323 +sa 322 +il 322 +gli 321 +da 318 +as 318 +do 314 +_che 308 +_che_ 306 +eva 306 +_la_ 300 +lla 298 +le_ 293 +un 291 +_pe 290 +_de 288 +q 283 +qu 283 +ava 280 +po 277 +on_ 275 +r_ 273 +li_ 273 +_b 269 +_il 268 +_il_ 268 +il_ 268 +lo 267 +om 263 +e, 263 +e,_ 263 +ni 258 +tr 258 +so 255 +ra_ 253 +os 251 +_in 249 +_u 248 +per 244 +are 243 +et 243 +_se 240 +ano 239 +si_ 238 +_ca 238 +_qu 238 +lla_ 238 +_q 238 +_a_ 236 +ac 236 +_r 234 +ic 233 +_no 232 +ie 227 +fa 227 +hi 226 +del 225 +ua 222 +_per 218 +ce 218 +_ma 216 +sc 216 +_del 215 +mi 212 +_un 208 +chi 206 +era 205 +i, 205 +i,_ 205 +su 203 +and 202 +vo 202 +_fa 201 +eva_ 200 +ano_ 199 +gli_ 197 +non 196 +pi 196 +vi 195 +er_ 195 +_al 194 +se_ 193 +_ne 192 +_non 191 +am 190 +is 187 +ava_ 187 +_non_ 186 +non_ 186 +in_ 185 +ent 185 +_si 184 +_pa 184 +com 183 +! 182 +_le 182 +_su 181 +uo 181 +el_ 180 +!_ 180 +l' 178 +ue 177 +te_ 177 +_com 177 +are_ 176 +pr 176 +_in_ 176 +van 172 +mo 172 +ta_ 171 +gn 167 +ere 166 +na_ 166 +tto 163 +it 161 +_per_ 161 +per_ 161 +é 161 +all 160 +ess 159 +ut 159 +col 158 +acc 157 +gi 155 +lo_ 154 +oc 154 +vano 153 +io_ 153 +_av 151 +ndo 151 +é_ 151 +ato 149 +ave 148 +_st 147 +me_ 147 +'a 146 +ia_ 144 +con 143 +mp 143 +fi 142 +ett 142 +_si_ 141 +_pi 140 +era_ 140 +ti_ 140 +ó 140 +vano_ 140 +_gl 139 +qua 139 +ella 139 +sta 138 +ome 137 +S 137 +_gli 137 +_S 137 +ad 136 +_ve 134 +ant 134 +ne_ 134 +ó_ 133 +sp 133 +do_ 133 +_po 132 +ro_ 132 +ov 132 +_le_ 131 +ella_ 130 +sse 129 +_con 128 +ir 128 +_vi 128 +ig 127 +_gli_ 127 +_ave 127 +vev 127 +un_ 126 +ot 126 +veva 125 +dell 125 +que 125 +a. 125 +_o 125 +a._ 124 +tu 124 +cia 123 +za 123 +_que 123 +_da 121 +par 121 +_pr 120 +cch 120 +_dell 120 +eg 119 +_sa 119 +o._ 119 +o. 119 +_col 118 +lt 118 +_un_ 118 +rt 118 +ur 117 +_vo 117 +_me 117 +ome_ 117 +L 116 +ap 116 +_L 116 +zi 116 +nto 116 +og 115 +_an 115 +_so 115 +em 114 +ag 114 +be 111 +ni_ 111 +im 110 +cchi 110 +ver 110 +lle 109 +nz 109 +cci 109 +_ri 109 +nc 108 +_er 108 +come_ 107 +come 107 +aveva 107 +ui 107 +avev 107 +tto_ 107 +_come 106 +ed 106 +P 105 +man 105 +_P 105 +rs 105 +occ 104 +ndo_ 103 +ato_ 103 +_qua 103 +_era 103 +ari 102 +ba 100 +_mo 100 +nel 100 +id 99 +men 98 +_fi 98 +_all 98 +rr 97 +_do 97 +_avev 97 +att 97 +l'a 96 +ei 96 +zz 96 +; 96 +vol 95 +pp 95 +tra 95 +;_ 95 +ere_ 94 +lle_ 94 +nda 94 +utt 94 +est 93 +_nel 93 +ul 92 +ola 92 +iv 92 +ando 90 +ale 90 +lu 90 +rn 90 +e. 89 +e._ 89 +ll' 89 +tta 88 +nte 87 +_l' 87 +uel 87 |