/usr/share/libexttextcat/fpdb.conf is in libexttextcat-data 3.2.0-1ubuntu1.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
# This file has been modified (for OOo by Jocelyn MERAND joc.mer@gmail.com) to
# include country and encoding
#
# TO-DO: convert to BCP-47
#
# Guess strings are formed as follows: language-country-encoding
# (the country field may be left empty, e.g. en--utf8)
#
# Based on a sample config file for the language models provided with Gertjan
# van Noord's language guesser (http://odur.let.rug.nl/~vannoord/TextCat/)
#
# Notes:
# - Putting the most probable languages at the top of the list
# improves performance, because this will raise the threshold for
# likely candidates more quickly.
#
# Top 10 http://www.ethnologue.com/ethno_docs/distribution.asp?by=size
zh-Hans.lm zh-CN-utf8 #zh-Hans
es.lm es--utf8
en.lm en--utf8
ar.lm ar--utf8
hi.lm hi--utf8
bn.lm bn--utf8
pt.lm pt--utf8
ru.lm ru--utf8
ja.lm ja--utf8
de.lm de--utf8
af.lm af--utf8
am.lm am--utf8
ast.lm ast--utf8
be.lm be--utf8
bg.lm bg--utf8
bo.lm bo--utf8
br.lm br--utf8
bs.lm bs--utf8 #Suppress-Script: Latn
ca.lm ca--utf8
cs.lm cs--utf8
cy.lm cy--utf8
da.lm da--utf8
ee.lm ee--utf8
el.lm el--utf8
eo.lm eo--utf8
et.lm et--utf8
eu.lm eu--utf8
fa.lm fa--utf8
fi.lm fi--utf8
fj.lm fj--utf8
fo.lm fo--utf8
fr.lm fr--utf8
fur.lm fur--utf8
fy.lm fy--utf8
ga.lm ga--utf8
gd.lm gd--utf8
gl.lm gl--utf8
gn.lm gn--utf8
gu.lm gu--utf8
gv.lm gv--utf8
ha-NG.lm ha-NG-utf8
haw.lm haw--utf8
he.lm he--utf8
hil.lm hil--utf8
hr.lm hr--utf8 #Suppress-Script: Latn
hsb.lm hsb--utf8
ht.lm ht--utf8
hu.lm hu--utf8
hy.lm hy--utf8
ia.lm ia--utf8
id.lm id--utf8
is.lm is--utf8
it.lm it--utf8
ka.lm ka--utf8
kk.lm kk--utf8
kl.lm kl--utf8
km.lm km--utf8
ko.lm ko--utf8
ktu.lm ktu--utf8
ky.lm ky--utf8
la.lm la--utf8
lb.lm lb--utf8
lg.lm lg--utf8
ln.lm ln--utf8
lo.lm lo--utf8
lt.lm lt--utf8
lv.lm lv--utf8
mai.lm mai--utf8
mi.lm mi--utf8
mg.lm mg--utf8
mk.lm mk--utf8
ml.lm ml--utf8
mn.lm mn--utf8 #mn-Cyrl
mr.lm mr--utf8
ms.lm ms--utf8 #ms-Latn
mt.lm mt--utf8
my.lm my--utf8
nb.lm nb--utf8
ne.lm ne--utf8
nl.lm nl--utf8
nn.lm nn--utf8
ny.lm ny--utf8
nso.lm nso--utf8
om.lm om--utf8
pa.lm pa--utf8
pl.lm pl--utf8
qxa.lm qxa--utf8
rm.lm rm--utf8
ro.lm ro--utf8
rw.lm rw--utf8
sa.lm sa--utf8
sc.lm sc--utf8
sco.lm sco--utf8
se.lm se--utf8
sg.lm sg--utf8
sk.lm sk--utf8
sl.lm sl--utf8
so.lm so--utf8
sq.lm sq--utf8
sr.lm sr--utf8 #sr-Cyrl
sr-Latn.lm sh--utf8 #sr-Latn
ss.lm ss--utf8
st.lm st--utf8
sv.lm sv--utf8
sw.lm sw--utf8
ta.lm ta--utf8
tet.lm tet--utf8
tg.lm tg--utf8
th.lm th--utf8
ti.lm ti--utf8
tk.lm tk--utf8 #tk-Latn
tl.lm tl--utf8
tn.lm tn--utf8
tpi.lm tpi--utf8
tr.lm tr--utf8
ts.lm ts--utf8
tt.lm tt--utf8
ty.lm ty--utf8
ug.lm ug--utf8 #ug-Arab
uk.lm uk--utf8
ur.lm ur--utf8
uz.lm uz--utf8 #uz-Latn
ve.lm ve--utf8
vi.lm vi--utf8
wa.lm wa--utf8
xh.lm xh--utf8
yi.lm yi--utf8
yo.lm yo--utf8
zh-Hant.lm zh-TW-utf8 #zh-Hant
zu.lm zu--utf8
|