2025-04-27 07:49:33 -04:00

80 lines
2.2 KiB
INI

# Configuration file for the Simplified Chinese Desktop recognizer.
# NOTE(review): the file is a flat list of Name=Value assignments using "#"
# comments, a backslash-continued quoted value and a "$Name" reference, so it
# is presumably sourced by a shell script - confirm against the consumer.
# Configuration
# Locale and configuration name selected by this file.
Locale=CHS
Config=dev_rare
# The comma-separated list of categories to select from the .loc file for
# this configuration.
# NOTE(review): the key itself is spelled "Catagory"; the consumer presumably
# looks it up by that exact name, so do not "fix" the key spelling here.
# JBENN: may want to add ExtMath in V2 Tablet.
CatagoryList=basic,GB1,ExtPunc,RomNum
# The files containing the lists of FFF files to train from.
# The value is a single double-quoted string continued across lines with
# trailing backslashes; each entry is the path of one *--list.txt file.
# NOTE(review): every entry comes from chs-boxed-20020222 except
# filler--list.txt, which comes from chs-boxed-20020322 - confirm that the
# different directory date is intentional and not a typo.
TrainSets="\
//tpg/reco/TextInk/chs/chs-boxed-20020222/people--list.txt \
//tpg/reco/TextInk/chs/chs-boxed-20020222/natural--list.txt \
//tpg/reco/TextInk/chs/chs-boxed-20020222/neat--list.txt \
//tpg/reco/TextInk/chs/chs-boxed-20020222/old--list.txt \
//tpg/reco/TextInk/chs/chs-boxed-20020222/gb0--list.txt \
//tpg/reco/TextInk/chs/chs-boxed-20020222/gb1--list.txt \
//tpg/reco/TextInk/chs/chs-boxed-20020222/punc--list.txt \
//tpg/reco/TextInk/chs/chs-boxed-20020222/addpanel--list.txt \
//tpg/reco/TextInk/chs/chs-boxed-20020322/filler--list.txt \
"
# Commented-out entries; they sit outside the quoted value and are therefore
# not part of TrainSets:
# //tpg/reco/TextInk/chs/chs-boxed-20020222/cjk--list.txt \
# //tpg/reco/TextInk/chs/chs-boxed-20020222/gb3578--list.txt \
# Free input training set (left empty in this configuration).
FreeTrainSet=""
# Tuning sets: one .tfl file for natural tuning and one for uniform tuning.
NatTuneSet="//tpg/reco/test/chs/tune-natural000.tfl"
UniTuneSet="//tpg/reco/test/chs/tune-uniform000.tfl"
# The free tuning set reuses the natural tuning set by reference.
# NOTE(review): assuming "$NatTuneSet" is expanded when this file is read,
# this line must stay below the NatTuneSet assignment - confirm.
FreeTuneSet=$NatTuneSet
# Unicode text file to generate unigrams and bigrams from.
TextFile="//tpg/reco/corpora/chs/all.utf"
# Space-separated list of tests to run on the recognizer.
TestList="natural address GB0 GB1 free"
# Target size to shrink zilla to.
# NOTE(review): units are not stated in this file (presumably bytes) - confirm.
ZillaSize=7000000
# Select the recognizer for 1 and 2 stroke characters.
# Presumably 1 selects a recognizer and 0 deselects it; only Otter is set to 1
# in this configuration.
UseFugu=0
UseOtter=1
UseSole=0
UseJaws=0
# Select the postprocessor.
# Only Crane is set to 1 in this configuration.
UseCrane=1
UseHawk=0
# Shrink parameters for otter: strong and weak cluster settings, plus a size.
# NOTE(review): the meaning and units of these values are not documented
# here (OtterSize is presumably a target size like ZillaSize) - confirm.
OtterStrongCluster=55
OtterWeakCluster=20
OtterSize=1000000
# Otter limit on the number of samples per (folded) code point.
OtterSampleLimit=25000
# Number of classes to use for Centipede.
CentipedeClasses=32
# Weight of natural frequency vs. uniform frequency in the training set.
NatuFreqWeight=1.0
# Flag for WinCE configuration.
# Set to 1 if true, 0 if false.
IsWinCE=0
# Character detector settings (not used in this configuration: set to 0).
UseCharDet=0
# Break net and segmentation net settings (both set to 0 here).
UseBrkNet=0
UseSegNet=0
# Whether to do IFELang3 tuning and testing (set to 1 here).
UseIFELang3=1