# Dictionary character encoding.
#paoding.dic.charset=UTF-8

# File-name prefix of dictionaries that are skipped.
#paoding.dic.skip.prefix=x-

# Chinese/CJK characters that will not be tokenized.
#paoding.dic.noise-charactor=x-noise-charactor

# Chinese/CJK words that will not be tokenized.
#paoding.dic.noise-word=x-noise-word

# Unit words, like "ge", "zhi", ...
#paoding.dic.unit=x-unit

# Family names, like "Wang", "Zhang", ...
#paoding.dic.confucian-family-name=x-confucian-family-name

# Like "uPAN", "cdHE".
#paoding.dic.for-combinatorics=x-for-combinatorics