文件名称:word (character) segmentation
文件大小:10.46MB
文件格式:RAR
更新时间:2013-02-03 22:12:30
word (character) segmentation
word (character) segmentation 的一些论文

@comment{Bibliography of word (character) segmentation papers. Text outside
  @-entries (citation labels, free-form references) is ignored by BibTeX and
  is kept here as it appeared in the original listing.}

(Kawtrakul et al. 2002)
@inproceedings{kawtrakul2002state,
  author    = {Kawtrakul, A. and Suktarachan, M. and Varasai, P. and Chanlekha, H.},
  title     = {A State of the Art of {Thai} Language Resources and {Thai} Language Behavior Analysis and Modeling},
  booktitle = {Proceedings of the {ACL}-02 Workshop on Effective Tools and Methodologies for Teaching Natural Language Processing and Computational Linguistics},
  year      = {2002},
}

{(Ha, 2003)}
@inproceedings{ha2003method,
  author    = {Ha, L. A.},
  title     = {A Method for Word Segmentation in {Vietnamese}},
  booktitle = {Proceedings of the Corpus Linguistics 2003 Conference},
  pages     = {282--287},
  year      = {2003},
}

(Wong and Chan, 1996)
@inproceedings{wong1996chinese,
  author    = {Wong, P. and Chan, C.},
  title     = {{Chinese} Word Segmentation Based on Maximum Matching and Word Binding Force},
  booktitle = {Proceedings of the 16th International Conference on Computational Linguistics},
  volume    = {1},
  pages     = {200--203},
  year      = {1996},
}

(Sun et al. 1998)
@comment{Review note: the exported author list read "Maosong, S. and Dayang, S."
  (given names mistaken for surnames); the citation label above uses "Sun".
  The surname "Shen" should be verified against the proceedings. The citation
  key is left unchanged so existing citations keep working.}
@inproceedings{maosong1998chinese,
  author    = {Sun, Maosong and Shen, Dayang and Tsou, B. K.},
  title     = {{Chinese} Word Segmentation without Using Lexicon and Hand-Crafted Training Data},
  booktitle = {Proceedings of the 17th International Conference on Computational Linguistics},
  volume    = {2},
  pages     = {1265--1271},
  year      = {1998},
  publisher = {Association for Computational Linguistics},
  address   = {Morristown, NJ, USA},
}

(Sornlertlamvanich et al., 2000)
@inproceedings{sornlertlamvanich2000automatic,
  author    = {Sornlertlamvanich, V. and Potipiti, T. and Charoenporn, T.},
  title     = {Automatic Corpus-Based {Thai} Word Extraction with the {C4.5} Learning Algorithm},
  booktitle = {Proceedings of the 18th Conference on Computational Linguistics},
  volume    = {2},
  pages     = {802--807},
  year      = {2000},
  publisher = {Association for Computational Linguistics},
  address   = {Morristown, NJ, USA},
}

(Poowarawan, 1986)
{Yuen Poowarawan. 1986. Dictionary-based Thai Syllable Separation. In proceeding of the Nithe Electronics Engineering Conference}

(Rarunrom, 1991)
{Sampan Rarunrom. 1991. Dictionary-based Thai Word Separation. Senior Project Report.}

(Sornlertlamvanich, 1993)
@article{sornlertlamvanich1993word,
  author  = {Sornlertlamvanich, V.},
  title   = {Word Segmentation for {Thai} in Machine Translation System},
  journal = {Machine Translation, NECTEC},
  pages   = {556--561},
  year    = {1993},
}

(Word segmentation for vietnamese text categorization: an online corpus approach)
@inproceedings{nguyen2006word,
  author    = {Nguyen, T. V. and Tran, H. K. and Nguyen, T. T. T. and Nguyen, H.},
  title     = {Word Segmentation for {Vietnamese} Text Categorization: An Online Corpus Approach},
  booktitle = {Proceedings of the 4th {IEEE} International Conference on Computer Science Research, Innovation and Vision of the Future, Ho Chi Minh City, Vietnam},
  year      = {2006},
}

(A Search-based Chinese Word Segmentation Method)
@inproceedings{wang2007search,
  author    = {Wang, X. J. and Qin, Y. and Liu, W.},
  title     = {A Search-Based {Chinese} Word Segmentation Method},
  booktitle = {Proceedings of the 16th International Conference on World Wide Web},
  pages     = {1130},
  year      = {2007},
  publisher = {ACM},
}

(chinese indexing using mutual information)
@inproceedings{yang1998chinese,
  author    = {Yang, C. C. and Yen, J. and Yung, S. K. and Chung, A. K. L.},
  title     = {{Chinese} Indexing Using Mutual Information},
  booktitle = {Proceedings of the First Asia Digital Library Workshop},
  pages     = {57--64},
  year      = {1998},
}

(Unigram Language Model for Chinese Word Segmentation)
@inproceedings{chen2005unigram,
  author    = {Chen, A. and Zhou, Y. and Zhang, A. and Sun, G.},
  title     = {Unigram Language Model for {Chinese} Word Segmentation},
  booktitle = {Proceedings of the 4th {SIGHAN} Workshop on {Chinese} Language Processing},
  pages     = {138--141},
  year      = {2005},
}
【文件预览】:
dictionary-based
----an empirical study of smoothing techniques for language modeling.pdf(738KB)
----chinese word segmentation using finite state transducer.pdf(48KB)
----A stochastic finite-state word-sgementation algorithm for Chinses.pdf(1.82MB)
----chinese word segmentation based on maximum matching and word binding force.pdf(315KB)
comparition
----Dinh_LREC2008.pdf(74KB)
----8A comparative study on thai word segementation approaches.pdf(167KB)
----Jin_SIGHAN2008.pdf(500KB)
----Wang_SIGHAN2008.pdf(345KB)
----vietnamese word segmentation with CRFs and SVMs An Investigation.pdf(140KB)
statistical-based
----A maximum Entropy Approach to Chinese Word Segmentation.pdf(86KB)
----Unigram Language Model for Chinese Word Segmentation.pdf(86KB)
----Chinese word segmentation as Character tagging.pdf(181KB)
----corpus-based methods in Chinese morphology and phonology.pdf(849KB)
----Chinese indexing using mutual information.pdf(1.2MB)
----an unsupervised learning and statistical approach for vietnamese word recognition and segmentation.pdf(228KB)
----A Fuzzy Synset-based Hidden Markov Model for Automatic Text Segmentation.pdf(331KB)
----SNLP2002-0051c.pdf(389KB)
----Conditional Random Fields - probabilistic models for segmenting and labeling sequence data.pdf(183KB)
----Thai Word Segmentation based-on GLR Parsing Technique .pdf(316KB)
----bayesian unsupervised word segmentation with nested pitman-yor language modeling.pdf(246KB)
----a stochastic morphological analysis for japanese employing character n-gram and k-nn method.pdf(191KB)
----non-dictionary-based thai word segmentation using decision trees.pdf(93KB)
----japanese word segmentation by adaboost using the decision list.gz(233KB)
----RIVF06_Word_Segmentation_for_Vietnamese_Text_Categorization_An_online_corpus_approach.pdf(372KB)
----feature-based Thai word segmentation.pdf(147KB)
----a Search-based chinese word segmentation method.pdf(314KB)
----a method for word segmentation in vietnamese.pdf(149KB)
----Effective Tag Set Selection in chinese Word Segmentation via Conditional Random File Modeling.pdf(102KB)
----chinese segmentation and new word detection using CRF.pdf(136KB)
biboliography
hybrid
----word segmentation in sentence analysis.pdf(128KB)
----Thai word segmentation a lexical semantic approach approach.pdf(162KB)
----Chinese word segmentatin by classification of characters.pdf(182KB)
----Gao_CL2005.pdf(1.58MB)
----chinese and japanese word segmentation using word-level and character-level information.ps(740KB)
----vietnamese segmentation.pdf(215KB)
----thai word segmentation using character-level information.pdf(222KB)
----Li_SIGHAN2008.pdf(323KB)
----a hybrid approach to chinese word segmentation.pdf(88KB)
----Le_LATA2008.pdf(137KB)