% Journal article record. The issue number (2) is taken from this record's own
% URL path (.../00000011/00000002/...) and DOI (ijcl.11.2...).
@article{Feng:2006:1384-6655:173,
  author   = {Feng, Zhiwei},
  title    = {Evolution and present situation of corpus research in {China}},
  journal  = {International Journal of Corpus Linguistics},
  volume   = {11},
  number   = {2},
  pages    = {173--207},
  year     = {2006},
  doi      = {10.1075/ijcl.11.2.03fen},
  url      = {http://www.ingentaconnect.com/content/jbp/ijcl/2006/00000011/00000002/art00002},
  abstract = {In this paper, the author introduces in detail the development and present situation of corpus linguistics in China: earlier corpora, large-scale \& authentic text corpora, national corpora, speech corpora, bilingual corpora and corpora of minority languages in China. The various processing techniques for corpora are also introduced: automatic word segmentation of Chinese text, automatic PoS tagging, automatic tagging of phrase structure and automatic alignment of bilingual corpora. This paper is a bird's-eye view of corpus linguistics of China. Finally, the author discusses several problems in present corpus research: standardization of corpus specifications, commonly sharing of language resources, knowledge properties, etc.},
}