% Kovarik (2000), paper in the Second Chinese Language Processing Workshop
% (ACL Anthology ID W00-1217, per the url field below).
% Notes for maintainers:
%   - month uses the predefined macro `oct` (unquoted) so styles can localise it.
%   - {Chinese} is braced in the title so sentence-casing styles keep its capital.
@InProceedings{kovarik:2000:CLPW,
  author    = {Kovarik, John J.},
  title     = {How Should a Large Corpus Be Built?-A Comparative Study of Closure in Annotated Newspaper Corpora from Two {Chinese} Sources, Towards Building a Larger Representative Corpus Merged from Representative Sublanguage Collections},
  booktitle = {Second Chinese Language Processing Workshop},
  month     = oct,
  year      = {2000},
  address   = {Hong Kong, China},
  publisher = {Association for Computational Linguistics},
  pages     = {116--123},
  url       = {http://www.aclweb.org/anthology/W00-1217},
  doi       = {10.3115/1117769.1117788}
}