% Journal article: Ewa Myrczek, "Corpus -- its definition, compilation,
% taxonomy and future", Linguistica Silesiana 21 (2000), pp. 43--62.
% Values are stored in canonical form (bare volume number, en-dash page
% range) so that the bibliography style decides the presentation.
@article{Myrczek_Ewa_Corpus_2000,
  author    = {Myrczek, Ewa},
  title     = {Corpus -- its definition, compilation, taxonomy and future},
  journal   = {Linguistica Silesiana},
  volume    = {21},
  pages     = {43--62},
  year      = {2000},
  publisher = {Polska Akademia Nauk, Oddzia{\l} w Katowicach},
  url       = {http://czasopisma.pan.pl/Content/132899/PDF/6_SILESIANA_21_Myrczek_CORPUS.pdf},
  abstract  = {The aim of this article is to discuss a few issues related to corpus, mainly, its definition, development, compilation and taxonomy. The author demonstrates a distinction between a corpus and a text archive or a text database (text bank). The development of corpora is divided into the two following stages: pre-electronic and electronic. Corpora are differentiated and classified according to language variables such as monolingual vs. multilingual, plain vs. annotated and data resources such as speech and written language corpora. The author discusses only a few features of a corpus, mainly its representativeness, size [static (closed) corpus vs. dynamic (monitor, open-ended) corpus] and form (machine-readable vs. print). The European and North American centres of corpus linguistics are surveyed. The author argues that the invention of the computer was a turning point in the field of corpus linguistics as modern corpora are more precise and flexible than a couple centuries ago. The final conclusion of this article is that the Chomsky's criticism levelled at the practicality of corpus linguistics is no longer valid.},
}