% Abstract from the 14th International Conference on Corpus Linguistics (2023)
% describing TeCoPhy, a corpus of German physics texts.
% NOTE(review): the citation key previously contained a space after "Lecarda",
% which classic BibTeX cannot parse; the space was removed. Update any \cite
% that still uses the old spelling.
@inproceedings{LecardaFontanellaBleckmannDieckhoffetal.2023,
  author      = {Lecarda Fontanella, Vitor L{\'e}cio and Bleckmann, Tom and Dieckhoff, Lukas and Friege, Gunnar and Wartena, Christian},
  title       = {{TeCoPhy}: A Text Corpus of {German} Physics Texts},
  booktitle   = {Corpus Linguistics in the Digital Era: Genres, Registers and Domains; 14th International Conference on Corpus Linguistics -- May 10--12, 2023},
  pages       = {122--123},
  year        = {2023},
  doi         = {10.25968/opus-2796},
  url         = {https://cilc2023.wordpress.com/book-of-abstracts/},
  institution = {Fakult{\"a}t III - Medien, Information und Design},
  abstract    = {To learn a subject, the acquisition of the associated technical language is important. Despite this widely accepted importance of learning the technical language, hardly any studies are published that describe the characteristics of most technical languages that students are supposed to learn. This might largely be due to the absence of specialized text corpora to study such languages at lexical, syntactical and textual level. In the present paper we describe a corpus of German physics text that can be used to study the language used in physics. A large and a small variant are compiled. The small version of the corpus consists of 5.3 Million words and is available on request.},
  subject     = {Korpus},
  language    = {en},
}