@article{Bizzoni2020b,
title = {Linguistic Variation and Change in 250 years of English Scientific Writing: A Data-driven Approach},
author = {Yuri Bizzoni and Stefania Degaetano-Ortlieb and Peter Fankhauser and Elke Teich},
url = {https://www.frontiersin.org/journals/artificial-intelligence/articles/10.3389/frai.2020.00073},
doi = {https://doi.org/10.3389/frai.2020.00073},
year = {2020},
date = {2020},
journal = {Frontiers in Artificial Intelligence},
volume = {3 - 2020},
abstract = {
We trace the evolution of Scientific English through the Late Modernperiod to modern time on the basis of a comprehensive corpus composedof the Transactions and Proceedings of the Royal Society of London, thefirst and longest-running English scientific journal established in 1665.Specifically, we explore the linguistic imprints of specialization and di-versification in the science domain which accumulate in the formation of"scientific language" and field-specific sublanguages/registers (chemistry,biology etc).We pursue an exploratory, data-driven approach using state-of-the-art computational language models and combine them with selectedinformation-theoretic measures (entropy, relative entropy) for comparingmodels along relevant dimensions of variation (time, register). Focusing onselected linguistic variables (lexis, grammar), we show how we deploy com-putational language models for capturing linguistic variation and changeand discuss benefits and limitations.
},
pubstate = {published},
type = {article}
}