@article{ArnoldBallierLissonetal.2019, author = {Arnold, Taylor and Ballier, Nicolas and Lisson, Paula and Tilton, Lauren}, title = {Beyond lexical frequencies: using R for text analysis in the digital humanities}, series = {Language resources and evaluation}, volume = {53}, journal = {Language resources and evaluation}, number = {4}, publisher = {Springer}, address = {Dordrecht}, issn = {1574-020X}, doi = {10.1007/s10579-019-09456-6}, pages = {707 -- 733}, year = {2019}, abstract = {This paper presents a combination of R packages-user contributed toolkits written in a common core programming language-to facilitate the humanistic investigation of digitised, text-based corpora.Our survey of text analysis packages includes those of our own creation (cleanNLP and fasttextM) as well as packages built by other research groups (stringi, readtext, hyphenatr, quanteda, and hunspell). By operating on generic object types, these packages unite research innovations in corpus linguistics, natural language processing, machine learning, statistics, and digital humanities. We begin by extrapolating on the theoretical benefits of R as an elaborate gluing language for bringing together several areas of expertise and compare it to linguistic concordancers and other tool-based approaches to text analysis in the digital humanities. We then showcase the practical benefits of an ecosystem by illustrating how R packages have been integrated into a digital humanities project. Throughout, the focus is on moving beyond the bag-of-words, lexical frequency model by incorporating linguistically-driven analyses in research.}, language = {en} } @article{vanGervenBredervelddeKleinetal.2015, author = {van Gerven, Luuk P. A. and Brederveld, Robert J. and de Klein, Jeroen J. M. and DeAngelis, Don L. and Downing, Andrea S. and Faber, Michiel and Gerla, Daan J. and Janse, Jan H. and Janssen, Annette B. G. and Jeuken, Michel and Kooi, Bob W. and Kuiper, Jan J. and Lischke, Betty and Liu, Sien and Petzoldt, Thomas and Schep, Sebastiaan A. and Teurlincx, Sven and Thiange, Christophe and Trolle, Dennis and van Nes, Egbert H. and Mooij, Wolf M.}, title = {Advantages of concurrent use of multiple software frameworks in water quality modelling using a database approach}, series = {Fundamental and applied limnology : official journal of the International Association of Theoretical and Applied Limnology}, volume = {186}, journal = {Fundamental and applied limnology : official journal of the International Association of Theoretical and Applied Limnology}, number = {1-2}, publisher = {Schweizerbart}, address = {Stuttgart}, issn = {1863-9135}, doi = {10.1127/fal/2015/0631}, pages = {5 -- 20}, year = {2015}, abstract = {Water quality modelling deals with multidisciplinary questions ranging from fundamental to applied. Addressing this broad range of questions requires multiple analysis techniques and therefore multiple frameworks. Through the recently developed database approach to modelling (DATM), it has become possible to run a model in multiple software frameworks without much overhead. Here we apply DATM to the ecosystem model for ditches PCDitch and its twin model for shallow lakes PCLake. Using DATM, we run these models in six frameworks (ACSL, DELWAQ, DUFLOW, GRIND for MATLAB, OSIRIS and R), and report on the possible model analyses with tools provided by each framework. We conclude that the dynamic link between frameworks and models resulting from DATM has the following main advantages: it allows one to use the framework one is familiar with for most model analyses and eases switching between frameworks for complementary model analyses, including the switch between a 0-D and 1-D to 3-D setting. Moreover, the strength of each framework - including runtime performance - can now be easily exploited. We envision that a community-based further development of the concept can contribute to the future development of water quality modelling, not only by addressing multidisciplinary questions but also by facilitating the exchange of models and process formulations within the community of water quality modellers.}, language = {en} }