@article{WulffBuschhueterWestphaletal.2020, author = {Wulff, Peter and Buschh{\"u}ter, David and Westphal, Andrea and Nowak, Anna and Becker, Lisa and Robalino, Hugo and Stede, Manfred and Borowski, Andreas}, title = {Computer-based classification of preservice physics teachers' written reflections}, series = {Journal of science education and technology}, volume = {30}, journal = {Journal of science education and technology}, number = {1}, publisher = {Springer}, address = {Dordrecht}, issn = {1059-0145}, doi = {10.1007/s10956-020-09865-1}, pages = {1 -- 15}, year = {2020}, abstract = {Reflecting in written form on one's teaching enactments has been considered a facilitator for teachers' professional growth in university-based preservice teacher education. Writing a structured reflection can be facilitated through external feedback. However, researchers noted that feedback in preservice teacher education often relies on holistic, rather than more content-based, analytic feedback because educators oftentimes lack resources (e.g., time) to provide more analytic feedback. To overcome this impediment to feedback for written reflection, advances in computer technology can be of use. Hence, this study sought to utilize techniques of natural language processing and machine learning to train a computer-based classifier that classifies preservice physics teachers' written reflections on their teaching enactments in a German university teacher education program. To do so, a reflection model was adapted to physics education. It was then tested to what extent the computer-based classifier could accurately classify the elements of the reflection model in segments of preservice physics teachers' written reflections. Multinomial logistic regression using word count as a predictor was found to yield acceptable average human-computer agreement (F1-score on held-out test dataset of 0.56) so that it might fuel further development towards an automated feedback tool that supplements existing holistic feedback for written reflections with data-based, analytic feedback.}, language = {en} } @article{TaboadaBrookeTofiloskietal.2011, author = {Taboada, Maite and Brooke, Julian and Tofiloski, Milan and Voll, Kimberly and Stede, Manfred}, title = {Lexicon-Based methods for sentiment analysis}, series = {Computational linguistics}, volume = {37}, journal = {Computational linguistics}, number = {2}, publisher = {MIT Press}, address = {Cambridge}, issn = {0891-2017}, pages = {267 -- 307}, year = {2011}, abstract = {We present a lexicon-based approach to extracting sentiment from text. The Semantic Orientation CALculator (SO-CAL) uses dictionaries of words annotated with their semantic orientation (polarity and strength), and incorporates intensification and negation. SO-CAL is applied to the polarity classification task, the process of assigning a positive or negative label to a text that captures the text's opinion towards its main subject matter. We show that SO-CAL's performance is consistent across domains and on completely unseen data. Additionally, we describe the process of dictionary creation, and our use of Mechanical Turk to check dictionaries for consistency and reliability.}, language = {en} } @article{StedeSchefflerMendes2019, author = {Stede, Manfred and Scheffler, Tatjana and Mendes, Amalia}, title = {Connective-Lex}, series = {Discours : revue de linguistique, psycholinguistique et informatique}, journal = {Discours : revue de linguistique, psycholinguistique et informatique}, number = {24}, publisher = {Universit{\´e} de Paris-Sorbonne}, address = {Paris}, issn = {1963-1723}, doi = {10.4000/discours.10098}, pages = {36}, year = {2019}, abstract = {In this paper, we present a tangible outcome of the TextLink network: a joint online database project displaying and linking existing and newly-created lexicons of discourse connectives in multiple languages. We discuss the definition and demarcation of the class of connectives that should be included in such a resource, and present the syntactic, semantic/pragmatic, and lexicographic information we collected. Further, the technical implementation of the database and the search functionality are presented. We discuss how the multilingual integration of several connective lexicons provides added value for linguistic researchers and other users interested in connectives, by allowing crosslinguistic comparison and a direct linking between discourse relational devices in different languages. Finally, we provide pointers for possible future extensions both in breadth (i.e., by adding lexicons for additional languages) and depth (by extending the information provided for each connective item and by strengthening the crosslinguistic links).}, language = {en} } @article{StedePeldszus2012, author = {Stede, Manfred and Peldszus, Andreas}, title = {The role of illocutionary status in the usage conditions of causal connectives and in coherence relations}, series = {Journal of pragmatics : an interdisciplinary journal of language studies}, volume = {44}, journal = {Journal of pragmatics : an interdisciplinary journal of language studies}, number = {2}, publisher = {Elsevier}, address = {Amsterdam}, issn = {0378-2166}, doi = {10.1016/j.pragma.2012.01.004}, pages = {214 -- 229}, year = {2012}, abstract = {The meaning of linguistic connectives has often been characterized in terms of their position in a bipartite (semantic, pragmatic) or a tripartite (content, epistemic, speech act) structure of domains, depending on what kinds of entities are being connected (largely: propositions or speech acts). This paper argues that a more fine-grained analysis can be achieved by directing some more attention to the characterization of the entities being related. We propose an inventory of categories of illocutionary status for labelling the spans that are being connected. On this basis, the distinction between the content and the epistemic domain, in particular, can be made more explicit. Focusing on the group of causal connectives in German, we conducted a corpus annotation study from which we derived distinct pragmatic 'usage profiles' of the most frequent causal connectives. Finally, we offer some suggestions on the role of illocutions in relation-based accounts of discourse structure.}, language = {en} } @book{StedeMamprinPeldszusetal.2015, author = {Stede, Manfred and Mamprin, Sara and Peldszus, Andreas and Herzog, Andr{\´e} and Kaupat, David and Chiarcos, Christian and Warzecha, Saskia}, title = {Handbuch Textannotation}, editor = {Stede, Manfred}, isbn = {978-3-86956-343-5}, url = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-82761}, publisher = {Universit{\"a}t Potsdam}, pages = {xvii, 209}, year = {2015}, abstract = {Das Potsdamer Kommentarkorpus ist eine Sammlung von Zeitungstexten, die dem Genre 'Kommentar' zuzuordnen sind. Der {\"o}ffentlich verf{\"u}gbare Teil besteht aus 175 Texten aus der M{\"a}rkischen Allgemeinen Zeitung, die hinsichtlich Syntax, Koreferenz, Konnektoren und Rhetorische Struktur manuell annotiert wurden. Weitere Ebenen werden bei zuk{\"u}nftigen Korpusversionen hinzukommen. Dieses Buch enth{\"a}lt die Annotationsrichtlinien, die der Bearbeitung des {\"o}ffentlichen Teils des Korpus zugrunde lagen, sowie auch anderer Teile, bei denen mit weiteren Annotationsebenen experimentiert wurde. Die meisten der Richtlinien werden auch f{\"u}r {\"a}hnliche Text-Genres und f{\"u}r andere Sprachen verwendbar sein.}, language = {de} } @article{StedeKuhn2009, author = {Stede, Manfred and Kuhn, Florian}, title = {Identifying the content zones of German court decisions}, isbn = {978-3-642- 03423-7}, year = {2009}, language = {en} } @article{StedeHuang2012, author = {Stede, Manfred and Huang, Chu-Ren}, title = {Inter-operability and reusability the science of annotation}, series = {Language resources and evaluation}, volume = {46}, journal = {Language resources and evaluation}, number = {1}, publisher = {Springer}, address = {Dordrecht}, issn = {1574-020X}, doi = {10.1007/s10579-011-9164-x}, pages = {91 -- 94}, year = {2012}, abstract = {Annotating linguistic data has become a major field of interest, both for supplying the necessary data for machine learning approaches to NLP applications, and as a research issue in its own right. This comprises issues of technical formats, tools, and methodologies of annotation. We provide a brief overview of these notions and then introduce the papers assembled in this special issue.}, language = {en} } @book{StedeChiarcosGrabskietal.2005, author = {Stede, Manfred and Chiarcos, Christian and Grabski, Michael and Lagerwerf, Luuk}, title = {Salience in discurse : multidisciplinary approaches to discourse 2005}, series = {Uitgaven Stichting Neerlandistiek VU}, volume = {49}, journal = {Uitgaven Stichting Neerlandistiek VU}, publisher = {Nodus-Publ; Stichting Neerlandistiek VU}, address = {M{\"u}nster; Amsterdam}, isbn = {3-89323-749-6}, pages = {153 S.}, year = {2005}, language = {en} } @article{Stede2020, author = {Stede, Manfred}, title = {Automatic argumentation mining and the role of stance and sentiment}, series = {Journal of argumentation in context}, volume = {9}, journal = {Journal of argumentation in context}, number = {1}, publisher = {John Benjamins Publishing Co.}, address = {Amsterdam}, issn = {2211-4742}, doi = {10.1075/jaic.00006.ste}, pages = {19 -- 41}, year = {2020}, abstract = {Argumentation mining is a subfield of Computational Linguistics that aims (primarily) at automatically finding arguments and their structural components in natural language text. We provide a short introduction to this field, intended for an audience with a limited computational background. After explaining the subtasks involved in this problem of deriving the structure of arguments, we describe two other applications that are popular in computational linguistics: sentiment analysis and stance detection. From the linguistic viewpoint, they concern the semantics of evaluation in language. In the final part of the paper, we briefly examine the roles that these two tasks play in argumentation mining, both in current practice, and in possible future systems.}, language = {en} } @book{Stede2007, author = {Stede, Manfred}, title = {Korpusgest{\"u}tzte Textanalyse : Grundz{\"u}ge der Ebenen-orientierten Textlinguistik}, publisher = {Narr}, address = {T{\"u}bingen}, isbn = {978-3-8233-6301-9}, issn = {0941-8105}, pages = {207 S.}, year = {2007}, language = {de} } @article{Stede2004, author = {Stede, Manfred}, title = {Does discourse processing need discourse topics?}, issn = {0301-4428}, year = {2004}, language = {en} } @article{Stede2002, author = {Stede, Manfred}, title = {DiMLex: a lexical approach to discourse markers}, year = {2002}, language = {en} } @article{Stede2002, author = {Stede, Manfred}, title = {Polibox: Generating desciptions, comparisons, and recommendations from a database}, isbn = {1-55860- 899-0}, year = {2002}, language = {en} } @article{Stede2020, author = {Stede, Manfred}, title = {From connectives to coherence relations}, series = {Revue roumaine de linguistique : RRL = Romanian review of linguistics}, volume = {65}, journal = {Revue roumaine de linguistique : RRL = Romanian review of linguistics}, number = {3}, publisher = {Ed. Academiei Rom{\^a}ne}, address = {Bucure{\c{s}}ti}, issn = {0035-3957}, pages = {213 -- 233}, year = {2020}, abstract = {The notion of coherence relations is quite widely accepted in general, but concrete proposals differ considerably on the questions of how they should be motivated, which relations are to be assumed, and how they should be defined. This paper takes a "bottom-up" perspective by assessing the contribution made by linguistic signals (connectives), using insights from the relevant literature as well as verification by practical text annotation. We work primarily with the German language here and focus on the realm of contrast. Thus, we suggest a new inventory of contrastive connective functions and discuss their relationship to contrastive coherence relations that have been proposed in earlier work.}, language = {en} } @article{Stede2008, author = {Stede, Manfred}, title = {Disambiguating rhetorical structure}, issn = {1570-7075}, doi = {10.1007/s11168-008-9053-7}, year = {2008}, abstract = {Empirical studies of text coherence often use tree-like structures in the spirit of Rhetorical Structure Theory (RST) as representational device. This paper identifies several sources of ambiguity in RST-inspired trees and argues that such structures are therefore not as explanatory as a text representation should be. As an alternative, an approach toward multi-level annotation (MLA) of texts is proposed, which separates the information into distinct levels of representation, in particular: referential structure, thematic structure, conjunctive relations, and intentional structure. Levels are conceptually built upon each other, and human annotators can produce them using a dedicated software environment. We argue that the resulting multi-level corpora are descriptively more adequate, and as a resource are more useful than RST-style treebanks.}, language = {en} } @article{Stede2008, author = {Stede, Manfred}, title = {RST revisited : disentangling nuclearity}, isbn = {978-90-272-3109-3}, year = {2008}, language = {en} } @article{Stede2008, author = {Stede, Manfred}, title = {Connective-based local coherence analysis : a lexicon for recognizing causal relationships}, isbn = {978-1-904-98793-2}, year = {2008}, language = {en} } @article{Stede2008, author = {Stede, Manfred}, title = {Computerlinguistik und Textanalyse}, isbn = {978-3-8233- 6432-0}, year = {2008}, language = {de} } @article{Stede2019, author = {Stede, Manfred}, title = {Noch kindlich oder schon jugendlich? Oder gar erwachsen?}, series = {Of trees and birds. A Festschrift for Gisbert Fanselow}, journal = {Of trees and birds. A Festschrift for Gisbert Fanselow}, publisher = {Universit{\"a}tsverlag Potsdam}, address = {Potsdam}, isbn = {978-3-86956-457-9}, doi = {10.25932/publishup-43256}, url = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-432569}, pages = {323 -- 334}, year = {2019}, language = {de} } @article{SchaeferStede2021, author = {Sch{\"a}fer, Robin and Stede, Manfred}, title = {Argument mining on twitter}, series = {Information technology : it ; Methoden und innovative Anwendungen der Informatik und Informationstechnik ; Organ der Fachbereiche 3 und 4 der GI e.V. und des Fachbereichs 6 der ITG}, volume = {63}, journal = {Information technology : it ; Methoden und innovative Anwendungen der Informatik und Informationstechnik ; Organ der Fachbereiche 3 und 4 der GI e.V. und des Fachbereichs 6 der ITG}, number = {1}, publisher = {De Gruyter}, address = {Berlin}, issn = {1611-2776}, doi = {10.1515/itit-2020-0053}, pages = {45 -- 58}, year = {2021}, abstract = {In the last decade, the field of argument mining has grown notably. However, only relatively few studies have investigated argumentation in social media and specifically on Twitter. Here, we provide the, to our knowledge, first critical in-depth survey of the state of the art in tweet-based argument mining. We discuss approaches to modelling the structure of arguments in the context of tweet corpus annotation, and we review current progress in the task of detecting argument components and their relations in tweets. We also survey the intersection of argument mining and stance detection, before we conclude with an outlook.}, language = {en} }