@phdthesis{Yadav2023,
  author    = {Yadav, Himanshu},
  title     = {A computational evaluation of feature distortion and cue weighting in sentence comprehension},
  doi       = {10.25932/publishup-58505},
  url       = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-585055},
  school    = {Universit{\"a}t Potsdam},
  pages     = {iv, 115},
  year      = {2023},
  abstract  = {Successful sentence comprehension requires the comprehender to correctly figure out who did what to whom. For example, in the sentence John kicked the ball, the comprehender has to figure out who did the action of kicking and what was being kicked. This process of identifying and connecting the syntactically-related words in a sentence is called dependency completion. What are the cognitive constraints that determine dependency completion? A widely-accepted theory is cue-based retrieval. The theory maintains that dependency completion is driven by a content-addressable search for the co-dependents in memory. The cue-based retrieval explains a wide range of empirical data from several constructions including subject-verb agreement, subject-verb non-agreement, plausibility mismatch configurations, and negative polarity items. However, there are two major empirical challenges to the theory: (i) Grammatical sentences' data from subject-verb number agreement dependencies, where the theory predicts a slowdown at the verb in sentences like the key to the cabinet was rusty compared to the key to the cabinets was rusty, but the data are inconsistent with this prediction; and, (ii) Data from antecedent-reflexive dependencies, where a facilitation in reading times is predicted at the reflexive in the bodybuilder who worked with the trainers injured themselves vs. the bodybuilder who worked with the trainer injured themselves, but the data do not show a facilitatory effect. The work presented in this dissertation is dedicated to building a more general theory of dependency completion that can account for the above two datasets without losing the original empirical coverage of the cue-based retrieval assumption. In two journal articles, I present computational modeling work that addresses the above two empirical challenges.
To explain the grammatical sentences' data from subject-verb number agreement dependencies, I propose a new model that assumes that the cue-based retrieval operates on a probabilistically distorted representation of nouns in memory (Article I). This hybrid distortion-plus-retrieval model was compared against the existing candidate models using data from 17 studies on subject-verb number agreement in 4 languages. I find that the hybrid model outperforms the existing models of number agreement processing suggesting that the cue-based retrieval theory must incorporate a feature distortion assumption. To account for the absence of facilitatory effect in antecedent-reflexive dependencies, I propose an individual difference model, which was built within the cue-based retrieval framework (Article II). The model assumes that individuals may differ in how strongly they weigh a syntactic cue over a number cue. The model was fitted to data from two studies on antecedent-reflexive dependencies, and the participant-level cue-weighting was estimated. We find that one-fourth of the participants, in both studies, weigh the syntactic cue higher than the number cue in processing reflexive dependencies and the remaining participants weigh the two cues equally. The result indicates that the absence of predicted facilitatory effect at the level of grouped data is driven by some, not all, participants who weigh syntactic cues higher than the number cue. More generally, the result demonstrates that the assumption of differential cue weighting is important for a theory of dependency completion processes. This differential cue weighting idea was independently supported by a modeling study on subject-verb non-agreement dependencies (Article III).
Overall, the cue-based retrieval, which is a general theory of dependency completion, needs to incorporate two new assumptions: (i) the nouns stored in memory can undergo probabilistic feature distortion, and (ii) the linguistic cues used for retrieval can be weighted differentially. This is the cumulative result of the modeling work presented in this dissertation. The dissertation makes an important theoretical contribution: Sentence comprehension in humans is driven by a mechanism that assumes cue-based retrieval, probabilistic feature distortion, and differential cue weighting. This insight is theoretically important because there is some independent support for these three assumptions in sentence processing and the broader memory literature. The modeling work presented here is also methodologically important because for the first time, it demonstrates (i) how the complex models of sentence processing can be evaluated using data from multiple studies simultaneously, without oversimplifying the models, and (ii) how the inferences drawn from the individual-level behavior can be used in theory development.},
  language  = {en}
}
@article{MaetzigVasishthEngelmannetal.2018,
  author    = {M{\"a}tzig, Paul and Vasishth, Shravan and Engelmann, Felix and Caplan, David and Burchert, Frank},
  title     = {A computational investigation of sources of variability in sentence comprehension difficulty in aphasia},
  journal   = {Topics in cognitive science},
  volume    = {10},
  number    = {1},
  publisher = {Wiley},
  address   = {Hoboken},
  issn      = {1756-8757},
  doi       = {10.1111/tops.12323},
  pages     = {161--174},
  year      = {2018},
  abstract  = {We present a computational evaluation of three hypotheses about sources of deficit in sentence comprehension in aphasia: slowed processing, intermittent deficiency, and resource reduction. The ACT-R based Lewis and Vasishth (2005) model is used to implement these three proposals. Slowed processing is implemented as slowed execution time of parse steps; intermittent deficiency as increased random noise in activation of elements in memory; and resource reduction as reduced spreading activation. As data, we considered subject vs. object relative sentences, presented in a self-paced listening modality to 56 individuals with aphasia (IWA) and 46 matched controls. The participants heard the sentences and carried out a picture verification task to decide on an interpretation of the sentence. These response accuracies are used to identify the best parameters (for each participant) that correspond to the three hypotheses mentioned above. We show that controls have more tightly clustered (less variable) parameter values than IWA; specifically, compared to controls, among IWA there are more individuals with slow parsing times, high noise, and low spreading activation. We find that (a) individual IWA show differential amounts of deficit along the three dimensions of slowed processing, intermittent deficiency, and resource reduction, (b) overall, there is evidence for all three sources of deficit playing a role, and (c) IWA have a more variable range of parameter values than controls. An important implication is that it may be meaningless to talk about sources of deficit with respect to an abstract average IWA; the focus should be on the individual's differential degrees of deficit along different dimensions, and on understanding the causes of variability in deficit between participants.},
  language  = {en}
}
% NOTE(review): the citation key below still contains the ligature character
% U+FB02 inherited from the source record; it is left unchanged so that existing
% citations keep resolving. Consider a coordinated rename to an ASCII-only key.
@misc{ClausenSchefﬂer2020,
  author    = {Clausen, Yulia and Scheffler, Tatjana},
  title     = {A corpus-based analysis of meaning variations in {German} tag questions: Evidence from spoken and written conversational corpora},
  series    = {Postprints der Universit{\"a}t Potsdam : Humanwissenschaftliche Reihe},
  number    = {706},
  issn      = {1866-8364},
  doi       = {10.25932/publishup-46788},
  url       = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-467882},
  pages     = {33},
  year      = {2020},
  abstract  = {This paper addresses semantic/pragmatic variability of tag questions in German and makes three main contributions. First, we document the prevalence and variety of question tags in German across three different types of conversational corpora. Second, by annotating question tags according to their syntactic and semantic context, discourse function, and pragmatic effect, we demonstrate the existing overlap and differences between the individual tag variants. Finally, we distinguish several groups of question tags by identifying the factors that influence the speakers' choices of tags in the conversational context, such as clause type, function, speaker/hearer knowledge, as well as conversation type and medium. These factors provide the limits of variability by constraining certain question tags in German against occurring in specific contexts or with individual functions.},
  language  = {en}
}
@phdthesis{Mertzen2022,
  author    = {Mertzen, Daniela},
  title     = {A cross-linguistic investigation of similarity-based interference in sentence comprehension},
  doi       = {10.25932/publishup-55668},
  url       = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-556685},
  school    = {Universit{\"a}t Potsdam},
  pages     = {xvii, 129},
  year      = {2022},
  abstract  = {The aim of this dissertation was to conduct a larger-scale cross-linguistic empirical investigation of similarity-based interference effects in sentence comprehension. Interference studies can offer valuable insights into the mechanisms that are involved in long-distance dependency completion. Many studies have investigated similarity-based interference effects, showing that syntactic and semantic information are employed during long-distance dependency formation (e.g., Arnett \& Wagers, 2017; Cunnings \& Sturt, 2018; Van Dyke, 2007, Van Dyke \& Lewis, 2003; Van Dyke \& McElree, 2011). Nevertheless, there are some important open questions in the interference literature that are critical to our understanding of the constraints involved in dependency resolution. The first research question concerns the relative timing of syntactic and semantic interference in online sentence comprehension. Only few interference studies have investigated this question, and, to date, there is not enough data to draw conclusions with regard to their time course (Van Dyke, 2007; Van Dyke \& McElree, 2011). Our first cross-linguistic study explores the relative timing of syntactic and semantic interference in two eye-tracking reading experiments that implement the study design used in Van Dyke (2007). The first experiment tests English sentences. The second, larger-sample experiment investigates the two interference types in German. Overall, the data suggest that syntactic and semantic interference can arise simultaneously during retrieval. The second research question concerns a special case of semantic interference: We investigate whether cue-based retrieval interference can be caused by semantically similar items which are not embedded in a syntactic structure. This second interference study builds on a landmark study by Van Dyke \& McElree (2006).
The study design used in their study is unique in that it is able to pin down the source of interference as a consequence of cue overload during retrieval, when semantic retrieval cues do not uniquely match the retrieval target. Unlike most other interference studies, this design is able to rule out encoding interference as an alternative explanation. Encoding accounts postulate that it is not cue overload at the retrieval site but the erroneous encoding of similar linguistic items in memory that leads to interference (Lewandowsky et al., 2008; Oberauer \& Kliegl, 2006). While Van Dyke \& McElree (2006) reported cue-based retrieval interference from sentence-external distractors, the evidence for this effect was weak. A subsequent study did not show interference of this type (Van Dyke et al., 2014). Given these inconclusive findings, further research is necessary to investigate semantic cue-based retrieval interference. The second study in this dissertation provides a larger-scale cross-linguistic investigation of cue-based retrieval interference from sentence-external items. Three larger-sample eye-tracking studies in English, German, and Russian tested cue-based interference in the online processing of filler-gap dependencies. This study further extends the previous research by investigating interference in each language under varying task demands (Loga{\v{c}}ev \& Vasishth, 2016; Swets et al., 2008). Overall, we see some very modest support for proactive cue-based retrieval interference in English. Unexpectedly, this was observed only under a low task demand. In German and Russian, there is some evidence against the interference effect. It is possible that interference is attenuated in languages with richer case marking. In sum, the cross-linguistic experiments on the time course of syntactic and semantic interference from sentence-internal distractors support existing evidence of syntactic and semantic interference during sentence comprehension.
Our data further show that both types of interference effects can arise simultaneously. Our cross-linguistic experiments investigating semantic cue-based retrieval interference from sentence-external distractors suggest that this type of interference may arise only in specific linguistic contexts.},
  language  = {en}
}
% NOTE(review): this article entry has no journal, volume or pages; journal is a
% required field for the article type. The venue cannot be determined from this
% record -- supply it, or retype the entry, after checking the linked document.
@article{Petrova2006,
  author    = {Petrova, Svetlana},
  title     = {A discourse-based approach to verb placement in early {West-Germanic}},
  url       = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus-19540},
  year      = {2006},
  abstract  = {The paper presents a novel approach to explaining word order variation in the early Germanic languages. Initial observations about verb placement as a device marking types of rhetorical relations made on data from Old High German (cf. Hinterh{\"o}lzl \& Petrova 2005) are now reconsidered on a larger scale and compared with evidence from other early Germanic languages. The paper claims that the identification of information-structural domains in a sentence is best achieved by taking into account the interaction between the pragmatic features of discourse referents and properties of discourse organization.},
  language  = {en}
}
% NOTE(review): this article entry lacks the required journal field (and volume,
% pages). The ISSN 1248-9433 presumably identifies the journal "Traitement
% Automatique des Langues" -- TODO confirm against the ISSN register before adding.
@article{ChiarcosDipperGoetzeetal.2008,
  author    = {Chiarcos, Christian and Dipper, Stefanie and G{\"o}tze, Michael and Leser, Ulf and L{\"u}deling, Anke and Ritz, Julia and Stede, Manfred},
  title     = {A flexible framework for integrating annotations from different tools and tag sets},
  issn      = {1248-9433},
  year      = {2008},
  abstract  = {We present a general framework for integrating annotations from different tools and tag sets. When annotating corpora at multiple linguistic levels, annotators may use different expert tools for different phenomena or types of annotation. These tools employ different data models and accompanying approaches to visualization, and they produce different output formats. For the purposes of uniformly processing these outputs, we developed a pivot format called PAULA, along with converters to and from tool formats. Different annotations are not only integrated at the level of data format, but are also joined on the level of conceptual representation. For this purpose, we introduce OLiA, an ontology of linguistic annotations that mediates between alternative tag sets that cover the same class of linguistic phenomena. All components are integrated in the linguistic information system ANNIS: Annotation tool output is converted to the pivot format PAULA and read into a database where the data can be visualized, queried, and evaluated across multiple layers. For cross-tag set querying and statistical evaluation, ANNIS uses the ontology of linguistic annotations. Finally, ANNIS is also tied to a machine learning component for semiautomatic annotation.},
  language  = {en}
}
% NOTE(review): retyped from article to incollection. The ISBN, publisher and
% address describe an edited book (a Festschrift), so the container title belongs
% in booktitle. The record carries no editor names; add an editor field if known.
@incollection{Alexiadou2019,
  author    = {Alexiadou, Artemis},
  title     = {A form-function mismatch?},
  booktitle = {Of trees and birds. A Festschrift for Gisbert Fanselow},
  publisher = {Universit{\"a}tsverlag Potsdam},
  address   = {Potsdam},
  isbn      = {978-3-86956-457-9},
  doi       = {10.25932/publishup-43223},
  url       = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-432235},
  pages     = {107--117},
  year      = {2019},
  language  = {en}
}
@article{DeBleser2006,
  author    = {De Bleser, Ria},
  title     = {A linguist's view on progressive anomia: Evidence for {Delbr{\"u}ck} (1886) in modern neurolinguistic research},
  journal   = {Cortex : a journal devoted to the study of the nervous system and behaviour},
  volume    = {42},
  publisher = {Elsevier},
  address   = {Milano},
  issn      = {0010-9452},
  doi       = {10.1016/S0010-9452(08)70421-0},
  pages     = {805--810},
  year      = {2006},
  abstract  = {In his short paper of 1886, the neogrammarian linguist Delbr{\"u}ck sketches his views on normal language processing and their relevance for the interpretation of some of the symptoms of progressive anomic aphasia. In particular, he discusses proper name impairments, verb and abstract noun superiority and the predominance of semantically related errors. Furthermore, he suggests that part of speech, morphology and word order may be preserved in this condition. This historical document has been lost in oblivion but the original ideas and their relevance for contemporary discussions merit a revival.},
  language  = {en}
}
% NOTE(review): this article entry carries only author, title, year and language.
% The journal field required for the article type is absent, and the record holds
% no identifier (DOI, URL, ISSN) from which the venue could be recovered.
@article{Powers2000,
  author    = {Powers, Susan M.},
  title     = {A minimalist account of phrase structure acquisition},
  year      = {2000},
  language  = {en}
}
@article{LogacevVasishth2016,
  author    = {Loga{\v{c}}ev, Pavel and Vasishth, Shravan},
  title     = {A Multiple-Channel Model of Task-Dependent Ambiguity Resolution in Sentence Comprehension},
  journal   = {Cognitive science : a multidisciplinary journal of anthropology, artificial intelligence, education, linguistics, neuroscience, philosophy, psychology ; journal of the Cognitive Science Society},
  volume    = {40},
  publisher = {Wiley-Blackwell},
  address   = {Hoboken},
  issn      = {0364-0213},
  doi       = {10.1111/cogs.12228},
  pages     = {266--298},
  year      = {2016},
  abstract  = {Traxler, Pickering, and Clifton (1998) found that ambiguous sentences are read faster than their unambiguous counterparts. This so-called ambiguity advantage has presented a major challenge to classical theories of human sentence comprehension (parsing) because its most prominent explanation, in the form of the unrestricted race model (URM), assumes that parsing is non-deterministic. Recently, Swets, Desmet, Clifton, and Ferreira (2008) have challenged the URM. They argue that readers strategically underspecify the representation of ambiguous sentences to save time, unless disambiguation is required by task demands. When disambiguation is required, however, readers assign sentences full structure---and Swets et al. provide experimental evidence to this end. On the basis of their findings, they argue against the URM and in favor of a model of task-dependent sentence comprehension. We show through simulations that the Swets et al. data do not constitute evidence for task-dependent parsing because they can be explained by the URM. However, we provide decisive evidence from a German self-paced reading study consistent with Swets et al.'s general claim about task-dependent parsing. Specifically, we show that under certain conditions, ambiguous sentences can be read more slowly than their unambiguous counterparts, suggesting that the parser may create several parses, when required. Finally, we present the first quantitative model of task-driven disambiguation that subsumes the URM, and we show that it can explain both Swets et al.'s results and our findings.},
  language  = {en}
}