% Journal article: Bosch, De Cesare, Demske & Felser (2023) on word-order variation in German infinitival complementation.
% NOTE(review): the exported value 43 looks like a page count, not a page range, so it is stored in `pagetotal`; confirm against the publisher record.
@article{BoschDeCesareDemskeetal.2023,
  author    = {Bosch, Sina and De Cesare, Ilaria and Demske, Ulrike and Felser, Claudia},
  title     = {Word-order variation and coherence in {German} infinitival complementation},
  journal   = {The Journal of Comparative Germanic Linguistics},
  volume    = {26},
  number    = {1},
  publisher = {Springer},
  address   = {New York},
  issn      = {1572-8552},
  doi       = {10.1007/s10828-023-09140-8},
  pagetotal = {43},
  year      = {2023},
  abstract  = {This study provides a synthesis of corpus-based and experimental investigations of word-order preferences in German infinitival complementation. We carried out a systematic analysis of present-day German corpora to establish frequency distributions of different word-order options: extraposition, intraposition, and 'third construction'. We then examined, firstly, whether and to what extent corpus frequencies and processing economy constraints can predict the acceptability of these three word-order variants, and whether subject raising and subject control verbs form clearly distinguishable subclasses of infinitive-embedding verbs in terms of their word-order behaviour. Secondly, our study looks into the issue of coherence by comparing acceptability ratings for monoclausal coherent and biclausal incoherent construals of intraposed infinitives, and by examining whether a biclausal incoherent analysis gives rise to local and/or global processing difficulty. Taken together, our results revealed that (i) whilst the extraposition pattern consistently wins out over all other word-order variants for control verbs, neither frequency nor processing-based approaches to word-order variation can account for the acceptability of low-frequency variants, (ii) there is considerable verb-specific variation regarding word-order preferences both between and within the two sets of raising and control verbs under investigation, and (iii) although monoclausal coherent intraposition is rated above biclausal incoherent intraposition, the latter is not any more difficult to process than the former. Our findings indicate that frequency of occurrence and processing-related constraints interact with idiosyncratic lexical properties of individual verbs in determining German speakers' structural preferences.},
  language  = {en}
}
% Correction notice for the article with DOI 10.1007/s10828-023-09140-8 (same authors, same journal issue).
% The key carries a `b` suffix because the plain key `BoschDeCesareDemskeetal.2023` is already used by the original article;
% a repeated key makes BibTeX report "repeated entry" and skip this record.
% NOTE(review): 2 looks like a page count, not a page range, so it is stored in `pagetotal`; confirm.
@article{BoschDeCesareDemskeetal.2023b,
  author    = {Bosch, Sina and De Cesare, Ilaria and Demske, Ulrike and Felser, Claudia},
  title     = {Correction to: Word-order variation and coherence in {German} infinitival complementation},
  journal   = {The Journal of Comparative Germanic Linguistics},
  volume    = {26},
  number    = {1},
  publisher = {Springer},
  address   = {New York},
  issn      = {1383-4924},
  doi       = {10.1007/s10828-023-09143-5},
  pagetotal = {2},
  year      = {2023},
  note      = {Correction to the article published in The Journal of Comparative Germanic Linguistics 26(1), 2023, doi:10.1007/s10828-023-09140-8},
  language  = {en}
}
% Journal article: Hollenstein et al. (2023), the ZuCo reading-task classification benchmark (EEG and eye-tracking).
% NOTE(review): 20 looks like a page count, not a page range, so it is stored in `pagetotal`; confirm.
% NOTE(review): the surnames "Trondle" and "Ozyurt" may have lost diacritics in export; verify against the publisher record.
% NOTE(review): the exported abstract ended in "leaderboard: ." with the URL stripped; the dangling colon was removed, restore the URL if known.
@article{HollensteinTrondlePlomeckaetal.2023,
  author    = {Hollenstein, Nora and Trondle, Marius and Plomecka, Martyna and Kiegeland, Samuel and Ozyurt, Yilmazcan and J{\"a}ger, Lena Ann and Langer, Nicolas},
  title     = {The {ZuCo} benchmark on cross-subject reading task classification with {EEG} and eye-tracking data},
  journal   = {Frontiers in Psychology},
  volume    = {13},
  publisher = {Frontiers Media},
  address   = {Lausanne},
  issn      = {1664-1078},
  doi       = {10.3389/fpsyg.2022.1028824},
  pagetotal = {20},
  year      = {2023},
  abstract  = {We present a new machine learning benchmark for reading task classification with the goal of advancing EEG and eye-tracking research at the intersection between computational language processing and cognitive neuroscience. The benchmark task consists of a cross-subject classification to distinguish between two reading paradigms: normal reading and task-specific reading. The data for the benchmark is based on the Zurich Cognitive Language Processing Corpus (ZuCo 2.0), which provides simultaneous eye-tracking and EEG signals from natural reading of English sentences. The training dataset is publicly available, and we present a newly recorded hidden testset. We provide multiple solid baseline methods for this task and discuss future improvements. We release our code and provide an easy-to-use interface to evaluate new approaches with an accompanying public leaderboard.},
  language  = {en}
}
% PhD thesis (Universitaet Potsdam, 2023) on time-buying behaviour in task-oriented spoken dialogue systems.
% The author's accent uses the ASCII apostrophe form {\'o}; the exported {\´o} (U+00B4) is not a valid LaTeX accent macro.
% NOTE(review): 148 looks like a page count, so it is stored in `pagetotal`; confirm.
@phdthesis{LopezGambino2023,
  author    = {L{\'o}pez Gambino, Maria Soledad},
  title     = {Time Buying in Task-Oriented Spoken Dialogue Systems},
  school    = {Universit{\"a}t Potsdam},
  doi       = {10.25932/publishup-59280},
  url       = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-592806},
  pagetotal = {148},
  year      = {2023},
  abstract  = {This dissertation focuses on the handling of time in dialogue. Specifically, it investigates how humans bridge time, or "buy time", when they are expected to convey information that is not yet available to them (e.g. a travel agent searching for a flight in a long list while the customer is on the line, waiting). It also explores the feasibility of modeling such time-bridging behavior in spoken dialogue systems, and it examines how endowing such systems with more human-like time-bridging capabilities may affect humans' perception of them. The relevance of time-bridging in human-human dialogue seems to stem largely from a need to avoid lengthy pauses, as these may cause both confusion and discomfort among the participants of a conversation (Levinson, 1983; Lundholm Fors, 2015). However, this avoidance of prolonged silence is at odds with the incremental nature of speech production in dialogue (Schlangen and Skantze, 2011): Speakers often start to verbalize their contribution before it is fully formulated, and sometimes even before they possess the information they need to provide, which may result in them running out of content mid-turn. In this work, we elicit conversational data from humans, to learn how they avoid being silent while they search for information to convey to their interlocutor. We identify commonalities in the types of resources employed by different speakers, and we propose a classification scheme. We explore ways of modeling human time-buying behavior computationally, and we evaluate the effect on human listeners of embedding this behavior in a spoken dialogue system. Our results suggest that a system using conversational speech to bridge time while searching for information to convey (as humans do) can provide a better experience in several respects than one which remains silent for a long period of time.
However, not all speech serves this purpose equally: Our experiments also show that a system whose time-buying behavior is more varied (i.e. which exploits several categories from the classification scheme we developed and samples them based on information from human data) can prevent overestimation of waiting time when compared, for example, with a system that repeatedly asks the interlocutor to wait (even if these requests for waiting are phrased differently each time). Finally, this research shows that it is possible to model human time-buying behavior on a relatively small corpus, and that a system using such a model can be preferred by participants over one employing a simpler strategy, such as randomly choosing utterances to produce during the wait --- even when the utterances used by both strategies are the same.},
  language  = {en}
}
% PhD thesis (Universitaet Potsdam, 2023) on quantifier scope ambiguities in English, German and Asante Twi.
% Language names in the title are brace-protected so sentence-casing styles keep their capitals.
% NOTE(review): "ix, 291" looks like a page count (front matter + body), so it is stored in `pagetotal`; confirm.
@phdthesis{Philipp2023,
  author    = {Philipp, Mareike},
  title     = {Quantifier scope ambiguities in {English}, {German}, and {Asante Twi} ({Akan}): structural and pragmatic factors},
  school    = {Universit{\"a}t Potsdam},
  doi       = {10.25932/publishup-61235},
  url       = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-612356},
  pagetotal = {ix, 291},
  year      = {2023},
  abstract  = {This thesis is concerned with the phenomenon of quantifier scope ambiguities. This phenomenon has been researched extensively, both from a theoretical and from an empirical point of view. Nevertheless, there are still a number of under-researched topics in the field of quantifier scope, which will be the main focus of this thesis. I will take a closer look at three languages, English, German, and the Asante Twi dialect of Akan (Kwa, Niger-Congo). The goal is a better understanding of the phenomenon of quantifier scope both within each language, as well as from a cross-linguistic perspective. First, this thesis will provide a series of experiments that allow a direct cross-linguistic comparison between English and German - two languages about which specific claims have been made in the literature. I will also provide exploratory research in the case of Asante Twi, where so far, no work has been dedicated specifically to the study of quantifier scope. The work on Asante Twi will go beyond quantifier scope and also target the quantifier and determiner system in general. The question is not only if particular scope readings are possible or not, but also which factors contribute to an increase or decrease of scope availability, and if there are factors that block certain scope readings altogether. While some of the results confirm and thereby strengthen previous claims, other results contradict general assumptions in the literature. This is particularly the case for inverse readings in German and inverse readings across clause-boundaries.},
  language  = {en}
}
% Journal article: Salzmann, Wierzba & Georgi (2023) on Condition C reconstruction in German A'-movement.
% The page range uses the plain `--` form without surrounding spaces; the journal name drops the catalogue suffix ": JL".
@article{SalzmannWierzbaGeorgi2023,
  author    = {Salzmann, Martin and Wierzba, Marta and Georgi, Doreen},
  title     = {Condition {C} in {German} {A'-movement}},
  journal   = {Journal of Linguistics},
  volume    = {59},
  number    = {3},
  publisher = {Cambridge University Press},
  address   = {London},
  issn      = {0022-2267},
  doi       = {10.1017/S0022226722000214},
  pages     = {577--622},
  year      = {2023},
  abstract  = {In recent experimental work, arguments for or against Condition C reconstruction in A'-movement have been based on low/high availability of coreference in sentences with and without A'-movement. We argue that this reasoning is problematic: It involves arbitrary thresholds, and the results are potentially confounded by the different surface orders of the compared structures and non-syntactic factors. We present three experiments with designs that do not require defining thresholds of 'low' or 'high' coreference values. Instead, we focus on grammatical contrasts (wh-movement vs. relativization, subject vs. object wh-movement) and aim to identify and reduce confounds. The results show that reconstruction for A'-movement of DPs is not very robust in German, contra previous findings. Our results are compatible with the view that the surface order and non-syntactic factors (e.g. plausibility, referential accessibility of an R-expression) heavily influence coreference possibilities. Thus, the data argue against a theory that includes both reconstruction and a hard Condition C constraint. There is a residual contrast between sentences with subject/object movement, which is compatible with an account without reconstruction (and an additional non-syntactic factor) or an account with reconstruction (and a soft Condition C constraint).},
  language  = {en}
}
% Journal article: Stone, Nicenboim, Vasishth & Roesler (2023) on constraint and predictability effects in ERP.
% The page range uses the plain `--` form without surrounding spaces; the acronym in the title is brace-protected.
@article{StoneNicenboimVasishthetal.2023,
  author    = {Stone, Kate and Nicenboim, Bruno and Vasishth, Shravan and R{\"o}sler, Frank},
  title     = {Understanding the effects of constraint and predictability in {ERP}},
  journal   = {Neurobiology of Language},
  volume    = {4},
  number    = {2},
  publisher = {MIT Press},
  address   = {Cambridge, MA, USA},
  issn      = {2641-4368},
  doi       = {10.1162/nol_a_00094},
  pages     = {221--256},
  year      = {2023},
  abstract  = {Intuitively, strongly constraining contexts should lead to stronger probabilistic representations of sentences in memory. Encountering unexpected words could therefore be expected to trigger costlier shifts in these representations than expected words. However, psycholinguistic measures commonly used to study probabilistic processing, such as the N400 event-related potential (ERP) component, are sensitive to word predictability but not to contextual constraint. Some research suggests that constraint-related processing cost may be measurable via an ERP positivity following the N400, known as the anterior post-N400 positivity (PNP). The PNP is argued to reflect update of a sentence representation and to be distinct from the posterior P600, which reflects conflict detection and reanalysis. However, constraint-related PNP findings are inconsistent. We sought to conceptually replicate Federmeier et al. (2007) and Kuperberg et al. (2020), who observed that the PNP, but not the N400 or the P600, was affected by constraint at unexpected but plausible words. Using a pre-registered design and statistical approach maximising power, we demonstrated a dissociated effect of predictability and constraint: strong evidence for predictability but not constraint in the N400 window, and strong evidence for constraint but not predictability in the later window. However, the constraint effect was consistent with a P600 and not a PNP, suggesting increased conflict between a strong representation and unexpected input rather than greater update of the representation. We conclude that either a simple strong/weak constraint design is not always sufficient to elicit the PNP, or that previous PNP constraint findings could be an artifact of smaller sample size.},
  language  = {en}
}
% PhD thesis (Universitaet Potsdam, 2023) on German-learning infants' sensitivity to prosodic phrase boundary cues.
% "German" in the title is brace-protected so sentence-casing styles keep the capital.
% NOTE(review): "xii, 136" looks like a page count (front matter + body), so it is stored in `pagetotal`; confirm.
@phdthesis{Wellmann2023,
  author    = {Wellmann, Caroline},
  title     = {Early sensitivity to prosodic phrase boundary cues: Behavioral evidence from {German}-learning infants},
  school    = {Universit{\"a}t Potsdam},
  doi       = {10.25932/publishup-57393},
  url       = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-573937},
  pagetotal = {xii, 136},
  year      = {2023},
  abstract  = {This dissertation seeks to shed light on the relation of phrasal prosody and developmental speech perception in German-learning infants. Three independent empirical studies explore the role of acoustic correlates of major prosodic boundaries, specifically pitch change, final lengthening, and pause, in infant boundary perception. Moreover, it was examined whether the sensitivity to prosodic phrase boundary markings changes during the first year of life as a result of perceptual attunement to the ambient language (Aslin \& Pisoni, 1980). Using the headturn preference procedure six- and eight-month-old monolingual German-learning infants were tested on their discrimination of two different prosodic groupings of the same list of coordinated names either with or without an internal IPB after the second name, that is, [Moni und Lilli] [und Manu] or [Moni und Lilli und Manu]. The boundary marking was systematically varied with respect to single prosodic cues or specific cue combinations. Results revealed that six- and eight-month-old German-learning infants successfully detect the internal prosodic boundary when it is signaled by all the three main boundary cues pitch change, final lengthening, and pause. For eight-, but not for six-month-olds, the combination of pitch change and final lengthening, without the occurrence of a pause, is sufficient. This mirrors an adult-like perception by eight-months (Holzgrefe-Lang et al., 2016). Six-month-olds detect a prosodic phrase boundary signaled by final lengthening and pause. The findings suggest a developmental change in German prosodic boundary cue perception from a strong reliance on the pause cue at six months to a differentiated sensitivity to the more subtle cues pitch change and final lengthening at eight months.
Neither for six- nor for eight-month-olds the occurrence of pitch change or final lengthening as single cues is sufficient, similar to what has been observed for adult speakers of German (Holzgrefe-Lang et al., 2016). The present dissertation provides new scientific knowledge on infants' sensitivity to individual prosodic phrase boundary cues in the first year of life. Methodologically, the studies are pathbreaking since they used exactly the same stimulus materials - phonologically thoroughly controlled lists of names - that have also been used with adults (Holzgrefe-Lang et al., 2016) and with infants in a neurophysiological paradigm (Holzgrefe-Lang, Wellmann, H{\"o}hle, \& Wartenburger, 2018), allowing for comparisons across age (six/ eight months and adults) and method (behavioral vs. neurophysiological methods). Moreover, materials are suited to be transferred to other languages allowing for a crosslinguistic comparison. Taken together with a study with similar French materials (van Ommen et al., 2020) the observed change in sensitivity in German-learning infants can be interpreted as a language-specific one, from an initial language-general processing mechanism that primarily focuses on the presence of pauses to a language-specific processing that takes into account prosodic properties available in the ambient language. The developmental pattern is discussed as an interplay of acoustic salience, prosodic typology (prosodic regularity) and cue reliability.},
  language  = {en}
}
% PhD thesis (Universitaet Potsdam, 2023) on computational models of feature distortion and cue weighting in sentence comprehension.
% The abstract's mis-encoded "dependen<U+FFFD> cies" (a broken soft hyphen from export) is restored to "dependencies".
% NOTE(review): "iv, 115" looks like a page count (front matter + body), so it is stored in `pagetotal`; confirm.
@phdthesis{Yadav2023,
  author    = {Yadav, Himanshu},
  title     = {A computational evaluation of feature distortion and cue weighting in sentence comprehension},
  school    = {Universit{\"a}t Potsdam},
  doi       = {10.25932/publishup-58505},
  url       = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-585055},
  pagetotal = {iv, 115},
  year      = {2023},
  abstract  = {Successful sentence comprehension requires the comprehender to correctly figure out who did what to whom. For example, in the sentence John kicked the ball, the comprehender has to figure out who did the action of kicking and what was being kicked. This process of identifying and connecting the syntactically-related words in a sentence is called dependency completion. What are the cognitive constraints that determine dependency completion? A widely-accepted theory is cue-based retrieval. The theory maintains that dependency completion is driven by a content-addressable search for the co-dependents in memory. The cue-based retrieval explains a wide range of empirical data from several constructions including subject-verb agreement, subject-verb non-agreement, plausibility mismatch configurations, and negative polarity items. However, there are two major empirical challenges to the theory: (i) Grammatical sentences' data from subject-verb number agreement dependencies, where the theory predicts a slowdown at the verb in sentences like the key to the cabinet was rusty compared to the key to the cabinets was rusty, but the data are inconsistent with this prediction; and, (ii) Data from antecedent-reflexive dependencies, where a facilitation in reading times is predicted at the reflexive in the bodybuilder who worked with the trainers injured themselves vs. the bodybuilder who worked with the trainer injured themselves, but the data do not show a facilitatory effect. The work presented in this dissertation is dedicated to building a more general theory of dependency completion that can account for the above two datasets without losing the original empirical coverage of the cue-based retrieval assumption. In two journal articles, I present computational modeling work that addresses the above two empirical challenges.
To explain the grammatical sentences' data from subject-verb number agreement dependencies, I propose a new model that assumes that the cue-based retrieval operates on a probabilistically distorted representation of nouns in memory (Article I). This hybrid distortion-plus-retrieval model was compared against the existing candidate models using data from 17 studies on subject-verb number agreement in 4 languages. I find that the hybrid model outperforms the existing models of number agreement processing suggesting that the cue-based retrieval theory must incorporate a feature distortion assumption. To account for the absence of facilitatory effect in antecedent-reflexive dependencies, I propose an individual difference model, which was built within the cue-based retrieval framework (Article II). The model assumes that individuals may differ in how strongly they weigh a syntactic cue over a number cue. The model was fitted to data from two studies on antecedent-reflexive dependencies, and the participant-level cue-weighting was estimated. We find that one-fourth of the participants, in both studies, weigh the syntactic cue higher than the number cue in processing reflexive dependencies and the remaining participants weigh the two cues equally. The result indicates that the absence of predicted facilitatory effect at the level of grouped data is driven by some, not all, participants who weigh syntactic cues higher than the number cue. More generally, the result demonstrates that the assumption of differential cue weighting is important for a theory of dependency completion processes. This differential cue weighting idea was independently supported by a modeling study on subject-verb non-agreement dependencies (Article III).
Overall, the cue-based retrieval, which is a general theory of dependency completion, needs to incorporate two new assumptions: (i) the nouns stored in memory can undergo probabilistic feature distortion, and (ii) the linguistic cues used for retrieval can be weighted differentially. This is the cumulative result of the modeling work presented in this dissertation. The dissertation makes an important theoretical contribution: Sentence comprehension in humans is driven by a mechanism that assumes cue-based retrieval, probabilistic feature distortion, and differential cue weighting. This insight is theoretically important because there is some independent support for these three assumptions in sentence processing and the broader memory literature. The modeling work presented here is also methodologically important because for the first time, it demonstrates (i) how the complex models of sentence processing can be evaluated using data from multiple studies simultaneously, without oversimplifying the models, and (ii) how the inferences drawn from the individual-level behavior can be used in theory development.},
  language  = {en}
}