% Journal article on question prosody in Akan.
% NOTE(review): year 2018 next to volume 50 may be the online-first date rather than the issue year -- confirm against the publisher record.
@article{GenzelKuegler2018,
  author    = {Genzel, Susanne and K{\"u}gler, Frank},
  title     = {Production and perception of question prosody in {Akan}},
  journal   = {Journal of the International Phonetic Association},
  volume    = {50},
  number    = {1},
  pages     = {61--92},
  year      = {2018},
  publisher = {Cambridge Univ. Press},
  address   = {Cambridge},
  issn      = {0025-1003},
  doi       = {10.1017/S0025100318000191},
  abstract  = {The paper presents a production experiment investigating the phonetic parameters speakers employ to differentiate Yes-No questions from string-identical statements in Akan, a West-African two-tone Kwa language. Results show that, in comparison to the statement, speakers use a higher pitch register throughout the utterance as a global parameter, and falling f0, longer duration and higher intensity as local parameters on the final syllable of the Yes-No question. Further, two perception experiments (forced-choice identification and gating) investigate the perceptual relevance of the global parameter and the local final parameters. Results show that listeners cannot assess the higher pitch register information to identify the mode of a sentence early on. Rather, identification takes place when the local phonetic parameters on the final vowel are available. The findings point to the superiority of language-specific cues in sentence mode perception. It is suggested that Akan uses a low boundary tone that associates with the right edge of the intonation phrase (L\%) in Yes-No questions. The results are discussed from the point of view of question intonation typology in African languages. It is argued that a classification along the lines of functionally relevant cues is preferable to an impressionistic analysis.},
  language  = {en}
}
% Journal article on wh-/focus fronting in Igbo.
@article{AmaechiGeorgi2020,
  author    = {Amaechi, Mary Chimaobi and Georgi, Doreen},
  title     = {On optional wh-/focus fronting in {Igbo}},
  journal   = {Zeitschrift f{\"u}r Sprachwissenschaft},
  volume    = {39},
  number    = {3},
  pages     = {299--327},
  year      = {2020},
  publisher = {De Gruyter},
  address   = {Berlin},
  issn      = {0721-9067},
  doi       = {10.1515/zfs-2020-2017},
  abstract  = {This paper discusses surface optionality in focus fronting in the Benue-Congo language Igbo. A focused XP can occur in-situ or ex-situ. We argue that the optionality does not have its origins in the syntax: in fact, exactly one focused XP has to move to the designated focus position in the left periphery in the syntax. The alternation between in-situ and ex-situ rather arises at PF: either the lowest or the topmost copy of the focus chain is pronounced. The choice is determined by semantic-pragmatic factors, i. e., we see an interaction between PF and LF. This constitutes a challenge for a strict version of the Y-model of grammar.},
  language  = {en}
}
% PhD thesis on cue-based retrieval models of sentence comprehension.
% NOTE(review): the pages value (iv, 115) looks like front-matter plus body page counts, not a range -- confirm the target style prints it as intended.
@phdthesis{Yadav2023,
  author    = {Yadav, Himanshu},
  title     = {A computational evaluation of feature distortion and cue weighting in sentence comprehension},
  school    = {Universit{\"a}t Potsdam},
  year      = {2023},
  pages     = {iv, 115},
  doi       = {10.25932/publishup-58505},
  url       = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-585055},
  abstract  = {Successful sentence comprehension requires the comprehender to correctly figure out who did what to whom. For example, in the sentence John kicked the ball, the comprehender has to figure out who did the action of kicking and what was being kicked. This process of identifying and connecting the syntactically-related words in a sentence is called dependency completion. What are the cognitive constraints that determine dependency completion? A widely-accepted theory is cue-based retrieval. The theory maintains that dependency completion is driven by a content-addressable search for the co-dependents in memory. The cue-based retrieval explains a wide range of empirical data from several constructions including subject-verb agreement, subject-verb non-agreement, plausibility mismatch configurations, and negative polarity items. However, there are two major empirical challenges to the theory: (i) Grammatical sentences' data from subject-verb number agreement dependencies, where the theory predicts a slowdown at the verb in sentences like the key to the cabinet was rusty compared to the key to the cabinets was rusty, but the data are inconsistent with this prediction; and, (ii) Data from antecedent-reflexive dependencies, where a facilitation in reading times is predicted at the reflexive in the bodybuilder who worked with the trainers injured themselves vs. the bodybuilder who worked with the trainer injured themselves, but the data do not show a facilitatory effect. The work presented in this dissertation is dedicated to building a more general theory of dependency completion that can account for the above two datasets without losing the original empirical coverage of the cue-based retrieval assumption. In two journal articles, I present computational modeling work that addresses the above two empirical challenges.
To explain the grammatical sentences' data from subject-verb number agreement dependencies, I propose a new model that assumes that the cue-based retrieval operates on a probabilistically distorted representation of nouns in memory (Article I). This hybrid distortion-plus-retrieval model was compared against the existing candidate models using data from 17 studies on subject-verb number agreement in 4 languages. I find that the hybrid model outperforms the existing models of number agreement processing suggesting that the cue-based retrieval theory must incorporate a feature distortion assumption. To account for the absence of facilitatory effect in antecedent-reflexive dependencies, I propose an individual difference model, which was built within the cue-based retrieval framework (Article II). The model assumes that individuals may differ in how strongly they weigh a syntactic cue over a number cue. The model was fitted to data from two studies on antecedent-reflexive dependencies, and the participant-level cue-weighting was estimated. We find that one-fourth of the participants, in both studies, weigh the syntactic cue higher than the number cue in processing reflexive dependencies and the remaining participants weigh the two cues equally. The result indicates that the absence of predicted facilitatory effect at the level of grouped data is driven by some, not all, participants who weigh syntactic cues higher than the number cue. More generally, the result demonstrates that the assumption of differential cue weighting is important for a theory of dependency completion processes. This differential cue weighting idea was independently supported by a modeling study on subject-verb non-agreement dependencies (Article III).
Overall, the cue-based retrieval, which is a general theory of dependency completion, needs to incorporate two new assumptions: (i) the nouns stored in memory can undergo probabilistic feature distortion, and (ii) the linguistic cues used for retrieval can be weighted differentially. This is the cumulative result of the modeling work presented in this dissertation. The dissertation makes an important theoretical contribution: Sentence comprehension in humans is driven by a mechanism that assumes cue-based retrieval, probabilistic feature distortion, and differential cue weighting. This insight is theoretically important because there is some independent support for these three assumptions in sentence processing and the broader memory literature. The modeling work presented here is also methodologically important because for the first time, it demonstrates (i) how the complex models of sentence processing can be evaluated using data from multiple studies simultaneously, without oversimplifying the models, and (ii) how the inferences drawn from the individual-level behavior can be used in theory development.},
  language  = {en}
}
% Journal article on models and theories of speech production.
% The second author is entered in "von Last, First" form so the particle "van" is parsed as part of the surname.
% NOTE(review): the pages value 4 looks like a page count, not a range; the DOI suffix suggests article number 1238 -- confirm before changing.
@article{GafosLieshout2020,
  author    = {Gafos, Adamantios I. and van Lieshout, Pascal H. H. M.},
  title     = {Models and theories of speech production},
  journal   = {Frontiers in psychology},
  volume    = {11},
  pages     = {4},
  year      = {2020},
  publisher = {Frontiers Research Foundation},
  address   = {Lausanne},
  issn      = {1664-1078},
  doi       = {10.3389/fpsyg.2020.01238},
  language  = {en}
}
% Journal article (express letter, EL-prefixed page numbers) on overnight consolidation of non-native speech sounds.
@article{FuhrmeisterSmithMyers2020,
  author    = {Fuhrmeister, Pamela and Smith, Garrett and Myers, Emily B.},
  title     = {Overlearning of non-native speech sounds does not result in superior consolidation after a period of sleep},
  journal   = {The journal of the Acoustical Society of America},
  volume    = {147},
  number    = {3},
  pages     = {EL289--EL294},
  year      = {2020},
  publisher = {American Institute of Physics},
  address   = {Melville},
  issn      = {0001-4966},
  doi       = {10.1121/10.0000943},
  abstract  = {Recent studies suggest that sleep-mediated consolidation processes help adults learn non-native speech sounds. However, overnight improvement was not seen when participants learned in the morning, perhaps resulting from native-language interference. The current study trained participants to perceive the Hindi dental/retroflex contrast in the morning and tested whether increased training can lead to overnight improvement. Results showed overnight effects regardless of training amount. In contrast to previous studies, participants in this study heard sounds in limited contexts (i.e., one talker and one vowel context), corroborating other findings, suggesting that overnight improvement is seen in non-native phonetic learning when variability is limited.},
  language  = {en}
}
% PhD thesis on context consistency in neural conversation models.
@phdthesis{Galetzka2022,
  author   = {Galetzka, Fabian},
  title    = {Investigating and improving background context consistency in neural conversation models},
  school   = {Universit{\"a}t Potsdam},
  year     = {2022},
  pages    = {viii, 173},
  doi      = {10.25932/publishup-58463},
  url      = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-584637},
  language = {en},
  abstract = {Neural conversation models aim to predict appropriate contributions to a (given) conversation by using neural networks trained on dialogue data. A specific strand focuses on non-goal driven dialogues, first proposed by Ritter et al. (2011): They investigated the task of transforming an utterance into an appropriate reply. Then, this strand evolved into dialogue system approaches using long dialogue histories and additional background context. Contributing meaningful and appropriate to a conversation is a complex task, and therefore research in this area has been very diverse: Serban et al. (2016), for example, looked into utilizing variable length dialogue histories, Zhang et al. (2018) added additional context to the dialogue history, Wolf et al. (2019) proposed a model based on pre-trained Self-Attention neural networks (Vasvani et al., 2017), and Dinan et al. (2021) investigated safety issues of these approaches. This trend can be seen as a transformation from trying to somehow carry on a conversation to generating appropriate replies in a controlled and reliable way. In this thesis, we first elaborate the meaning of appropriateness in the context of neural conversation models by drawing inspiration from the Cooperative Principle (Grice, 1975). We first define what an appropriate contribution has to be by operationalizing these maxims as demands on conversation models: being fluent, informative, consistent towards given context, coherent and following a social norm. Then, we identify different targets (or intervention points) to achieve the conversational appropriateness by investigating recent research in that field. In this thesis, we investigate the aspect of consistency towards context in greater detail, being one aspect of our interpretation of appropriateness. During the research, we developed a new context-based dialogue dataset (KOMODIS) that combines factual and opinionated context to dialogues. 
The KOMODIS dataset is publicly available and we use the data in this thesis to gather new insights in context-augmented dialogue generation. We further introduced a new way of encoding context within Self-Attention based neural networks. For that, we elaborate the issue of space complexity from knowledge graphs, and propose a concise encoding strategy for structured context inspired from graph neural networks (Gilmer et al., 2017) to reduce the space complexity of the additional context. We discuss limitations of context-augmentation for neural conversation models, explore the characteristics of knowledge graphs, and explain how we create and augment knowledge graphs for our experiments. Lastly, we analyzed the potential of reinforcement and transfer learning to improve context-consistency for neural conversation models. We find that current reward functions need to be more precise to enable the potential of reinforcement learning, and that sequential transfer learning can improve the subjective quality of generated dialogues.}
}
% Short journal contribution (two pages) on older adults and digital language learning.
% NOTE(review): year 2021 next to volume 25 may be the online-first date rather than the issue year -- confirm against the publisher record.
@article{PueblaGarcia2021,
  author    = {Puebla, Cecilia and Garcia, Juan},
  title     = {Advocating the inclusion of older adults in digital language learning technology and research},
  journal   = {Bilingualism : language and cognition},
  volume    = {25},
  number    = {3},
  pages     = {398--399},
  year      = {2021},
  publisher = {Cambridge Univ. Press},
  address   = {New York},
  issn      = {1366-7289},
  doi       = {10.1017/S1366728921000742},
  language  = {en}
}
% Journal article (express letter, EL-prefixed page numbers) on classifying Azerbaijani fricatives.
@article{GhaffarvandMokariSardhaei2020,
  author    = {Ghaffarvand Mokari, Payam and Sardhaei, Nasim Mahdinezhad},
  title     = {Predictive power of cepstral coefficients and spectral moments in the classification of {Azerbaijani} fricatives},
  journal   = {The journal of the Acoustical Society of America},
  volume    = {147},
  number    = {3},
  pages     = {EL228--EL234},
  year      = {2020},
  publisher = {American Institute of Physics},
  address   = {Melville},
  issn      = {0001-4966},
  doi       = {10.1121/10.0000830},
  abstract  = {This study compares the classification of Azerbaijani fricatives based on two sets of features: (a) spectral moments, spectral peak, amplitude, duration, and (b) cepstral coefficients employing Hidden Markov Models to divide each fricative into three regions such that the variances of the measures within each region are minimized. The cepstral coefficients were found to be more reliable predictors in the classification of all nine Azerbaijani fricatives and the cepstral measures yielded highly successful classification rates (91.21\% across both genders) in the identification of the full set of fricatives of Azerbaijani.},
  language  = {en}
}
% Journal article on perceptual narrowing for faces and speech in infancy.
% NOTE(review): the pages value 9 looks like a page count, not a range; the DOI suffix suggests article number 101607 -- confirm before changing.
@article{KrasotkinaGoetzHoehleetal.2021,
  author    = {Krasotkina, Anna and G{\"o}tz, Antonia and H{\"o}hle, Barbara and Schwarzer, Gudrun},
  title     = {Perceptual narrowing in face- and speech-perception domains in infancy},
  journal   = {Infant behavior \& development : an international and interdisciplinary journal},
  volume    = {64},
  pages     = {9},
  year      = {2021},
  publisher = {Elsevier},
  address   = {New York},
  issn      = {0163-6383},
  doi       = {10.1016/j.infbeh.2021.101607},
  abstract  = {During the first year of life, infants undergo a process known as perceptual narrowing, which reduces their sensitivity to classes of stimuli which the infants do not encounter in their environment. It has been proposed that perceptual narrowing for faces and speech may be driven by shared domain-general processes. To investigate this theory, our study longitudinally tested 50 German Caucasian infants with respect to these domains first at 6 months of age followed by a second testing at 9 months of age. We used an infant-controlled habituation-dishabituation paradigm to test the infants' ability to discriminate among other-race Asian faces and non-native Cantonese speech tones, as well as same-race Caucasian faces as a control. We found that while at 6 months of age infants could discriminate among all stimuli, by 9 months of age they could no longer discriminate among other-race faces or non-native tones. However, infants could discriminate among same-race stimuli both at 6 and at 9 months of age. These results demonstrate that the same infants undergo perceptual narrowing for both other-race faces and non-native speech tones between the ages of 6 and 9 months. This parallel development of perceptual narrowing occurring in both the face and speech perception modalities over the same period of time lends support to the domain-general theory of perceptual narrowing in face and speech perception.},
  language  = {en}
}
% Journal article on word order and temporal reference in Vietnamese.
% NOTE(review): "A cross-categorial view" in the abstract was restored from the garbled "Acrosscategorial view" -- confirm against the published abstract.
@article{Tran2021,
  author    = {Tran, Thuan},
  title     = {Non-canonical word order and temporal reference in {Vietnamese}},
  journal   = {Linguistics : an interdisciplinary journal of the language sciences},
  volume    = {59},
  number    = {1},
  pages     = {1--34},
  year      = {2021},
  publisher = {De Gruyter Mouton},
  address   = {Berlin},
  issn      = {0024-3949},
  doi       = {10.1515/ling-2020-0256},
  abstract  = {The paper revisits Duffield's (2007) (Duffield, Nigel. 2007. Aspects of Vietnamese clausal structure: Separating tense from assertion. Linguistics 45(4). 765-814) analysis of the correlation between the position of a 'when'-phrase and the temporal reference of a bare sentence in Vietnamese. Bare sentences in Vietnamese, based on (Smith, Carlota S. \& Mary S. Erbaugh. 2005. Temporal interpretation in Mandarin Chinese. Linguistics 43(4). 713-756), are argued to obtain their temporal interpretation from their aspectual composition, and the default temporal reference: bounded events are located in the past, unbounded events at present. It is shown that the correlation so observed in when-questions is superficial, and is tied to the syntax and semantics of temporal modification and the requirement that temporal adverbials denoting future time is base generated in sentence-initial position, and past time adverbials in sentence-final position. A 'when'-phrase, being temporally underspecified, obtains its temporal value from its base position. However, the correlation between word order and temporal reference in argument wh-questions and declaratives is factual, depending on whether the predicate-argument configuration allows for a telic interpretation or not. To be specific, it is dependent on whether the application of Generic Modification (Snyder, William. 2012. Parameter theory and motion predicates. In Violeta Demonte \& Louise McNally (eds.), Telicity, change, and state. A cross-categorial view of event structure, 279-299. Oxford: Oxford University Press) or accomplishment composition is realized. Canonical declaratives, and argument wh-questions, with telicity inducing material, license GM or accomplishment composition, yielding bounded events, hence past; by contrast, their noncanonical counterparts block GM or accomplishment composition, giving rise to unbounded event descriptions, hence non-past.},
  language  = {en}
}