% Working papers of the SFB 632 (ISIS), issues 1 (2004) and 2 (2005).
%
% Conventions used for the records below:
%   - one field per line, author/title first, abstract last;
%   - the journal name is defined once as a string macro and referenced by
%     every entry, so it cannot drift between two spellings;
%   - the former "series" field, which repeated the journal name verbatim,
%     has been dropped so that styles which print an article's series do not
%     print the name twice;
%   - page ranges use an unspaced double hyphen;
%   - words in titles that must keep their capitalisation (acronyms, proper
%     nouns, German nouns) are wrapped in braces.
%
% NOTE(review): FeryHerbst2004 carries a different ISSN (1614-4708) and an
% editor field that the other records lack; both values are kept exactly as
% found. Confirm against the publisher record which ISSN is intended.

@string{ISIS_SFB632 = {Interdisciplinary studies on information structure : {ISIS} ; working papers of the {SFB} 632}}

@article{Luedeling2005,
  author   = {L{\"u}deling, Anke},
  title    = {Heterogeneity and standardization in data, use, and annotation},
  journal  = ISIS_SFB632,
  number   = {2},
  pages    = {43--54},
  year     = {2005},
  issn     = {1866-4725},
  url      = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus-8643},
  language = {en},
  abstract = {This paper describes the standardization problems that come up
              in a diachronic corpus: it has to cope with differing standards
              with regard to diplomaticity, annotation, and header
              information. Such highly heterogeneous texts must be
              standardized to allow for comparative research without (too
              much) loss of information.},
}

@article{Schmidt2005,
  author   = {Schmidt, Thomas},
  title    = {{EXMARaLDA} und {Datenbank} ``{Mehrsprachigkeit}''},
  journal  = ISIS_SFB632,
  number   = {2},
  pages    = {21--42},
  year     = {2005},
  issn     = {1866-4725},
  url      = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus-8636},
  language = {de},
  abstract = {This paper presents some concepts and principles used in the
              development of a database of multilingual spoken discourse at
              the University of Hamburg. The emphasis of the first part is on
              general considerations for the handling of heterogeneous data
              sets: After showing that diversity in transcription data is
              partly conceptually and partly technologically motivated, it is
              argued that the processing of transcription corpora should be
              approached via a three-level architecture which separates form
              (application) and content (data) on the one hand, and logical
              and physical data structures on the other hand. Such an
              architecture does not only pave the way for modern
              text-technological approaches to linguistic data processing, it
              can also help to decide where and how a standardization in the
              work with heterogeneous data is possible and desirable and
              where it would run counter to the needs of the research
              community. It is further argued that, in order to ensure user
              acceptance, new solutions developed in this approach must take
              care not to abandon established concepts too quickly. The focus
              of the second part is on some practical experiences with users
              and technologies gained in the four years' project work.
              Concerning the practical development work, the value of open
              standards like XML and Unicode is emphasized and some
              limitations of the "platform-independent" JAVA technology are
              indicated. With respect to users of the EXMARaLDA system, a
              predominantly conservative attitude towards technological
              innovations in transcription corpus work can be stated:
              individual users tend to stick to known functionalities and are
              reluctant to adopt themselves to the new possibilities.
              Furthermore, an active commitment to cooperative corpus work
              still seems to be the exception rather than the rule. It is
              concluded that technological innovations can contribute their
              share to a progress in the work with heterogeneous linguistic
              data, but that they will have to be supplemented, in the long
              run, with an adequate methodological reflection and the
              creation of an appropriate infrastructure.},
}

@article{Wagner2005,
  author   = {Wagner, Andreas},
  title    = {Unity in diversity},
  journal  = ISIS_SFB632,
  number   = {2},
  pages    = {1--20},
  year     = {2005},
  issn     = {1866-4725},
  url      = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus-8625},
  language = {en},
  abstract = {This paper describes the creation and preparation of TUSNELDA,
              a collection of corpus data built for linguistic research. This
              collection contains a number of linguistically annotated
              corpora which differ in various aspects such as language, text
              sorts / data types, encoded annotation levels, and linguistic
              theories underlying the annotation. The paper focuses on this
              variation on the one hand and the way how these heterogeneous
              data are integrated into one resource on the other hand.},
}

@article{DipperGoetzeStedeetal.2004,
  author   = {Dipper, Stefanie and G{\"o}tze, Michael and Stede, Manfred and Wegst, Tillmann},
  title    = {{ANNIS}},
  journal  = ISIS_SFB632,
  number   = {1},
  pages    = {245--279},
  year     = {2004},
  issn     = {1866-4725},
  url      = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus-8432},
  language = {en},
  abstract = {In this paper, we discuss the design and implementation of our
              first version of the database "ANNIS" ("ANNotation of
              Information Structure"). For research based on empirical data,
              ANNIS provides a uniform environment for storing this data
              together with its linguistic annotations. A central database
              promotes standardized annotation, which facilitates
              interpretation and comparison of the data. ANNIS is used
              through a standard web browser and offers tier-based
              visualization of data and annotations, as well as search
              facilities that allow for cross-level and cross-sentential
              queries. The paper motivates the design of the system,
              characterizes its user interface, and provides an initial
              technical evaluation of ANNIS with respect to data size and
              query processing.},
}

@article{HartmannZimmermann2004,
  author   = {Hartmann, Katharina and Zimmermann, Malte},
  title    = {Focus strategies in {Chadic}},
  journal  = ISIS_SFB632,
  number   = {1},
  pages    = {207--243},
  year     = {2004},
  issn     = {1866-4725},
  url      = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus-8423},
  language = {en},
  abstract = {We argue that the standard focus theories reach their limits
              when confronted with the focus systems of the Chadic languages.
              The backbone of the standard focus theories consists of two
              assumptions, both called into question by the languages under
              consideration. Firstly, it is standardly assumed that focus is
              generally marked by stress. The Chadic languages, however,
              exhibit a variety of different devices for focus marking.
              Secondly, it is assumed that focus is always marked. In
              Tangale, at least, focus is not marked consistently on all
              types of constituents. The paper offers two possible solutions
              to this dilemma.},
}

@article{JasinskajaMayerSchlangen2004,
  author   = {Jasinskaja, Ekaterina and Mayer, J{\"o}rg and Schlangen, David},
  title    = {Discourse structure and information structure},
  journal  = ISIS_SFB632,
  number   = {1},
  pages    = {151--206},
  year     = {2004},
  issn     = {1866-4725},
  url      = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus-8414},
  language = {en},
  abstract = {In this paper we review the current state of research on the
              issue of discourse structure (DS)/information structure (IS)
              interface. This field has received a lot of attention from
              discourse semanticists and pragmatists, and has made
              substantial progress in recent years. In this paper we
              summarize the relevant studies. In addition, we look at the
              issue of DS/IS-interaction at a different level - that of
              phonetics. It is known that both information structure and
              discourse structure can be realized prosodically, but the issue
              of phonetic interaction between the prosodic devices they
              employ has hardly ever been discussed in this context. We think
              that a proper consideration of this aspect of DS/IS-interaction
              would enrich our understanding of the phenomenon, and hence we
              formulate some related research-programmatic positions.},
}

@article{Ishihara2004,
  author   = {Ishihara, Shinichiro},
  title    = {Prosody by phase},
  journal  = ISIS_SFB632,
  number   = {1},
  pages    = {77--119},
  year     = {2004},
  issn     = {1866-4725},
  url      = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus-8391},
  language = {en},
  abstract = {Japanese wh-questions always exhibit focus intonation (FI).
              Furthermore, the domain of FI exhibits a correspondence to the
              wh-scope. I propose that this phonology-semantics
              correspondence is a result of the cyclic computation of FI,
              which is explained under the notion of Multiple Spell-Out in
              the recent Minimalist framework. The proposed analysis makes
              two predictions: (1) embedding of an FI into another is
              possible; (2) (overt) movement of a wh-phrase to a phase edge
              position causes a mismatch between FI and wh-scope. Both
              predictions are tested experimentally, and shown to be borne
              out.},
}

@article{EndrissHinterwimmer2004,
  author   = {Endriss, Cornelia and Hinterwimmer, Stefan},
  title    = {The influence of tense in adverbial quantification},
  journal  = ISIS_SFB632,
  number   = {1},
  pages    = {121--151},
  year     = {2004},
  issn     = {1866-4725},
  url      = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus-8409},
  language = {en},
  abstract = {We argue that there is a crucial difference between determiner
              and adverbial quantification. Following Herburger [2000] and
              von Fintel [1994], we assume that determiner quantifiers
              quantify over individuals and adverbial quantifiers over
              eventualities. While it is usually assumed that the semantics
              of sentences with determiner quantifiers and those with
              adverbial quantifiers basically come out the same, we will show
              by way of new data that quantification over events is more
              restricted than quantification over individuals. This is
              because eventualities in contrast to individuals have to be
              located in time which is done using contextual information
              according to a pragmatic resolution strategy. If the contextual
              information and the tense information given in the respective
              sentence contradict each other, the sentence is
              uninterpretable. We conclude that this is the reason why in
              these cases adverbial quantification, i.e. quantification over
              eventualities, is impossible whereas quantification over
              individuals is fine.},
}

% The abstract below previously ended with a verbatim copy of the
% Ishihara2004 abstract (Japanese wh-questions / focus intonation); that
% foreign text has been removed.
@article{Fanselow2004,
  author   = {Fanselow, Gisbert},
  title    = {Cyclic phonology-syntax-interaction},
  journal  = ISIS_SFB632,
  number   = {1},
  pages    = {1--42},
  year     = {2004},
  issn     = {1866-4725},
  url      = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus-8264},
  language = {en},
  abstract = {This paper investigates the nature of the attraction of XPs to
              clause-initial position in German (and other languages). It
              argues that there are two different types of preposing. First,
              an XP can move when it is attracted by an EPP-like feature of
              Comp. Comp can, however, also attract elements that bear the
              formal marker of some semantic or pragmatic (information
              theoretic) function. This second type of movement is driven by
              the attraction of a formal property of the moved element. It
              has often been misanalysed as "operator" movement in the past.},
}

% As with Fanselow2004, a trailing copy of the Ishihara2004 abstract has
% been removed from the abstract below. The surname accent is written with
% the LaTeX acute-accent command inside a brace group.
@article{FeryHerbst2004,
  author   = {F{\'e}ry, Caroline and Herbst, Laura},
  title    = {{German} sentence accent revisited},
  journal  = ISIS_SFB632,
  number   = {1},
  editor   = {Ishihara, Shinichiro and Schmitz, Michaela and Schwarz, Anne},
  pages    = {43--75},
  year     = {2004},
  issn     = {1614-4708},
  url      = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus-8273},
  language = {en},
  abstract = {Results of a production experiment on the placement of sentence
              accent in German are reported. The hypothesis that German
              fulfills some of the most widely accepted rules of accent
              assignment---predicting focus domain integration---was only
              partly confirmed. Adjacency between argument and verb induces a
              single accent on the argument, as recognized in the literature,
              but interruption of this sequence by a modifier often induces
              remodeling of the accent pattern with a single accent on the
              modifier. The verb is rarely stressed. All models based on
              linear alignment or adjacency between elements belonging to a
              single accent domain fail to account for this result. A cyclic
              analysis of prosodic domain formation is proposed in an
              optimality-theoretic framework that can explain the accent
              pattern.},
}