% Haider (2013): doctoral thesis record; the url field holds an nbn-resolving.de URN link.
% Fields are grouped as: bibliographic data, identifiers, then the long abstract.
@phdthesis{Haider2013,
  author   = {Haider, Peter},
  title    = {Prediction with Mixture Models},
  school   = {Universit{\"a}t Potsdam},
  year     = {2013},
  url      = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus-69617},
  language = {en},
  abstract = {Learning a model for the relationship between the attributes and the annotated labels of data examples serves two purposes. Firstly, it enables the prediction of the label for examples without annotation. Secondly, the parameters of the model can provide useful insights into the structure of the data. If the data has an inherent partitioned structure, it is natural to mirror this structure in the model. Such mixture models predict by combining the individual predictions generated by the mixture components which correspond to the partitions in the data. Often the partitioned structure is latent, and has to be inferred when learning the mixture model. Directly evaluating the accuracy of the inferred partition structure is, in many cases, impossible because the ground truth cannot be obtained for comparison. However it can be assessed indirectly by measuring the prediction accuracy of the mixture model that arises from it. This thesis addresses the interplay between the improvement of predictive accuracy by uncovering latent cluster structure in data, and further addresses the validation of the estimated structure by measuring the accuracy of the resulting predictive model. In the application of filtering unsolicited emails, the emails in the training set are latently clustered into advertisement campaigns. Uncovering this latent structure allows filtering of future emails with very low false positive rates. In order to model the cluster structure, a Bayesian clustering model for dependent binary features is developed in this thesis. Knowing the clustering of emails into campaigns can also aid in uncovering which emails have been sent on behalf of the same network of captured hosts, so-called botnets. This association of emails to networks is another layer of latent clustering. 
Uncovering this latent structure allows service providers to further increase the accuracy of email filtering and to effectively defend against distributed denial-of-service attacks. To this end, a discriminative clustering model is derived in this thesis that is based on the graph of observed emails. The partitionings inferred using this model are evaluated through their capacity to predict the campaigns of new emails. Furthermore, when classifying the content of emails, statistical information about the sending server can be valuable. Learning a model that is able to make use of it requires training data that includes server statistics. In order to also use training data where the server statistics are missing, a model that is a mixture over potentially all substitutions thereof is developed. Another application is to predict the navigation behavior of the users of a website. Here, there is no a priori partitioning of the users into clusters, but to understand different usage scenarios and design different layouts for them, imposing a partitioning is necessary. The presented approach simultaneously optimizes the discriminative as well as the predictive power of the clusters. Each model is evaluated on real-world data and compared to baseline methods. The results show that explicitly modeling the assumptions about the latent cluster structure leads to improved predictions compared to the baselines. It is beneficial to incorporate a small number of hyperparameters that can be tuned to yield the best predictions in cases where the prediction accuracy can not be optimized directly.}
}
% Haendel (2018): doctoral thesis record, 122 pages; the url field holds an nbn-resolving.de URN link.
% All non-ASCII letters are written as LaTeX escapes ({\"a}, {\ss}, ...) so the entry stays
% safe for classic 8-bit BibTeX.
% NOTE(review): the abstract is German while language = {en}; presumably the language field
% describes the thesis text itself (the title is English) -- confirm against the source record.
@phdthesis{Haendel2018,
  author    = {H{\"a}ndel, Annabel},
  title     = {Ground-motion model selection and adjustment for seismic hazard analysis},
  url       = {http://nbn-resolving.de/urn:nbn:de:kobv:517-opus4-418123},
  school    = {Universit{\"a}t Potsdam},
  pages     = {122},
  year      = {2018},
  abstract  = {Erdbeben k{\"o}nnen starke Bodenbewegungen erzeugen und es ist wichtig, diese in einer seismischen Gef{\"a}hrdungsanalyse korrekt vorherzusagen. {\"U}blicherweise werden dazu empirisch ermittelte Bodenbewegungsmodelle (GMPE) in einem logischen Baum zusammengef{\"u}gt. Wenn jedoch die Bodenbewegung in einem Gebiet mit geringer Seismizit{\"a}t bestimmen werden soll, dann fehlen in der Regel die Daten, um regionsspezifische GMPEs zu entwickeln. In diesen F{\"a}llen ist es notwendig, auf Modelle aus anderen Gebieten mit guter Datengrundlage zur{\"u}ckzugreifen und diese an die Zielregion anzupassen. Zur korrekten Anpassung werden seismologische Informationen aus der Zielregion wie beispielsweise die standortspezifische D{\"a}mpfung kappa0 ben{\"o}tigt. Diese Parameter lassen sich jedoch ebenfalls nur unzuverl{\"a}ssig bestimmen, wenn die Datengrundlage schlecht ist. In meiner Dissertation besch{\"a}ftige ich mich daher mit der Auswahl von GMPEs f{\"u}r den logischen Baum beziehungsweise deren Anpassung an Regionen mit geringer Seismizit{\"a}t. Ich folge dabei zwei verschiedenen Strategien. Im ersten Ansatz geht es um das Aufstellen eines logischen Baumes, falls kein regionsspezifisches Modell vorhanden ist. Ich stelle eine Methode vor, in der mehrere regionsfremde Modelle zu einem Mixmodell zusammengef{\"u}gt werden. Die Modelle werden dabei je nach ihrer Eignung gewichtet und die Gewichte mittels der wenigen verf{\"u}gbaren Daten aus der Zielregion ermittelt. Ein solches Mixmodell kann als sogenanntes 'Backbone'-Modell verwendet werden, welches in der Lage ist, mittlere Bodenbewegungen in der Zielregion korrekt vorherzusagen. Ich teste diesen Ansatz f{\"u}r Nordchile und acht GMPEs, die f{\"u}r verschiedene Subduktionszonen auf der Welt entwickelt wurden. Die Resultate zeigen, dass das Mixmodell bessere Ergebnisse liefert als die einzelnen GMPEs, die zu seiner Erzeugung genutzt wurden. 
Es ist au{\ss}erdem ebenso gut in der Vorhersage von Bodenbewegungen wie ein Regressionsmodell, welches extra f{\"u}r Nordchile entwickelt wurde. Im zweiten Ansatz besch{\"a}ftige ich mich mit der Bestimmung der standortspezifischen D{\"a}mpfung kappa0. kappa0 ist einer der wichtigsten Parameter zur Anpassung eines GMPEs an eine andere Region. Mein Ziel ist es, kappa0 aus seismischer Bodenunruhe anstelle von Erdbeben zu ermitteln, da diese kontinuierlich aufgezeichnet wird. Mithilfe von Interferometrie kann die Geschwindigkeit und D{\"a}mpfung von seismischen Wellen im Untergrund bestimmt werden. Dazu werden lange Aufzeichnungsreihen seismischer Bodenunruhe entweder kreuzkorreliert oder entfaltet (Dekonvolution). Die Bestimmung der D{\"a}mpfung aus Bodenunruhe bei Frequenzen {\"u}ber 1 Hz und in geringen Tiefen ist jedoch nicht trivial. Ich zeige in meiner Dissertation die Ergebnisse von zwei Studien. In der ersten Studie wird die D{\"a}mpfung von Love-Wellen zwischen 1-4 Hz f{\"u}r ein kleines Testarray in Griechenland ermittelt. In der zweiten Studie verwende ich die Daten einer Bohrloch und einer Oberfl{\"a}chenstation aus dem Vogtland, um die D{\"a}mpfung von S-Wellen zwischen 5-15 Hz zu bestimmen. Diese beiden Studien stellen jedoch nur den Ausgangspunkt f{\"u}r zuk{\"u}nftige Untersuchungen dar, in denen kappa0 direkt aus der seismischer Bodenunruhe hergeleitet werden soll.},
  language  = {en}
}