@inbook{36d52a78ab974baea2cec9c81074ec43,
title = "A Decomposition Approach for Discovering Discriminative Motifs in a Sequence Database",
abstract = "Considerable effort has been invested over the years in ad-hoc algorithms for item set and pattern mining. Constraint programming has recently been proposed as a means to tackle item set mining tasks within a general modelling framework. We follow this approach to address the discovery of discriminative n-ary motifs in databases of labeled sequences. We define a n-ary motif as a mapping of n patterns to n class-wide embeddings and we restrict the interpretation of constraints on a motif to the sequences embedding all patterns. We formulate core constraints that minimize redundancy between motifs and introduce a general constraint optimization framework to compute common and exclusive motifs. We cast the discovery of closed and replication-free motifs in this framework for which we propose a two-stage approach based on constraint programming. Experimental results on datasets of protein sequences demonstrate the efficiency of the approach.",
keywords = "Bioinformatics, Constraint Programming, Motifs, Optimization",
author = "David Lesaint and Deepak Mehta and Barry O'Sullivan and Vincent Vigneron",
note = "Publisher Copyright: {\textcopyright} 2014 IEEE.; 26th IEEE International Conference on Tools with Artificial Intelligence, ICTAI 2014 ; Conference date: 10-11-2014 Through 12-11-2014",
year = "2014",
month = dec,
day = "12",
doi = "10.1109/ICTAI.2014.88",
language = "English",
series = "Proceedings - International Conference on Tools with Artificial Intelligence, ICTAI",
publisher = "IEEE Computer Society",
pages = "544--551",
booktitle = "Proceedings - 2014 IEEE 26th International Conference on Tools with Artificial Intelligence, ICTAI 2014",
address = "United States",
}