% KDD 1996 conference paper on discovering approximately common ("active")
% motifs in multiple RNA secondary structures represented as ordered trees.
% Citation key is the exporter-generated identifier; it is kept unchanged so
% existing citations continue to resolve. The former `series` field was a
% verbatim copy of `booktitle` and has been dropped to avoid duplicate output.
@inproceedings{4ec7d95011294d3780a89b4401cb29eb,
  author    = {Wang, Jason T. L. and Shapiro, Bruce A. and Shasha, Dennis and Zhang, Kaizhong and Chang, Chia Yo},
  title     = {Automated Discovery of Active Motifs in Multiple {RNA} Secondary Structures},
  editor    = {Simoudis, Evangelos and Han, Jiawei and Fayyad, Usama M.},
  booktitle = {Proceedings - 2nd International Conference on Knowledge Discovery and Data Mining, {KDD} 1996},
  publisher = {AAAI Press},
  pages     = {70--75},
  year      = {1996},
  month     = aug,
  language  = {English (US)},
  note      = {Publisher Copyright: {\textcopyright} 1996 AAAI (www.aaai.org). All Rights Reserved.; 2nd International Conference on Knowledge Discovery and Data Mining, KDD 1996 ; Conference date: 02-08-1996 Through 04-08-1996},
  abstract  = {In this paper we present a method for discovering approximately common motifs (also known as active motifs) in multiple RNA secondary structures. The secondary structures can be represented as ordered trees (i.e., the order among siblings matters). Motifs in these trees are connected subgraphs that can differ in both substitutions and deletions/insertions. The proposed method consists of two steps: (1) find candidate motifs in a small sample of the secondary structures; (2) search all of the secondary structures to determine how frequently these motifs occur (within the allowed approximation) in the secondary structures. To reduce the running time, we develop two optimization heuristics based on sampling and pattern matching techniques. Experimental results obtained by running these algorithms on both generated data and RNA secondary structures show the good performance of the algorithms. To demonstrate the utility of our algorithms, we discuss their applications to conducting the phylogenetic study of RNA sequences obtained from GenBank.},
}