% Conference paper (PRIB 2006 workshop) describing the GeneAlign gene-prediction program.
% Cleanup applied to the raw export:
%   - `language` and `address` were localized (Chinese) strings; translated to ASCII
%     so the entry is safe under classic 8-bit BibTeX.
%   - `%` in the abstract is escaped so styles that print abstracts do not treat the
%     rest of the line as a TeX comment.
%   - The acronym in `booktitle` is brace-protected against style recasing.
% NOTE(review): `address` holds only the country from the export; BibTeX expects the
%   publisher's city here -- TODO confirm and refine.
% NOTE(review): no `volume` (series number) is recorded for this entry -- TODO add
%   after verifying against the publisher's page for the DOI.
@inproceedings{f58f920fbd8342718f1e709767605c6b,
  author    = {Hsieh, {Shu Ju} and Lin, {Chun Yuan} and Liu, {Ning Han} and Tang, {Chuan Yi}},
  title     = {Comparative gene prediction based on gene structure conservation},
  booktitle = {Pattern Recognition in Bioinformatics - International Workshop, {PRIB} 2006, Proceedings},
  series    = {Lecture Notes in Computer Science (including subseries Lecture Notes in Artificial Intelligence and Lecture Notes in Bioinformatics)},
  pages     = {32--41},
  publisher = {Springer Verlag},
  address   = {Germany},
  year      = {2006},
  doi       = {10.1007/11818564_5},
  isbn      = {3540374469},
  language  = {English},
  note      = {International Workshop on Pattern Recognition in Bioinformatics, PRIB 2006 ; Conference date: 20-08-2006 Through 20-08-2006},
  abstract  = {Identifying protein coding genes is one of most important task in newly sequenced genomes. With increasing numbers of gene annotations verified by experiments, it is feasible to identify genes in newly sequenced genomes by comparing with genes annotated on phylogenetically close organisms. Here, we propose a program, GeneAlign, which predicts the genes on one sequence by measuring the similarity between the predicted sequence and related genes annotated on another genome. The program applies CORAL, a heuristic linear time alignment tool, to determine whether the regions flanked by candidate signals are similar with the annotated exons or not. The approach, which employs the conservation of gene structures and sequence homologies between protein coding regions, increases the prediction accuracy. GeneAlign was tested on Projector data set of 449 human-mouse homologous sequence pairs. At the gene level, the sensitivity and specificity of GeneAlign are 80\%, and larger than 96\% at the exon level.},
}