Traditionally, phylogenetic analyses over many genes combine data into a contiguous block. Under this concatenated model, all genes are assumed to evolve at the same rate. However, it is clear that genes evolve at very different rates and that accounting for this rate heterogeneity is important if we are to accurately infer phylogenies from heterogeneous multigene data sets. There remain open questions regarding how best to incorporate gene rate parameters into phylogenetic models and which properties of real data correlate with improved fit over the concatenated model. In this study, two methods of accounting for gene rate heterogeneity are compared: the n-parameter method, which allows for each of the n gene partitions to have a gene rate parameter, and the alpha-parameter method, which fits a distribution to the gene rates. Results demonstrate that the n-parameter method is both computationally faster and in general provides a better fit over the concatenated model than the alpha-parameter method. Furthermore, improved model fit over the concatenated model is highly correlated with the presence of a gene with a slow relative rate of evolution.
McGill Centre for Bioinformatics, McGill University, Duff Medical Building, 3775 University Street, Montreal, Quebec, H3A 2B4, Canada. rbbevan@gmail.com
year
2007
month
Jul
journal
Syst Biol
number
2
pages
194--205
volume
56
pmid
17464878
pst
ppublish
issn
1063-5157 (Print)
jt
Systematic biology
edat
2007/04/28 09:00
date-modified
2009-01-28 13:04:38 +1300
mhda
2007/07/13 09:00
jid
9302532
crdt
2007/04/28 09:00
dcom
20070712
da
20070427
so
Syst Biol. 2007 Apr;56(2):194-205.
stat
MEDLINE
au
Bevan, RB and Bryant, D and Lang, BF
pii
777715695
sb
IM
pl
England
pt
Comparative Study; Journal Article; Research Support, Non-U.S. Gov't
%0 Journal Article
%1 Bevan07
%A Bevan, Rachel B
%A Bryant, David
%A Lang, B Franz
%C McGill Centre for Bioinformatics, McGill University, Duff Medical Building, 3775 University Street, Montreal, Quebec, H3A 2B4, Canada. rbbevan@gmail.com
%D 2007
%J Syst Biol
%K *Genetic *Models *Phylogeny Computer Evolution Genes Genetic Heterogeneity Molecular Simulation from:davidjamesbryant
%N 2
%P 194--205
%R 10.1080/10635150701291804
%T Accounting for gene rate heterogeneity in phylogenetic inference.
%U http://dx.doi.org/10.1080/10635150701291804
%V 56
%X Traditionally, phylogenetic analyses over many genes combine data into a contiguous block. Under this concatenated model, all genes are assumed to evolve at the same rate. However, it is clear that genes evolve at very different rates and that accounting for this rate heterogeneity is important if we are to accurately infer phylogenies from heterogeneous multigene data sets. There remain open questions regarding how best to incorporate gene rate parameters into phylogenetic models and which properties of real data correlate with improved fit over the concatenated model. In this study, two methods of accounting for gene rate heterogeneity are compared: the n-parameter method, which allows for each of the n gene partitions to have a gene rate parameter, and the alpha-parameter method, which fits a distribution to the gene rates. Results demonstrate that the n-parameter method is both computationally faster and in general provides a better fit over the concatenated model than the alpha-parameter method. Furthermore, improved model fit over the concatenated model is highly correlated with the presence of a gene with a slow relative rate of evolution.
@article{Bevan07,
abstract = {Traditionally, phylogenetic analyses over many genes combine data into a contiguous block. Under this concatenated model, all genes are assumed to evolve at the same rate. However, it is clear that genes evolve at very different rates and that accounting for this rate heterogeneity is important if we are to accurately infer phylogenies from heterogeneous multigene data sets. There remain open questions regarding how best to incorporate gene rate parameters into phylogenetic models and which properties of real data correlate with improved fit over the concatenated model. In this study, two methods of accounting for gene rate heterogeneity are compared: the n-parameter method, which allows for each of the n gene partitions to have a gene rate parameter, and the alpha-parameter method, which fits a distribution to the gene rates. Results demonstrate that the n-parameter method is both computationally faster and in general provides a better fit over the concatenated model than the alpha-parameter method. Furthermore, improved model fit over the concatenated model is highly correlated with the presence of a gene with a slow relative rate of evolution.},
added-at = {2009-05-14T15:26:58.000+0200},
address = {McGill Centre for Bioinformatics, McGill University, Duff Medical Building, 3775 University Street, Montreal, Quebec, H3A 2B4, Canada. rbbevan@gmail.com},
au = {Bevan, RB and Bryant, D and Lang, BF},
author = {Bevan, Rachel B and Bryant, David and Lang, B Franz},
biburl = {https://www.bibsonomy.org/bibtex/22a1f4a342b5cf4e1feae75c96422a3ce/compevol},
crdt = {2007/04/28 09:00},
da = {20070427},
date-modified = {2009-01-28 13:04:38 +1300},
dcom = {20070712},
doi = {10.1080/10635150701291804},
edat = {2007/04/28 09:00},
interhash = {f1f76a6c5d10eb3477e96589507b9572},
intrahash = {2a1f4a342b5cf4e1feae75c96422a3ce},
issn = {1063-5157 (Print)},
jid = {9302532},
journal = {Syst Biol},
jt = {Systematic biology},
keywords = {*Genetic *Models *Phylogeny Computer Evolution Genes Genetic Heterogeneity Molecular Simulation from:davidjamesbryant},
language = {eng},
mhda = {2007/07/13 09:00},
month = Jul,
number = 2,
own = {NLM},
pages = {194--205},
pii = {777715695},
pl = {England},
pmid = {17464878},
pst = {ppublish},
pt = {Comparative Study; Journal Article; Research Support, Non-U.S. Gov't},
sb = {IM},
so = {Syst Biol. 2007 Apr;56(2):194-205.},
stat = {MEDLINE},
timestamp = {2009-05-14T15:26:58.000+0200},
title = {Accounting for gene rate heterogeneity in phylogenetic inference.},
url = {http://dx.doi.org/10.1080/10635150701291804},
volume = 56,
year = 2007
}