@ARTICLE{TreeBASE2Ref18560,
author = {Mieczyslaw Wolsan and Jun J Sato},
title = {Effects of data incompleteness on the relative performance of parsimony and Bayesian approaches in a supermatrix phylogenetic reconstruction of Mustelidae and Procyonidae (Carnivora)},
year = {2010},
keywords = {},
doi = {10.1111/j.1096-0031.2009.00281.x},
url = {},
pmid = {},
journal = {Cladistics},
volume = {26},
number = {},
pages = {168--194},
abstract = {Missing data are commonly thought to impede a resolved or accurate reconstruction of phylogenetic relationships, and probabilistic analysis techniques (such as Bayesian inference or maximum likelihood) are increasingly viewed as less vulnerable to the negative effects of data incompleteness than parsimony. We test both assumptions empirically by conducting parsimony and Bayesian analyses on a ~1.5 ~ 106-cell (27,965 characters ~ 52 species) mustelid-procyonid molecular supermatrix with 62.7% missing entries. Contrary to the first assumption, phylogenetic relationships inferred from our analyses are fully (Bayesian) or almost fully (parsimony) resolved topologically with mostly strong support and also largely in accord with prior molecular estimations of mustelid and procyonid phylogeny derived with parsimony, Bayesian, and other probabilistic analysis techniques from smaller but complete or nearly complete data sets. Contrary to the second assumption, we found no compelling evidence in support of a relationship between the inferior performance of parsimony and taxon incompleteness (i.e., the proportion of missing character data for a taxon), although we found evidence for a connection between the inferior performance of parsimony and character incompleteness (i.e., no overlap in character data between some taxa). The relatively good performance of our analyses may be related to the large number of sampled characters, so that most taxa (even highly incomplete ones) are represented by a sufficient number of characters allowing both approaches to resolve their relationships.}
}
Citation for Study 10069
Citation title:
"Effects of data incompleteness on the relative performance of parsimony and Bayesian approaches in a supermatrix phylogenetic reconstruction of Mustelidae and Procyonidae (Carnivora)".
This study was previously identified under the legacy study ID S2409
(Status: Published).
Citation
Wolsan M., & Sato J. 2010. Effects of data incompleteness on the relative performance of parsimony and Bayesian approaches in a supermatrix phylogenetic reconstruction of Mustelidae and Procyonidae (Carnivora). Cladistics, 26: 168-194.
Authors
Abstract
Missing data are commonly thought to impede a resolved or accurate reconstruction of phylogenetic relationships, and probabilistic analysis techniques (such as Bayesian inference or maximum likelihood) are increasingly viewed as less vulnerable to the negative effects of data incompleteness than parsimony. We test both assumptions empirically by conducting parsimony and Bayesian analyses on a ~1.5 ~ 106-cell (27,965 characters ~ 52 species) mustelid-procyonid molecular supermatrix with 62.7% missing entries. Contrary to the first assumption, phylogenetic relationships inferred from our analyses are fully (Bayesian) or almost fully (parsimony) resolved topologically with mostly strong support and also largely in accord with prior molecular estimations of mustelid and procyonid phylogeny derived with parsimony, Bayesian, and other probabilistic analysis techniques from smaller but complete or nearly complete data sets. Contrary to the second assumption, we found no compelling evidence in support of a relationship between the inferior performance of parsimony and taxon incompleteness (i.e., the proportion of missing character data for a taxon), although we found evidence for a connection between the inferior performance of parsimony and character incompleteness (i.e., no overlap in character data between some taxa). The relatively good performance of our analyses may be related to the large number of sampled characters, so that most taxa (even highly incomplete ones) are represented by a sufficient number of characters allowing both approaches to resolve their relationships.
External links
About this resource
- Canonical resource URI:
http://purl.org/phylo/treebase/phylows/study/TB2:S10069
- Other versions:
Nexus
NeXML
- Show BibTeX reference
@ARTICLE{TreeBASE2Ref18560,
author = {Mieczyslaw Wolsan and Jun J Sato},
title = {Effects of data incompleteness on the relative performance of parsimony and Bayesian approaches in a supermatrix phylogenetic reconstruction of Mustelidae and Procyonidae (Carnivora)},
year = {2010},
keywords = {},
doi = {10.1111/j.1096-0031.2009.00281.x},
url = {},
pmid = {},
journal = {Cladistics},
volume = {26},
number = {},
pages = {168--194},
abstract = {Missing data are commonly thought to impede a resolved or accurate reconstruction of phylogenetic relationships, and probabilistic analysis techniques (such as Bayesian inference or maximum likelihood) are increasingly viewed as less vulnerable to the negative effects of data incompleteness than parsimony. We test both assumptions empirically by conducting parsimony and Bayesian analyses on a ~1.5 ~ 106-cell (27,965 characters ~ 52 species) mustelid-procyonid molecular supermatrix with 62.7% missing entries. Contrary to the first assumption, phylogenetic relationships inferred from our analyses are fully (Bayesian) or almost fully (parsimony) resolved topologically with mostly strong support and also largely in accord with prior molecular estimations of mustelid and procyonid phylogeny derived with parsimony, Bayesian, and other probabilistic analysis techniques from smaller but complete or nearly complete data sets. Contrary to the second assumption, we found no compelling evidence in support of a relationship between the inferior performance of parsimony and taxon incompleteness (i.e., the proportion of missing character data for a taxon), although we found evidence for a connection between the inferior performance of parsimony and character incompleteness (i.e., no overlap in character data between some taxa). The relatively good performance of our analyses may be related to the large number of sampled characters, so that most taxa (even highly incomplete ones) are represented by a sufficient number of characters allowing both approaches to resolve their relationships.}
}
- Show RIS reference
TY - JOUR
ID - 18560
AU - Wolsan,Mieczyslaw
AU - Sato,Jun J
T1 - Effects of data incompleteness on the relative performance of parsimony and Bayesian approaches in a supermatrix phylogenetic reconstruction of Mustelidae and Procyonidae (Carnivora)
PY - 2010
KW -
UR -
N2 - Missing data are commonly thought to impede a resolved or accurate reconstruction of phylogenetic relationships, and probabilistic analysis techniques (such as Bayesian inference or maximum likelihood) are increasingly viewed as less vulnerable to the negative effects of data incompleteness than parsimony. We test both assumptions empirically by conducting parsimony and Bayesian analyses on a ~1.5 ~ 106-cell (27,965 characters ~ 52 species) mustelid-procyonid molecular supermatrix with 62.7% missing entries. Contrary to the first assumption, phylogenetic relationships inferred from our analyses are fully (Bayesian) or almost fully (parsimony) resolved topologically with mostly strong support and also largely in accord with prior molecular estimations of mustelid and procyonid phylogeny derived with parsimony, Bayesian, and other probabilistic analysis techniques from smaller but complete or nearly complete data sets. Contrary to the second assumption, we found no compelling evidence in support of a relationship between the inferior performance of parsimony and taxon incompleteness (i.e., the proportion of missing character data for a taxon), although we found evidence for a connection between the inferior performance of parsimony and character incompleteness (i.e., no overlap in character data between some taxa). The relatively good performance of our analyses may be related to the large number of sampled characters, so that most taxa (even highly incomplete ones) are represented by a sufficient number of characters allowing both approaches to resolve their relationships.
L3 - 10.1111/j.1096-0031.2009.00281.x
JF - Cladistics
VL - 26
IS -
SP - 168
EP - 194
ER -