@ARTICLE{TreeBASE2Ref14900,
author = {Gustavo Caetano-Anoll?s and D. Caetano-Anoll?s},
title = {An evolutionarily structured universe of protein architecture.},
year = {2003},
keywords = {},
doi = {10.1101/gr.1161903},
url = {},
pmid = {12840035 },
journal = {Genome Research},
volume = {13},
number = {7},
pages = {1563--1571},
abstract = {Protein structural diversity encompasses a finite set of architectural designs. Embedded in these topologies are evolutionary histories that we here uncover using cladistic principles and measurements of protein-fold usage and sharing. The reconstructed phylogenies are inherently rooted and depict histories of protein and proteome diversification. Proteome phylogenies showed two monophyletic sister-groups delimiting Bacteria and Archaea, and a topology rooted in Eucarya. This suggests three dramatic evolutionary events and a common ancestor with a eukaryotic-like, gene-rich, and relatively modern organization. Conversely, a general phylogeny of protein architectures showed that structural classes of globular proteins appeared early in evolution and in defined order, the alpha/beta class being the first. While most ancestral folds shared a common architecture of barrels or interleaved beta-sheets and alpha-helices, many were clearly derived, such as polyhedral folds in the all-alpha class and beta-sandwiches, beta-propellers, and beta-prisms in all-beta proteins. We also describe transformation pathways of architectures that are prevalently used in nature. For example, beta-barrels with increased curl and stagger were favored evolutionary outcomes in the all-beta class. Interestingly, we found cases where structural change followed the alpha-to-beta tendency uncovered in the tree of architectures. We finally traced the total number of enzymatic functions associated with folds in the trees and showed there was a general link between structure and enzymatic function.}
}
Matrices for Study 1018

Citation title:
"An evolutionarily structured universe of protein architecture.".

This study was previously identified under the legacy study ID S909
(Status: Published).
Matrices