@article{90666, keywords = {Models, Molecular, Base Sequence, Nucleic Acid Conformation, Computer Simulation, Molecular Sequence Data, Sequence Analysis, RNA, Structure-Activity Relationship, Reproducibility of Results, Sensitivity and Specificity, Models, Statistical, Base Composition}, author = {Ranjan Mukhopadhyay and Eldon Emberly and Chao Tang and Ned Wingreen}, title = {Statistical mechanics of RNA folding: importance of alphabet size.}, abstract = { We construct a base-stacking model of RNA secondary-structure formation and use it to study the mapping from sequence to structure. There are strong, qualitative differences between two-letter and four- or six-letter alphabets. With only two kinds of bases, most sequences have many alternative folding configurations and are consequently thermally unstable. Stable ground states are found only for a small set of structures of high designability, i.e., total number of associated sequences. In contrast, sequences made from four bases, as found in nature, or six bases have far fewer competing folding configurations, resulting in a much greater average stability of the ground state. }, year = {2003}, journal = {Phys Rev E Stat Nonlin Soft Matter Phys}, volume = {68}, pages = {041904}, month = {10/2003}, issn = {1539-3755}, doi = {10.1103/PhysRevE.68.041904}, language = {eng}, }