% Conference paper in the Pacific Symposium on Biocomputing 2007 proceedings.
% Author names use the "Last, First" form so that BibTeX splits surname and
% given names correctly. The proceedings name is stored once, in booktitle;
% a series field carrying the same text would print it twice in most styles.
@inproceedings{88af50cbaef34473902e675acff51e51,
  author    = {Liu, L. Angela and Bader, Joel S.},
  title     = {Ab initio prediction of transcription factor binding sites},
  booktitle = {Pacific Symposium on Biocomputing 2007, PSB 2007},
  pages     = {484--495},
  year      = {2007},
  isbn      = {9812704175},
  language  = {English (US)},
  keywords  = {free energy, hydrogen bond, position weight matrix, transcription factor binding sites},
  abstract  = {Transcription factors are DNA-binding proteins that control gene transcription by binding specific short DNA sequences. Experiments that identify transcription factor binding sites are often laborious and expensive, and the binding sites of many transcription factors remain unknown. We present a computational scheme to predict the binding sites directly from transcription factor sequence using all-atom molecular simulations. This method is a computational counterpart to recent high-throughput experimental technologies that identify transcription factor binding sites (ChIP-chip and protein-dsDNA binding microarrays). The only requirement of our method is an accurate 3D structural model of a transcription factor-DNA complex. We apply free energy calculations by thermodynamic integration to compute the change in binding energy of the complex due to a single base pair mutation. By calculating the binding free energy differences for all possible single mutations, we construct a position weight matrix for the predicted binding sites that can be directly compared with experimental data. As water-bridged hydrogen bonds between the transcription factor and DNA often contribute to the binding specificity, we include explicit solvent in our simulations. We present successful predictions for the yeast MAT-α2 homeodomain and GCN4 bZIP proteins. Water-bridged hydrogen bonds are found to be more prevalent than direct protein-DNA hydrogen bonds at the binding interfaces, indicating why empirical potentials with implicit water may be less successful in predicting binding. Our methodology can be applied to a variety of DNA-binding proteins.},
  note      = {Pacific Symposium on Biocomputing, PSB 2007 ; Conference date: 03-01-2007 Through 07-01-2007},
}