diff --git a/phd_thesis.bib b/phd_thesis.bib index 1e2f2dc..08028d8 100644 --- a/phd_thesis.bib +++ b/phd_thesis.bib @@ -1,7515 +1,4719 @@ -@misc{center_for_history_and_new_media_guide_nodate, - title = {Guide rapide pour débuter}, - url = {http://zotero.org/support/quick_start_guide}, - author = {{Center for History and New Media}} -} - -@article{huang_cellular_2007, - title = {Cellular {microRNAs} contribute to {HIV}-1 latency in resting primary {CD}4+ {T} lymphocytes}, - volume = {13}, - copyright = {© 2007 Nature Publishing Group}, - issn = {1078-8956}, - url = {http://www.nature.com/nm/journal/v13/n10/full/nm1639.html}, - doi = {10.1038/nm1639}, - abstract = {The latency of human immunodeficiency virus type 1 (HIV-1) in resting primary CD4+ T cells is the major barrier for the eradication of the virus in patients on suppressive highly active antiretroviral therapy (HAART). Even with optimal HAART treatment, replication-competent HIV-1 still exists in resting primary CD4+ T cells. Multiple restriction factors that act upon various steps of the viral life cycle could contribute to viral latency. Here we show that cellular microRNAs (miRNAs) potently inhibit HIV-1 production in resting primary CD4+ T cells. We have found that the 3' ends of HIV-1 messenger RNAs are targeted by a cluster of cellular miRNAs including miR-28, miR-125b, miR-150, miR-223 and miR-382, which are enriched in resting CD4+ T cells as compared to activated CD4+ T cells. Specific inhibitors of these miRNAs substantially counteracted their effects on the target mRNAs, measured either as HIV-1 protein translation in resting CD4+ T cells transfected with HIV-1 infectious clones, or as HIV-1 virus production from resting CD4+ T cells isolated from HIV-1–infected individuals on suppressive HAART. Our data indicate that cellular miRNAs are pivotal in HIV-1 latency and suggest that manipulation of cellular miRNAs could be a novel approach for purging the HIV-1 reservoir.}, - language = {en}, - number = {10}, - urldate = {2013-10-08}, - journal = {Nature Medicine}, - author = {Huang, Jialing and Wang, Fengxiang and Argyris, Elias and Chen, Keyang and Liang, Zhihui and Tian, Heng and Huang, Wenlin and Squires, Kathleen and Verlinghieri, Gwen and Zhang, Hui}, - month = oct, - year = {2007}, - keywords = {HIV, bone, cancer, cardiology, cardiovascular disease, content, diabetes, heart, immunity, immunology, infectious diseases, journal, medical technologies, medicine, metabolic syndrome, metabolism, microbiology, molecular medicine, nature, nature medicine, nature publishing group, neurodegeneration, neurology, neuroscience, obesity, oncology, physician, physician scientist, physiology, reproductive biology, stem cells, transplantation, virology}, - pages = {1241--1247}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4ZHR3SEF/Huang et al. - 2007 - Cellular microRNAs contribute to HIV-1 latency in .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6UJM3GFQ/nm1639.html:text/html} -} - -@article{schopman_deep_2012, - title = {Deep sequencing of virus-infected cells reveals {HIV}-encoded small {RNAs}}, - volume = {40}, - issn = {0305-1048, 1362-4962}, - url = {http://nar.oxfordjournals.org/content/40/1/414}, - doi = {10.1093/nar/gkr719}, - abstract = {Small virus-derived interfering RNAs (viRNAs) play an important role in antiviral defence in plants, insects and nematodes by triggering the RNA interference (RNAi) pathway. The role of RNAi as an antiviral defence mechanism in mammalian cells has been obscure due to the lack of viRNA detection. Although viRNAs from different mammalian viruses have recently been identified, their functions and possible impact on viral replication remain unknown. To identify viRNAs derived from HIV-1, we used the extremely sensitive SOLiDTM 3 Plus System to analyse viRNA accumulation in HIV-1-infected T lymphocytes. We detected numerous small RNAs that correspond to the HIV-1 RNA genome. The majority of these sequences have a positive polarity (98.1\%) and could be derived from miRNAs encoded by structured segments of the HIV-1 RNA genome (vmiRNAs). A small portion of the viRNAs is of negative polarity and most of them are encoded within the 3′-UTR, which may represent viral siRNAs (vsiRNAs). The identified vsiRNAs can potently repress HIV-1 production, whereas suppression of the vsiRNAs by antagomirs stimulate virus production. These results suggest that HIV-1 triggers the production of vsiRNAs and vmiRNAs to modulate cellular and/or viral gene expression.}, - language = {en}, - number = {1}, - urldate = {2013-10-29}, - journal = {Nucleic Acids Research}, - author = {Schopman, Nick C. T. and Willemsen, Marcel and Liu, Ying Poi and Bradley, Ted and Kampen, Antoine van and Baas, Frank and Berkhout, Ben and Haasnoot, Joost}, - month = jan, - year = {2012}, - pmid = {21911362}, - pages = {414--427}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XZR4KJP2/Schopman et al. - 2012 - Deep sequencing of virus-infected cells reveals HI.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/833FA4M8/414.html:text/html} -} - -@article{schones_dynamic_2008, - title = {Dynamic {Regulation} of {Nucleosome} {Positioning} in the {Human} {Genome}}, - volume = {132}, - issn = {0092-8674}, - url = {http://www.sciencedirect.com/science/article/pii/S0092867408002705}, - doi = {10.1016/j.cell.2008.02.022}, - abstract = {The positioning of nucleosomes with respect to DNA plays an important role in regulating transcription. However, nucleosome mapping has been performed for only limited genomic regions in humans. We have generated genome-wide maps of nucleosome positions in both resting and activated human CD4+ T cells by direct sequencing of nucleosome ends using the Solexa high-throughput sequencing technique. We find that nucleosome phasing relative to the transcription start sites is directly correlated to RNA polymerase II (Pol II) binding. Furthermore, the first nucleosome downstream of a start site exhibits differential positioning in active and silent genes. TCR signaling induces extensive nucleosome reorganization in promoters and enhancers to allow transcriptional activation or repression. Our results suggest that H2A.Z-containing and modified nucleosomes are preferentially lost from the −1 nucleosome position. Our data provide a comprehensive view of the nucleosome landscape and its dynamic regulation in the human genome.}, - number = {5}, - urldate = {2014-03-05}, - journal = {Cell}, - author = {Schones, Dustin E. and Cui, Kairong and Cuddapah, Suresh and Roh, Tae-Young and Barski, Artem and Wang, Zhibin and Wei, Gang and Zhao, Keji}, - month = mar, - year = {2008}, - keywords = {DNA, SIGNALING}, - pages = {887--898}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7APGCGXA/Schones et al. - 2008 - Dynamic Regulation of Nucleosome Positioning in th.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/52FSKUHE/S0092867408002705.html:text/html} -} - -@article{cohen_understanding_2011, - title = {Understanding {HIV} latency to undo it}, - volume = {332}, - issn = {1095-9203}, - doi = {10.1126/science.332.6031.786}, - language = {eng}, - number = {6031}, - journal = {Science (New York, N.Y.)}, - author = {Cohen, Jon}, - month = may, - year = {2011}, - pmid = {21566174}, - keywords = {Animals, CD4-Positive T-Lymphocytes, Chromosomes, Human, DNA Methylation, DNA, Viral, HIV, HIV Infections, Histone Deacetylase Inhibitors, Humans, Immunologic Memory, Lymphocyte Activation, Transcription Factors, Transcription, Genetic, Virus Integration, Virus Latency}, - pages = {786} -} - -@article{sepkowitz_aids_2001, - title = {{AIDS} — {The} {First} 20 {Years}}, - volume = {344}, - issn = {0028-4793}, - url = {http://www.nejm.org/doi/full/10.1056/NEJM200106073442306}, - doi = {10.1056/NEJM200106073442306}, - abstract = {The disease now known as the acquired immunodeficiency syndrome, or AIDS, was first reported 20 years ago this week in the Morbidity and Mortality Weekly Report under the quiet title “Pneumocystis pneumonia — Los Angeles.”1 The description was not the lead article; that distinction went to a report of dengue infections in vacationers returning to the United States from the Caribbean. Not even the most pessimistic reader could have anticipated the scope and scale the epidemic would assume two decades later. By December 2000, 21.8 million people worldwide had died of the disease, including more Americans (438,795) than died . . .}, - number = {23}, - urldate = {2013-11-09}, - journal = {New England Journal of Medicine}, - author = {Sepkowitz, Kent A.}, - year = {2001}, - pmid = {11396444}, - pages = {1764--1772}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/63EINV5G/Sepkowitz - 2001 - AIDS — The First 20 Years.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/TCE5JQKE/NEJM200106073442306.html:text/html} -} - -@article{jin_h3.3/h2a.z_2009, - title = {H3.3/{H}2A.{Z} double variant–containing nucleosomes mark 'nucleosome-free regions' of active promoters and other regulatory regions}, - volume = {41}, - copyright = {© 2009 Nature Publishing Group}, - issn = {1061-4036}, - url = {http://www.nature.com/ng/journal/v41/n8/full/ng.409.html}, - doi = {10.1038/ng.409}, - abstract = {To understand how chromatin structure is organized by different histone variants, we have measured the genome-wide distribution of nucleosome core particles (NCPs) containing the histone variants H3.3 and H2A.Z in human cells. We find that a special class of NCPs containing both variants is enriched at 'nucleosome-free regions' of active promoters, enhancers and insulator regions. We show that preparative methods used previously in studying nucleosome structure result in the loss of these unstable double-variant NCPs. It seems likely that this instability facilitates the access of transcription factors to promoters and other regulatory sites in vivo. Other combinations of variants have different distributions, consistent with distinct roles for histone variants in the modulation of gene expression.}, - language = {en}, - number = {8}, - urldate = {2014-03-05}, - journal = {Nature Genetics}, - author = {Jin, Chunyuan and Zang, Chongzhi and Wei, Gang and Cui, Kairong and Peng, Weiqun and Zhao, Keji and Felsenfeld, Gary}, - month = aug, - year = {2009}, - pages = {941--945}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/AI6WKGI2/Jin et al. - 2009 - H3.3H2A.Z double variant–containing nucleosomes m.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/VJ3XNXDF/ng.409.html:text/html} -} - -@article{hoch_proteinprotein_2007, - title = {Protein–{Protein} {Förster} {Resonance} {Energy} {Transfer} {Analysis} of {Nucleosome} {Core} {Particles} {Containing} {H}2A and {H}2A.{Z}}, - volume = {371}, - issn = {0022-2836}, - url = {http://www.sciencedirect.com/science/article/pii/S0022283607007140}, - doi = {10.1016/j.jmb.2007.05.075}, - abstract = {A protein–protein Förster resonance energy transfer (FRET) system, employing probes at multiple positions, was designed to specifically monitor the dissociation of the H2A–H2B dimer from the nucleosome core particle (NCP). Tryptophan donors and Cys-AEDANS acceptors were chosen because, compared to previous NCP FRET fluorophores, they: (1) are smaller and less hydrophobic, which should minimize perturbations of histone and NCP structure; and (2) have an R0 of 20 Å, which is much less than the dimensions of the NCP (∼ 50 Å width and ∼ 100 Å diameter). Equilibrium protein unfolding titrations indicate that the donor and acceptor moieties have minimal effects on the stability of the H2A–H2B dimer and (H3–H4)2 tetramer. NCPs containing the various FRET pairs were reconstituted with the 601 DNA positioning element. Equilibrium NaCl-induced dissociation of the modified NCPs showed that the 601 sequence stabilized the NCP to dimer dissociation relative to weaker positioning sequences. This finding implies a significant role for the H2A–H2B dimers in determining the DNA sequence dependence of NCP stability. The free energy of dissociation determined from reversible and well-defined sigmoidal transitions revealed two distinct phases reflecting the dissociation of individual H2A–H2B dimers, confirming cooperativity as suggested previously; these data allow quantitative description of the cooperativity. The FRET system was then used to study the effects of the histone variant H2A.Z on NCP stability; previous studies have reported both destabilizing and stabilizing effects. H2A.Z FRET NCP dissociation transitions suggest a slight increase in stability but a significant increase in cooperativity of the dimer dissociations. Thus, the utility of this protein–protein FRET system to monitor the effects of histone variants on NCP dynamics has been demonstrated, and the system appears equally well-suited for dissection of the kinetic processes of dimer association and dissociation from the NCP.}, - number = {4}, - urldate = {2014-04-14}, - journal = {Journal of Molecular Biology}, - author = {Hoch, Duane A. and Stratton, Jessica J. and Gloss, Lisa M.}, - month = aug, - year = {2007}, - keywords = {Chromatin, FRET, Histone variants, fluorescence, thermodynamics}, - pages = {971--988}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/B54HUM4W/Hoch et al. - 2007 - Protein–Protein Förster Resonance Energy Transfer .pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/5CE6546R/S0022283607007140.html:text/html} -} - -@article{cao_cessation_2009, - title = {Cessation of {HIV}-1 {Transcription} by {Inhibiting} {Regulatory} {Protein} {Rev}- {Mediated} {RNA} {Transport}}, - volume = {7}, - issn = {1570162X}, - url = {http://www.eurekaselect.com/93073/article}, - doi = {10.2174/157016209787048564}, - number = {1}, - urldate = {2013-11-10}, - journal = {Current HIV Research}, - author = {Cao, Yuan and Liu, Xinyong and De Clercq, Erik}, - month = jan, - year = {2009}, - pages = {101--108}, - file = {Cessation of HIV-1 Transcription by Inhibiting Regulatory Protein Rev- Mediated RNA Transport | BenthamScience:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RKET5IZR/article.html:text/html} -} - -@article{meng_wrapping_2013, - title = {Wrapping up the bad news - {HIV} assembly and release}, - volume = {10}, - issn = {1742-4690}, - url = {http://www.ncbi.nlm.nih.gov/pmc/articles/PMC3558412/}, - doi = {10.1186/1742-4690-10-5}, - abstract = {The late Nobel Laureate Sir Peter Medawar once memorably described viruses as ‘bad news wrapped in protein’. Virus assembly in HIV is a remarkably well coordinated process in which the virus achieves extracellular budding using primarily intracellular budding machinery and also the unusual phenomenon of export from the cell of an RNA. Recruitment of the ESCRT system by HIV is one of the best documented examples of the comprehensive way in which a virus hijacks a normal cellular process. This review is a summary of our current understanding of the budding process of HIV, from genomic RNA capture through budding and on to viral maturation, but centering on the proteins of the ESCRT pathway and highlighting some recent advances in our understanding of the cellular components involved and the complex interplay between the Gag protein and the genomic RNA.}, - urldate = {2013-11-10}, - journal = {Retrovirology}, - author = {Meng, Bo and Lever, Andrew ML}, - month = jan, - year = {2013}, - pmid = {23305486}, - pmcid = {PMC3558412}, - pages = {5}, - file = {PubMed Central Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/KBJ57DXC/Meng et Lever - 2013 - Wrapping up the bad news - HIV assembly and releas.pdf:application/pdf} -} - -@article{hakre_hiv_2012, - title = {{HIV} latency: experimental systems and molecular models}, - volume = {36}, - issn = {1574-6976}, - shorttitle = {{HIV} latency}, - doi = {10.1111/j.1574-6976.2012.00335.x}, - abstract = {Highly active antiretroviral therapy (HAART) has shown great efficacy in increasing the survival of HIV infected individuals. However, HAART does not lead to the full eradication of infection and therefore has to be continued for life. HIV persists in a transcriptionally inactive form in resting T cells in HAART-treated patients and can be reactivated following T-cell activation. These latently infected cells allow the virus to persist in the presence of HAART. Here, we review recent advances in the study of the molecular mechanisms of HIV latency. We also review experimental models in which latency is currently studied. We focus on the epigenetic mechanisms controlling HIV transcription and on the role of chromatin and its post-translational modifications. We discuss how small molecule inhibitors that target epigenetic regulators, such as HDAC (histone deacetylase) inhibitors, are being tested for their ability to reactivate latent HIV. Finally, we discuss the clinical potential of these drugs to flush out latently infected cells from HIV-infected patients and to eradicate the virus.}, - language = {eng}, - number = {3}, - journal = {FEMS microbiology reviews}, - author = {Hakre, Shweta and Chavez, Leonard and Shirakawa, Kotaro and Verdin, Eric}, - month = may, - year = {2012}, - pmid = {22372374}, - keywords = {Gene Expression Regulation, Viral, HIV, HIV Infections, Host-Pathogen Interactions, Humans, Models, Molecular, T-Lymphocytes, Virus Activation, Virus Latency}, - pages = {706--716} -} - -@article{nozaki_tight_2011, - title = {Tight associations between transcription promoter type and epigenetic variation in histone positioning and modification}, - volume = {12}, - copyright = {2011 Nozaki et al; licensee BioMed Central Ltd.}, - issn = {1471-2164}, - url = {http://www.biomedcentral.com/1471-2164/12/416/abstract}, - doi = {10.1186/1471-2164-12-416}, - abstract = {PMID: 21846408}, - language = {en}, - number = {1}, - urldate = {2015-04-17}, - journal = {BMC Genomics}, - author = {Nozaki, Tadasu and Yachie, Nozomu and Ogawa, Ryu and Kratz, Anton and Saito, Rintaro and Tomita, Masaru}, - month = aug, - year = {2011}, - pmid = {21846408}, - pages = {416}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/5NVIJMZH/Nozaki et al. - 2011 - Tight associations between transcription promoter .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4R8FAQ3F/416.html:text/html} -} - -@article{hammond_dicing_2005, - title = {Dicing and slicing: {The} core machinery of the {RNA} interference pathway}, - volume = {579}, - issn = {0014-5793}, - shorttitle = {Dicing and slicing}, - url = {http://www.sciencedirect.com/science/article/pii/S0014579305010884}, - doi = {10.1016/j.febslet.2005.08.079}, - abstract = {RNA interference (RNAi) is broadly defined as a gene silencing pathway that is triggered by double-stranded RNA (dsRNA). Many variations have been described on this theme. The dsRNA trigger can be supplied exogenously, as an experimental tool, or can derive from the genome in the form of microRNAs. Gene silencing can be the result of nucleolytic degradation of the mRNA, or by translational suppression. At the heart of the pathway are two ribonuclease machines. The ribonuclease III enzyme Dicer initiates the RNAi pathway by generating the active short interfering RNA trigger. Silencing is effected by the RNA-induced silencing complex and its RNaseH core enzyme Argonaute. This review describes the discovery of these machines and discusses future lines of work on this amazing biochemical pathway.}, - number = {26}, - urldate = {2013-10-13}, - journal = {FEBS Letters}, - author = {Hammond, Scott M.}, - month = oct, - year = {2005}, - keywords = {Argonaute, Dicer, Drosha, RNA interference, RNA-induced silencing complex, Slicer, miRNA, microRNA}, - pages = {5822--5829} -} - -@article{karn_transcriptional_2012, - title = {Transcriptional and {Posttranscriptional} {Regulation} of {HIV}-1 {Gene} {Expression}}, - volume = {2}, - issn = {, 2157-1422}, - url = {http://perspectivesinmedicine.cshlp.org/content/2/2/a006916}, - doi = {10.1101/cshperspect.a006916}, - abstract = {Control of HIV-1 gene expression depends on two viral regulatory proteins, Tat and Rev. Tat stimulates transcription elongation by directing the cellular transcriptional elongation factor P-TEFb to nascent RNA polymerases. Rev is required for the transport from the nucleus to the cytoplasm of the unspliced and incompletely spliced mRNAs that encode the structural proteins of the virus. Molecular studies of both proteins have revealed how they interact with the cellular machinery to control transcription from the viral LTR and regulate the levels of spliced and unspliced mRNAs. The regulatory feedback mechanisms driven by HIV-1 Tat and Rev ensure that HIV-1 transcription proceeds through distinct phases. In cells that are not fully activated, limiting levels of Tat and Rev act as potent blocks to premature virus production.}, - language = {en}, - number = {2}, - urldate = {2013-11-05}, - journal = {Cold Spring Harbor Perspectives in Medicine}, - author = {Karn, Jonathan and Stoltzfus, C. Martin}, - month = feb, - year = {2012}, - pmid = {22355797}, - pages = {a006916}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/U7JATSTA/Karn et Stoltzfus - 2012 - Transcriptional and Posttranscriptional Regulation.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/87DUXV2J/a006916.html:text/html} -} - -@article{ahluwalia_human_2008, - title = {Human cellular {microRNA} hsa-{miR}-29a interferes with viral nef protein expression and {HIV}-1 replication}, - volume = {5}, - copyright = {2008 Ahluwalia et al; licensee BioMed Central Ltd.}, - issn = {1742-4690}, - url = {http://www.retrovirology.com/content/5/1/117/abstract}, - doi = {10.1186/1742-4690-5-117}, - abstract = {Cellular miRNAs play an important role in the regulation of gene expression in eukaryotes. Recently, miRNAs have also been shown to be able to target and inhibit viral gene expression. Computational predictions revealed earlier that the HIV-1 genome includes regions that may be potentially targeted by human miRNAs. Here we report the functionality of predicted miR-29a target site in the HIV-1 nef gene.}, - language = {en}, - number = {1}, - urldate = {2013-10-08}, - journal = {Retrovirology}, - author = {Ahluwalia, Jasmine K. and Khan, Sohrab Z. and Soni, Kartik and Rawat, Pratima and Gupta, Ankit and Hariharan, Manoj and Scaria, Vinod and Lalwani, Mukesh and Pillai, Beena and Mitra, Debashis and Brahmachari, Samir K.}, - month = dec, - year = {2008}, - pmid = {19102781}, - pages = {117}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/8DARZ6TW/Ahluwalia et al. - 2008 - Human cellular microRNA hsa-miR-29a interferes wit.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7ERRBEWR/117.html:text/html} -} - -@article{swaminathan_mirnas_2013, - title = {{miRNAs} and {HIV}: unforeseen determinants of host-pathogen interaction}, - volume = {254}, - issn = {1600-065X}, - shorttitle = {{miRNAs} and {HIV}}, - doi = {10.1111/imr.12077}, - abstract = {Our understanding of the complexity of gene regulation has significantly improved in the last decade as the role of small non-coding RNAs, called microRNAs (miRNAs), has been appreciated. These 19-22 nucleotide RNA molecules are critical regulators of mRNA translation and turnover. The miRNAs bind via a protein complex to the 3' untranslated region (3' UTR) of mRNA, ultimately leading to mRNA translational inhibition, degradation, or repression. Although many mechanisms by which human immunodeficiency virus-1 (HIV-1) infection eventually induces catastrophic immune destruction have been elucidated, the important role that miRNAs play in HIV-1 pathogenesis is only now emerging. Accumulating evidence demonstrates that changes to endogenous miRNA levels following infection is important: in maintaining HIV-1 latency in resting CD4(+) T cells, potentially affect immune function via changes to cytokines such as interleukin-2 (IL-2) and IL-10 and may predict disease progression. We review the roles that both viral and host miRNAs play in different cell types and disease conditions that are important in HIV-1 infection and discuss how miRNAs affect key immunomodulatory molecules contributing to immune dysfunction. Further, we discuss whether miRNAs may be used as novel biomarkers in serum and the potential to modulate miRNA levels as a unique approach to combating this pathogen.}, - language = {eng}, - number = {1}, - journal = {Immunological reviews}, - author = {Swaminathan, Sanjay and Murray, Daniel D and Kelleher, Anthony D}, - month = jul, - year = {2013}, - pmid = {23772625}, - pages = {265--280} -} - -@article{skene_histone_2013, - title = {Histone variants in pluripotency and disease}, - volume = {140}, - issn = {0950-1991, 1477-9129}, - url = {http://dev.biologists.org/content/140/12/2513}, - doi = {10.1242/dev.091439}, - abstract = {Most histones are assembled into nucleosomes during replication to package genomic DNA. However, several variant histones are deposited independently of replication at particular regions of chromosomes. Such histone variants include cenH3, which forms the nucleosomal foundation for the centromere, and H3.3, which replaces histones that are lost during dynamic processes that disrupt nucleosomes. Furthermore, various H2A variants participate in DNA repair, gene regulation and other processes that are, as yet, not fully understood. Here, we review recent studies that have implicated histone variants in maintaining pluripotency and as causal factors in cancer and other diseases.}, - language = {en}, - number = {12}, - urldate = {2014-04-16}, - journal = {Development}, - author = {Skene, Peter J. and Henikoff, Steven}, - month = jun, - year = {2013}, - pmid = {23715545}, - keywords = {Disease, Histone chaperone, Histone variant, Nucleosome dynamics, Reprogramming}, - pages = {2513--2524}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Q8GVCZFX/Skene et Henikoff - 2013 - Histone variants in pluripotency and disease.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/U8M5KR66/2513.html:text/html} -} - -@article{dudley_quick_2009, - title = {A {Quick} {Guide} for {Developing} {Effective} {Bioinformatics} {Programming} {Skills}}, - volume = {5}, - url = {http://dx.doi.org/10.1371/journal.pcbi.1000589}, - doi = {10.1371/journal.pcbi.1000589}, - number = {12}, - urldate = {2014-05-23}, - journal = {PLoS Comput Biol}, - author = {Dudley, Joel T. and Butte, Atul J.}, - month = dec, - year = {2009}, - pages = {e1000589}, - file = {PLoS Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RPAJ8GQ4/Dudley et Butte - 2009 - A Quick Guide for Developing Effective Bioinformat.pdf:application/pdf;PLoS Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/PZ77CNI9/infodoi10.1371journal.pcbi.html:text/html} -} - -@article{harris_restriction_2012, - title = {The {Restriction} {Factors} of {Human} {Immunodeficiency} {Virus}}, - volume = {287}, - issn = {0021-9258, 1083-351X}, - url = {http://www.jbc.org/content/287/49/40875}, - doi = {10.1074/jbc.R112.416925}, - abstract = {Cellular proteins called “restriction factors” can serve as powerful blockades to HIV replication, but the virus possesses elaborate strategies to circumvent these barriers. First, we discuss general hallmarks of a restriction factor. Second, we review how the viral Vif protein protects the viral genome from lethal levels of cDNA deamination by promoting APOBEC3 protein degradation; how the viral Vpu, Env, and Nef proteins facilitate internalization and degradation of the virus-tethering protein BST-2/tetherin; and how the viral Vpx protein prevents the premature termination of reverse transcription by degrading the dNTPase SAMHD1. These HIV restriction and counter-restriction mechanisms suggest strategies for new therapeutic interventions.}, - language = {en}, - number = {49}, - urldate = {2013-10-04}, - journal = {Journal of Biological Chemistry}, - author = {Harris, Reuben S. and Hultquist, Judd F. and Evans, David T.}, - month = nov, - year = {2012}, - pmid = {23043100}, - keywords = {Host Defense, Host-Pathogen Interactions, Human Immunodeficiency Virus, Innate Immunity, Restriction Factors, Reverse Transcription}, - pages = {40875--40883}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/G3HGJJCZ/Harris et al. - 2012 - The Restriction Factors of Human Immunodeficiency .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4JFPI475/40875.html:text/html} -} - -@article{marques_reconciling_2010, - title = {Reconciling the positive and negative roles of histone {H}2A.{Z} in gene transcription}, - volume = {5}, - issn = {1559-2294, 1559-2308}, - url = {http://www.landesbioscience.com/journals/epigenetics/article/11520/}, - doi = {10.4161/epi.5.4.11520}, - abstract = {The incorporation of variant histone H2A.Z within chromatin is important for proper gene expression and genome stability. H2A.Z is inserted at discrete loci by the Swr1 or Swr1-like remodeling complexes, although very little is known about the nature of the targeting mechanism involved. Replacement of canonical histone H2A for H2A.Z has been shown to modify nucleosome dynamics, although discrepancies still exist in the literature regarding the mechanisms. Recent experiments have shown that H2A.Z can allow nucleosomes to adopt stable translational positions as compared to H2A, which could influence the accessibility to DNA regulatory proteins. This review provides a brief overview of H2A.Z biology and presents hypotheses that could reconcile contradictory reports that are found in the literature regarding the influence of H2A.Z on nucleosome stability.}, - number = {4}, - urldate = {2014-02-19}, - journal = {Epigenetics}, - author = {Marques, Maud and Laflamme, Liette and Gervais, Alain L. and Gaudreau, Luc}, - month = may, - year = {2010}, - pages = {267--272}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/SU4GJHVE/Marques et al. - 2010 - Reconciling the positive and negative roles of his.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6MCFD43G/11520.html:text/html} -} - -@article{huttenhower_quick_2010, - title = {A {Quick} {Guide} to {Large}-{Scale} {Genomic} {Data} {Mining}}, - volume = {6}, - url = {http://dx.doi.org/10.1371/journal.pcbi.1000779}, - doi = {10.1371/journal.pcbi.1000779}, - number = {5}, - urldate = {2014-05-23}, - journal = {PLoS Comput Biol}, - author = {Huttenhower, Curtis and Hofmann, Oliver}, - month = may, - year = {2010}, - pages = {e1000779}, - file = {PLoS Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/SCPU2DAS/Huttenhower et Hofmann - 2010 - A Quick Guide to Large-Scale Genomic Data Mining.pdf:application/pdf;PLoS Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/QRPDTJBJ/infodoi10.1371journal.pcbi.html:text/html} -} - -@article{eglen_quick_2009, - title = {A {Quick} {Guide} to {Teaching} {R} {Programming} to {Computational} {Biology} {Students}}, - volume = {5}, - url = {http://dx.doi.org/10.1371/journal.pcbi.1000482}, - doi = {10.1371/journal.pcbi.1000482}, - number = {8}, - urldate = {2014-05-23}, - journal = {PLoS Comput Biol}, - author = {Eglen, Stephen J.}, - month = aug, - year = {2009}, - pages = {e1000482}, - file = {PLoS Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HFVHV7M9/Eglen - 2009 - A Quick Guide to Teaching R Programming to Computa.pdf:application/pdf;PLoS Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/NURQW9GE/infodoi10.1371journal.pcbi.html:text/html} -} - -@article{coleman-derr_dna_2012, - title = {{DNA} {Methylation}, {H}2A.{Z}, and the {Regulation} of {Constitutive} {Expression}}, - volume = {77}, - issn = {0091-7451, 1943-4456}, - url = {http://symposium.cshlp.org/content/77/147}, - doi = {10.1101/sqb.2012.77.014944}, - abstract = {The most well-studied function of DNA methylation in eukaryotic cells is the transcriptional silencing of genes and transposons. More recent results showed that many eukaryotes methylate the bodies of genes as well and that this methylation correlates with transcriptional activity rather than repression. The purpose of gene body methylation remains mysterious, but is potentially related to the histone variant H2A.Z. Studies in plants and animals have shown that the genome-wide distributions of H2A.Z and DNA methylation are strikingly anticorrelated. Furthermore, we and other investigators have shown that this relationship is likely to be the result of an ancient but unknown mechanism by which DNA methylation prevents the incorporation of H2A.Z. Recently, we discovered strong correlations between the presence of H2A.Z within gene bodies, the degree to which a gene's expression varies across tissue types or environmental conditions, and transcriptional misregulation in an h2a.z mutant. We propose that one basal function of gene body methylation is the establishment of constitutive expression patterns within housekeeping genes by excluding H2A.Z from their bodies.}, - language = {en}, - urldate = {2014-04-16}, - journal = {Cold Spring Harbor Symposia on Quantitative Biology}, - author = {Coleman-Derr, D. and Zilberman, D.}, - month = jan, - year = {2012}, - pmid = {23250988}, - pages = {147--154}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9T2N953U/Coleman-Derr et Zilberman - 2012 - DNA Methylation, H2A.Z, and the Regulation of Cons.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/G7PFBIXV/147.html:text/html} -} - -@article{lewis_conserved_2005, - title = {Conserved {Seed} {Pairing}, {Often} {Flanked} by {Adenosines}, {Indicates} that {Thousands} of {Human} {Genes} are {MicroRNA} {Targets}}, - volume = {120}, - issn = {0092-8674}, - url = {http://www.sciencedirect.com/science/article/pii/S0092867404012607}, - doi = {10.1016/j.cell.2004.12.035}, - abstract = {We predict regulatory targets of vertebrate microRNAs (miRNAs) by identifying mRNAs with conserved complementarity to the seed (nucleotides 2–7) of the miRNA. An overrepresentation of conserved adenosines flanking the seed complementary sites in mRNAs indicates that primary sequence determinants can supplement base pairing to specify miRNA target recognition. In a four-genome analysis of 3′ UTRs, approximately 13,000 regulatory relationships were detected above the estimate of false-positive predictions, thereby implicating as miRNA targets more than 5300 human genes, which represented 30\% of our gene set. Targeting was also detected in open reading frames. In sum, well over one third of human genes appear to be conserved miRNA targets.}, - number = {1}, - urldate = {2013-12-13}, - journal = {Cell}, - author = {Lewis, Benjamin P. and Burge, Christopher B. and Bartel, David P.}, - month = jan, - year = {2005}, - pages = {15--20}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6RAPJJQT/Lewis et al. - 2005 - Conserved Seed Pairing, Often Flanked by Adenosine.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/VJ6RPA6K/S0092867404012607.html:text/html} -} - -@article{aqil_hiv-1_2013, - title = {The {HIV}-1 {Nef} {Protein} {Binds} {Argonaute}-2 and {Functions} as a {Viral} {Suppressor} of {RNA} {Interference}}, - volume = {8}, - url = {http://dx.doi.org/10.1371/journal.pone.0074472}, - doi = {10.1371/journal.pone.0074472}, - abstract = {The HIV-1 accessory protein Nef is an important virulence factor. It associates with cellular membranes and modulates the endocytic machinery and signaling pathways. Nef also increases the proliferation of multivesicular bodies (MVBs), which are sites for virus assembly and budding in macrophages. The RNA interference (RNAi) pathway proteins Ago2 and GW182 localize to MVBs, suggesting these to be sites for assembly and turnover of the miRNA-induced silencing complex (miRISC). While RNAi affects HIV replication, it is not clear if the virus encodes a suppressor activity to overcome this innate host response. Here we show that Nef colocalizes with MVBs and binds Ago2 through two highly conserved Glycine-Tryptophan (GW) motifs, mutations in which abolish Nef binding to Ago2 and reduce virus yield and infectivity. Nef also inhibits the slicing activity of Ago2 and disturbs the sorting of GW182 into exosomes resulting in the suppression of miRNA-induced silencing. Thus, besides its other activities, the HIV-1 Nef protein is also proposed to function as a viral suppressor of RNAi (VSR).}, - number = {9}, - urldate = {2013-10-12}, - journal = {PLoS ONE}, - author = {Aqil, Madeeha and Naqvi, Afsar Raza and Bano, Aalia Shahr and Jameel, Shahid}, - month = sep, - year = {2013}, - pages = {e74472}, - file = {PLoS Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/EBR3H4NB/Aqil et al. - 2013 - The HIV-1 Nef Protein Binds Argonaute-2 and Functi.pdf:application/pdf;PLoS Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/2ACANUMU/infodoi10.1371journal.pone.html:text/html} -} - -@article{schopman_selective_2012, - title = {Selective packaging of cellular {miRNAs} in {HIV}-1 particles}, - volume = {169}, - issn = {0168-1702}, - url = {http://www.sciencedirect.com/science/article/pii/S0168170212002146}, - doi = {10.1016/j.virusres.2012.06.017}, - abstract = {Retroviral particles are known to package specific host cell components such as RNA molecules in addition to the two copies of the viral RNA genome. The highly sensitive SOLiD sequencing technology was used to determine the cellular miRNA content of human immunodeficiency virus type 1 (HIV-1) particles. We determined the relative concentration of cellular miRNAs in a T cell line and several primary cell subsets before and after HIV-1 infection, and compared those values to the miRNA content of virion particles. A small subset of the cellular miRNAs is dramatically concentrated in the virions up to 115 fold, suggesting a biological function in HIV-1 replication.}, - number = {2}, - urldate = {2013-10-29}, - journal = {Virus Research}, - author = {Schopman, Nick C.T. and van Montfort, Thijs and Willemsen, Marcel and Knoepfel, Stefanie A. and Pollakis, Georgios and van Kampen, Antoine and Sanders, Rogier W. and Haasnoot, Joost and Berkhout, Ben}, - month = nov, - year = {2012}, - keywords = {Deep sequencing, HIV-1, RNA interference, Virion, miRNA}, - pages = {438--447}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/M8WGAF7M/Schopman et al. - 2012 - Selective packaging of cellular miRNAs in HIV-1 pa.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/D774RJ2M/S0168170212002146.html:text/html} -} - -@article{chiang_mir-132_2013, - title = {{miR}-132 enhances {HIV}-1 replication}, - volume = {438}, - issn = {0042-6822}, - url = {http://www.sciencedirect.com/science/article/pii/S0042682213000056}, - doi = {10.1016/j.virol.2012.12.016}, - abstract = {MicroRNAs upregulated during CD4+ T cell activation may contribute to the increased efficiency of HIV-1 replication seen following perturbation of the resting state. We have found miR-132 to be highly upregulated following CD4+ T cell activation, and show that miR-132 potentiates viral replication in the Jurkat CD4+ T cell line. Knockdown of MeCP2, a previously identified target of miR-132, also increases HIV-1 replication. To the best of our knowledge, miR-132 is the first miRNA reported to enhance HIV-1 replication.}, - number = {1}, - urldate = {2013-10-08}, - journal = {Virology}, - author = {Chiang, Karen and Liu, Hongbing and Rice, Andrew P.}, - month = mar, - year = {2013}, - keywords = {HIV, MeCP2, miR-132, microRNA}, - pages = {1--4}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/KBR4ZPEW/Chiang et al. - 2013 - miR-132 enhances HIV-1 replication.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/DP2VX65F/S0042682213000056.html:text/html} -} - -@article{durand_developing_2012, - title = {Developing strategies for {HIV}-1 eradication}, - volume = {33}, - issn = {1471-4906}, - url = {http://www.sciencedirect.com/science/article/pii/S1471490612001123}, - doi = {10.1016/j.it.2012.07.001}, - abstract = {Highly active antiretroviral therapy (HAART) suppresses HIV-1 replication, transforming the outlook for infected patients. However, reservoirs of replication-competent forms of the virus persist during HAART, and when treatment is stopped, high rates of HIV-1 replication return. Recent insights into HIV-1 latency, as well as a report that HIV-1 infection was eradicated in one individual, have renewed interest in finding a cure for HIV-1 infection. Strategies for HIV-1 eradication include gene therapy and hematopoietic stem cell transplantation, stimulating host immunity to control HIV-1 replication, and targeting latent HIV-1 in resting memory CD4+ T cells. Future efforts should aim to provide better understanding of how to reconstitute the CD4+ T cell compartment with genetically engineered cells, exert immune control over HIV-1 replication, and identify and eliminate all viral reservoirs.}, - number = {11}, - urldate = {2013-11-09}, - journal = {Trends in Immunology}, - author = {Durand, Christine M. and Blankson, Joel N. and Siliciano, Robert F.}, - month = nov, - year = {2012}, - keywords = {HIV-1, cure, eradication, latency, reservoir}, - pages = {554--562}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ZWIQSEHV/Durand et al. - 2012 - Developing strategies for HIV-1 eradication.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/JV7E2XEH/S1471490612001123.html:text/html} -} - -@article{schattner_automated_2007, - title = {Automated {Querying} of {Genome} {Databases}}, - volume = {3}, - url = {http://dx.doi.org/10.1371/journal.pcbi.0030001}, - doi = {10.1371/journal.pcbi.0030001}, - number = {1}, - urldate = {2014-05-23}, - journal = {PLoS Comput Biol}, - author = {Schattner, Peter}, - month = jan, - year = {2007}, - pages = {e1}, - file = {PLoS Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/E74IT5S8/Schattner - 2007 - Automated Querying of Genome Databases.pdf:application/pdf;PLoS Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/D484W82K/infodoi10.1371journal.pcbi.html:text/html} -} - -@article{valdes-mora_acetylation_2012, - title = {Acetylation of {H}2A.{Z} is a key epigenetic modification associated with gene deregulation and epigenetic remodeling in cancer}, - volume = {22}, - issn = {1088-9051}, - url = {http://www.ncbi.nlm.nih.gov/pmc/articles/PMC3266038/}, - doi = {10.1101/gr.118919.110}, - abstract = {Histone H2A.Z (H2A.Z) is an evolutionarily conserved H2A variant implicated in the regulation of gene expression; however, its role in transcriptional deregulation in cancer remains poorly understood. Using genome-wide studies, we investigated the role of promoter-associated H2A.Z and acetylated H2A.Z (acH2A.Z) in gene deregulation and its relationship with DNA methylation and H3K27me3 in prostate cancer. Our results reconcile the conflicting reports of positive and negative roles for histone H2A.Z and gene expression states. We find that H2A.Z is enriched in a bimodal distribution at nucleosomes, surrounding the transcription start sites (TSSs) of both active and poised gene promoters. In addition, H2A.Z spreads across the entire promoter of inactive genes in a deacetylated state. In contrast, acH2A.Z is only localized at the TSSs of active genes. Gene deregulation in cancer is also associated with a reorganization of acH2A.Z and H2A.Z nucleosome occupancy across the promoter region and TSS of genes. Notably, in cancer cells we find that a gain of acH2A.Z at the TSS occurs with an overall decrease of H2A.Z levels, in concert with oncogene activation. Furthermore, deacetylation of H2A.Z at TSSs is increased with silencing of tumor suppressor genes. We also demonstrate that acH2A.Z anti-correlates with promoter H3K27me3 and DNA methylation. We show for the first time, that acetylation of H2A.Z is a key modification associated with gene activity in normal cells and epigenetic gene deregulation in tumorigenesis.}, - number = {2}, - urldate = {2014-03-05}, - journal = {Genome Research}, - author = {Valdes-Mora, Fatima and Song, Jenny Z. and Statham, Aaron L. and Strbenac, Dario and Robinson, Mark D. and Nair, Shalima S. and Patterson, Kate I. and Tremethick, David J. and Stirzaker, Clare and Clark, Susan J.}, - month = feb, - year = {2012}, - pmid = {21788347}, - pmcid = {PMC3266038}, - pages = {307--321}, - file = {PubMed Central Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/89W78E3A/Valdes-Mora et al. - 2012 - Acetylation of H2A.Z is a key epigenetic modificat.pdf:application/pdf} -} - -@article{rissman_reordering_2009, - title = {Reordering contigs of draft genomes using the {Mauve} {Aligner}}, - volume = {25}, - issn = {1367-4803}, - url = {http://www.ncbi.nlm.nih.gov/pmc/articles/PMC2723005/}, - doi = {10.1093/bioinformatics/btp356}, - abstract = {Summary: Mauve Contig Mover provides a new method for proposing the relative order of contigs that make up a draft genome based on comparison to a complete or draft reference genome. A novel application of the Mauve aligner and viewer provides an automated reordering algorithm coupled with a powerful drill-down display allowing detailed exploration of results., Availability: The software is available for download at http://gel.ahabs.wisc.edu/mauve., Contact: rissman@wisc.edu, Supplementary information: Supplementary data are available at Bioinformatics online and http://gel.ahabs.wisc.edu}, - number = {16}, - urldate = {2014-05-25}, - journal = {Bioinformatics}, - author = {Rissman, Anna I. and Mau, Bob and Biehl, Bryan S. and Darling, Aaron E. and Glasner, Jeremy D. and Perna, Nicole T.}, - month = aug, - year = {2009}, - pmid = {19515959}, - pmcid = {PMC2723005}, - pages = {2071--2073}, - file = {PubMed Central Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6JKVSJAU/Rissman et al. - 2009 - Reordering contigs of draft genomes using the Mauv.pdf:application/pdf} -} - -@article{ouellet_regulation_2013, - title = {Regulation of host gene expression by {HIV}-1 {TAR} {microRNAs}}, - volume = {10}, - copyright = {2013 Ouellet et al.; licensee BioMed Central Ltd.}, - issn = {1742-4690}, - url = {http://www.retrovirology.com/content/10/1/86/abstract}, - doi = {10.1186/1742-4690-10-86}, - abstract = {The transactivating response (TAR) element of human immunodeficiency virus type 1 (HIV-1) is the source of two functional microRNAs (miRNAs), miR-TAR-5p and miR-TAR-3p. The objective of this study was to characterize the post-transcriptional regulation of host messenger RNAs (mRNAs) relevant to HIV-1 pathogenesis by HIV-1 TAR miRNAs. -PMID: 23938024}, - language = {en}, - number = {1}, - urldate = {2013-10-27}, - journal = {Retrovirology}, - author = {Ouellet, Dominique L. and Vigneault-Edwards, Jimmy and Létourneau, Kevin and Gobeil, Lise-Andrée and Plante, Isabelle and Burnett, John C. and Rossi, John J. and Provost, Patrick}, - month = aug, - year = {2013}, - pmid = {23938024}, - keywords = {Aiolos, Apoptosis, Caspase 8, HIV-1, Ikaros, Nucleophosmin (NPM)/B23, TAR microRNAs}, - pages = {86}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/55QQIWBC/Ouellet et al. - 2013 - Regulation of host gene expression by HIV-1 TAR mi.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/PR5UWZ4K/abstract.html:text/html} -} - -@article{lim_microarray_2005, - title = {Microarray analysis shows that some {microRNAs} downregulate large numbers of target {mRNAs}}, - volume = {433}, - copyright = {© 2005 Nature Publishing Group}, - issn = {0028-0836}, - url = {http://www.nature.com/nature/journal/v433/n7027/full/nature03315.html}, - doi = {10.1038/nature03315}, - abstract = {MicroRNAs (miRNAs) are a class of noncoding RNAs that post-transcriptionally regulate gene expression in plants and animals. To investigate the influence of miRNAs on transcript levels, we transfected miRNAs into human cells and used microarrays to examine changes in the messenger RNA profile. Here we show that delivering miR-124 causes the expression profile to shift towards that of brain, the organ in which miR-124 is preferentially expressed, whereas delivering miR-1 shifts the profile towards that of muscle, where miR-1 is preferentially expressed. In each case, about 100 messages were downregulated after 12 h. The 3′ untranslated regions of these messages had a significant propensity to pair to the 5′ region of the miRNA, as expected if many of these messages are the direct targets of the miRNAs. Our results suggest that metazoan miRNAs can reduce the levels of many of their target transcripts, not just the amount of protein deriving from these transcripts. Moreover, miR-1 and miR-124, and presumably other tissue-specific miRNAs, seem to downregulate a far greater number of targets than previously appreciated, thereby helping to define tissue-specific gene expression in humans.}, - language = {en}, - number = {7027}, - urldate = {2014-02-28}, - journal = {Nature}, - author = {Lim, Lee P. and Lau, Nelson C. and Garrett-Engele, Philip and Grimson, Andrew and Schelter, Janell M. and Castle, John and Bartel, David P. and Linsley, Peter S. and Johnson, Jason M.}, - month = feb, - year = {2005}, - pages = {769--773}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/A67C2Q64/Lim et al. - 2005 - Microarray analysis shows that some microRNAs down.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/BKSAVZFV/nature03315.html:text/html} -} - -@article{nekrasov_histone_2013, - title = {Histone variant selectivity at the transcription start site: {H}2A.{Z} or {H}2A.{Lap}1}, - volume = {4}, - issn = {1949-1034, 1949-1042}, - shorttitle = {Histone variant selectivity at the transcription start site}, - url = {http://www.landesbioscience.com/journals/nucleus/article/26862/}, - doi = {10.4161/nucl.26862}, - abstract = {Considerable attention has been given to the understanding of how nucleosomes are altered or removed from the transcription start site of RNA polymerase II genes to enable transcription to proceed. This has led to the view that for transcriptional activation to occur, the transcription start site (TSS) must become depleted of nucleosomes. However, we have shown that this is not the case with different unstable histone H2A variant-containing nucleosomes occupying the TSS under different physiological settings. For example, during mouse spermatogenesis we found that the mouse homolog of human H2A.Bbd, H2A.Lap1, is targeted to the TSS of active genes expressed during specific stages of spermatogenesis. On the other hand, we observed in trophoblast stem cells, a H2A.Z-containing nucleosome occupying the TSS of genes active in the G1 phase of the cell cycle. Notably, this H2A.Z-containing nucleosome was different compared with other promoter specific H2A.Z nucleosomes by being heterotypic rather than being homotypic. In other words, it did not contain the expected two copies of H2A.Z per nucleosome but only one (i.e., H2A.Z/H2A rather than H2A.Z/H2A.Z). Given these observations, we wondered whether the histone variant composition of a nucleosome at an active TSS could in fact vary in the same cell type. To investigate this possibility, we performed H2A.Z ChIP-H2A reChIP assays in the mouse testis and compared this data with our testis H2A.Lap1 ChIP-seq data. Indeed, we find that different promoters involved in the expression of genes involved in distinct biological processes can contain either H2A.Z/H2A or H2A.Lap1. This argues that specific mechanisms exist, which can determine whether H2A.Z or H2A.Lap1 is targeted to the TSS of an active gene., M Nekrasov, J Amrichova, BJ Parker, TA Soboleva, C Jack, R Williams, GA Huttley, DJ Tremethick. Histone H2A.Z inheritance during the cell cycle and its impact on promoter organization and dynamics. Nat Struct Mol Biol 2012; 19: 1076- 83.PMID: 23085713 DOI: 10.1038/nsmb.2424,}, - number = {6}, - urldate = {2014-02-19}, - journal = {Nucleus}, - author = {Nekrasov, Maxim and Soboleva, Tatiana A. and Jack, Cameron and Tremethick, David J.}, - month = nov, - year = {2013}, - pages = {431--437}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/JFCMIVWJ/Nekrasov et al. - 2013 - Histone variant selectivity at the transcription s.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/89FNR26R/26862.html:text/html} -} - -@article{cullen_micrornas_2013, - title = {{MicroRNAs} as mediators of viral evasion of the immune system}, - volume = {14}, - copyright = {© 2013 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, - issn = {1529-2908}, - url = {http://www.nature.com/ni/journal/v14/n3/full/ni.2537.html}, - doi = {10.1038/ni.2537}, - language = {en}, - number = {3}, - urldate = {2013-10-22}, - journal = {Nature Immunology}, - author = {Cullen, Bryan R.}, - month = mar, - year = {2013}, - keywords = {Innate Immunity, Pathogenesis, miRNA}, - pages = {205--210}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4AJRMCD3/Cullen - 2013 - MicroRNAs as mediators of viral evasion of the imm.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/QZBMND3C/ni.2537.html:text/html} -} - -@article{swaminathan_mirnas_2013-1, - title = {{miRNAs} and {HIV}: unforeseen determinants of host-pathogen interaction}, - volume = {254}, - copyright = {© 2013 John Wiley \& Sons A/S. Published by John Wiley \& Sons Ltd}, - issn = {1600-065X}, - shorttitle = {{miRNAs} and {HIV}}, - url = {http://onlinelibrary.wiley.com/doi/10.1111/imr.12077/abstract}, - doi = {10.1111/imr.12077}, - abstract = {Our understanding of the complexity of gene regulation has significantly improved in the last decade as the role of small non-coding RNAs, called microRNAs (miRNAs), has been appreciated. These 19–22 nucleotide RNA molecules are critical regulators of mRNA translation and turnover. The miRNAs bind via a protein complex to the 3′ untranslated region (3′ UTR) of mRNA, ultimately leading to mRNA translational inhibition, degradation, or repression. Although many mechanisms by which human immunodeficiency virus-1 (HIV-1) infection eventually induces catastrophic immune destruction have been elucidated, the important role that miRNAs play in HIV-1 pathogenesis is only now emerging. Accumulating evidence demonstrates that changes to endogenous miRNA levels following infection is important: in maintaining HIV-1 latency in resting CD4+ T cells, potentially affect immune function via changes to cytokines such as interleukin-2 (IL-2) and IL-10 and may predict disease progression. We review the roles that both viral and host miRNAs play in different cell types and disease conditions that are important in HIV-1 infection and discuss how miRNAs affect key immunomodulatory molecules contributing to immune dysfunction. Further, we discuss whether miRNAs may be used as novel biomarkers in serum and the potential to modulate miRNA levels as a unique approach to combating this pathogen.}, - language = {en}, - number = {1}, - urldate = {2013-10-22}, - journal = {Immunological Reviews}, - author = {Swaminathan, Sanjay and Murray, Daniel D. and Kelleher, Anthony D.}, - year = {2013}, - keywords = {CD4+ T cell, HIV-1, biomarkers, cytokines, miRNA, monocytes}, - pages = {265--280}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/QEHIQS2J/Swaminathan et al. - 2013 - miRNAs and HIV unforeseen determinants of host-pa.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/NIJ7MNGA/abstract.html:text/html} -} - -@article{goldberg_distinct_2010, - title = {Distinct {Factors} {Control} {Histone} {Variant} {H}3.3 {Localization} at {Specific} {Genomic} {Regions}}, - volume = {140}, - issn = {0092-8674}, - url = {http://www.sciencedirect.com/science/article/pii/S0092867410000048}, - doi = {10.1016/j.cell.2010.01.003}, - abstract = {The incorporation of histone H3 variants has been implicated in the epigenetic memory of cellular state. Using genome editing with zinc-finger nucleases to tag endogenous H3.3, we report genome-wide profiles of H3 variants in mammalian embryonic stem cells and neuronal precursor cells. Genome-wide patterns of H3.3 are dependent on amino acid sequence and change with cellular differentiation at developmentally regulated loci. The H3.3 chaperone Hira is required for H3.3 enrichment at active and repressed genes. Strikingly, Hira is not essential for localization of H3.3 at telomeres and many transcription factor binding sites. Immunoaffinity purification and mass spectrometry reveal that the proteins Atrx and Daxx associate with H3.3 in a Hira-independent manner. Atrx is required for Hira-independent localization of H3.3 at telomeres and for the repression of telomeric RNA. Our data demonstrate that multiple and distinct factors are responsible for H3.3 localization at specific genomic locations in mammalian cells.}, - number = {5}, - urldate = {2014-03-07}, - journal = {Cell}, - author = {Goldberg, Aaron D. and Banaszynski, Laura A. and Noh, Kyung-Min and Lewis, Peter W. and Elsaesser, Simon J. and Stadler, Sonja and Dewell, Scott and Law, Martin and Guo, Xingyi and Li, Xuan and Wen, Duancheng and Chapgier, Ariane and DeKelver, Russell C. and Miller, Jeffrey C. and Lee, Ya-Li and Boydston, Elizabeth A. and Holmes, Michael C. and Gregory, Philip D. and Greally, John M. and Rafii, Shahin and Yang, Chingwen and Scambler, Peter J. and Garrick, David and Gibbons, Richard J. and Higgs, Douglas R. and Cristea, Ileana M. and Urnov, Fyodor D. and Zheng, Deyou and Allis, C. David}, - month = mar, - year = {2010}, - keywords = {DNA, PROTEINS, STEMCELL}, - pages = {678--691}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/B3CIZC9P/Goldberg et al. - 2010 - Distinct Factors Control Histone Variant H3.3 Loca.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/3ADJ9N2F/S0092867410000048.html:text/html} -} - -@article{ho_chip-chip_2011, - title = {{ChIP}-chip versus {ChIP}-seq: {Lessons} for experimental design and data analysis}, - volume = {12}, - copyright = {2011 Ho et al; licensee BioMed Central Ltd.}, - issn = {1471-2164}, - shorttitle = {{ChIP}-chip versus {ChIP}-seq}, - url = {http://www.biomedcentral.com/1471-2164/12/134/abstract}, - doi = {10.1186/1471-2164-12-134}, - abstract = {Chromatin immunoprecipitation (ChIP) followed by microarray hybridization (ChIP-chip) or high-throughput sequencing (ChIP-seq) allows genome-wide discovery of protein-DNA interactions such as transcription factor bindings and histone modifications. Previous reports only compared a small number of profiles, and little has been done to compare histone modification profiles generated by the two technologies or to assess the impact of input DNA libraries in ChIP-seq analysis. Here, we performed a systematic analysis of a modENCODE dataset consisting of 31 pairs of ChIP-chip/ChIP-seq profiles of the coactivator CBP, RNA polymerase II (RNA PolII), and six histone modifications across four developmental stages of Drosophila melanogaster. -PMID: 21356108}, - language = {en}, - number = {1}, - urldate = {2014-02-27}, - journal = {BMC Genomics}, - author = {Ho, Joshua WK and Bishop, Eric and Karchenko, Peter V. and Nègre, Nicolas and White, Kevin P. and Park, Peter J.}, - month = feb, - year = {2011}, - pmid = {21356108}, - pages = {134}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/A73GTHH6/Ho et al. - 2011 - ChIP-chip versus ChIP-seq Lessons for experimenta.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/59ATDH2S/134.html:text/html} -} - -@article{taub_liver_2004, - title = {Liver regeneration: from myth to mechanism}, - volume = {5}, - copyright = {© 2004 Nature Publishing Group}, - issn = {1471-0072}, - shorttitle = {Liver regeneration}, - url = {http://www.nature.com/nrm/journal/v5/n10/full/nrm1489.html}, - doi = {10.1038/nrm1489}, - abstract = {The unusual regenerative properties of the liver are a logical adaptation by organisms, as the liver is the main detoxifying organ of the body and is likely to be injured by ingested toxins. The numerous cytokine- and growth-factor-mediated pathways that are involved in regulating liver regeneration are being successfully dissected using molecular and genetic approaches. So what is known about this process at present and which questions remain?}, - language = {en}, - number = {10}, - urldate = {2014-03-14}, - journal = {Nature Reviews Molecular Cell Biology}, - author = {Taub, Rebecca}, - month = oct, - year = {2004}, - pages = {836--847}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RR2JA7R4/Taub - 2004 - Liver regeneration from myth to mechanism.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/FQ46CJJZ/nrm1489.html:text/html} -} - -@article{freaney_high-density_2014, - title = {High-{Density} {Nucleosome} {Occupancy} {Map} of {Human} {Chromosome} 9p21–22 {Reveals} {Chromatin} {Organization} of the {Type} {I} {Interferon} {Gene} {Cluster}}, - issn = {1079-9907, 1557-7465}, - url = {http://online.liebertpub.com/doi/full/10.1089/jir.2013.0118}, - doi = {10.1089/jir.2013.0118}, - language = {en}, - urldate = {2014-04-02}, - journal = {Journal of Interferon \& Cytokine Research}, - author = {Freaney, Jonathan E. and Zhang, Quanwei and Yigit, Erbay and Kim, Rebecca and Widom, Jonathan and Wang, Ji-Ping and Horvath, Curt M.}, - month = mar, - year = {2014}, - pages = {140327155152002}, - file = {High-Density Nucleosome Occupancy Map of Human Chromosome 9p21–\;22 Reveals Chromatin Organization of the Type I Interferon Gene Cluster:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/H8RZZ6HD/jir.2013.html:text/html} -} - -@article{kang_closing_2013, - title = {Closing the door to human immunodeficiency virus}, - volume = {4}, - issn = {1674-8018}, - doi = {10.1007/s13238-012-2111-9}, - abstract = {The pandemic of human immunodeficiency virus type one (HIV-1), the major etiologic agent of acquired immunodeficiency disease (AIDS), has led to over 33 million people living with the virus, among which 18 million are women and children. Until now, there is neither an effective vaccine nor a therapeutic cure despite over 30 years of efforts. Although the Thai RV144 vaccine trial has demonstrated an efficacy of 31.2\%, an effective vaccine will likely rely on a breakthrough discovery of immunogens to elicit broadly reactive neutralizing antibodies, which may take years to achieve. Therefore, there is an urgency of exploring other prophylactic strategies. Recently, antiretroviral treatment as prevention is an exciting area of progress in HIV-1 research. Although effective, the implementation of such strategy faces great financial, political and social challenges in heavily affected regions such as developing countries where drug resistant viruses have already been found with growing incidence. Activating latently infected cells for therapeutic cure is another area of challenge. Since it is greatly difficult to eradicate HIV-1 after the establishment of viral latency, it is necessary to investigate strategies that may close the door to HIV-1. Here, we review studies on non-vaccine strategies in targeting viral entry, which may have critical implications for HIV-1 prevention.}, - language = {eng}, - number = {2}, - journal = {Protein \& cell}, - author = {Kang, Yuanxi and Guo, Jia and Chen, Zhiwei}, - month = feb, - year = {2013}, - pmid = {23479426}, - keywords = {AIDS Vaccines, Antibodies, Monoclonal, Antibodies, Neutralizing, Genetic Therapy, HIV Infections, HIV-1, Humans, Peptides, Small Molecule Libraries, Virus Internalization}, - pages = {86--102} -} - -@article{ehrensberger_mechanistic_2013, - title = {Mechanistic {Interpretation} of {Promoter}-{Proximal} {Peaks} and {RNAPII} {Density} {Maps}}, - volume = {154}, - issn = {0092-8674}, - url = {http://www.sciencedirect.com/science/article/pii/S0092867413009033}, - doi = {10.1016/j.cell.2013.07.032}, - number = {4}, - urldate = {2014-05-14}, - journal = {Cell}, - author = {Ehrensberger, Andreas H. and Kelly, Gavin P. and Svejstrup, Jesper Q.}, - month = aug, - year = {2013}, - pages = {713--715}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/VT8I5V25/Ehrensberger et al. - 2013 - Mechanistic Interpretation of Promoter-Proximal Pe.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Z3ZNGBDP/S0092867413009033.html:text/html} -} - -@article{ruelas_integrated_2013, - title = {An {Integrated} {Overview} of {HIV}-1 {Latency}}, - volume = {155}, - issn = {0092-8674}, - url = {http://www.cell.com/abstract/S0092-8674(13)01218-X}, - doi = {10.1016/j.cell.2013.09.044}, - number = {3}, - urldate = {2013-11-05}, - journal = {Cell}, - author = {Ruelas, Debbie S. and Greene, Warner C.}, - month = oct, - year = {2013}, - pages = {519--529}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/AW6B32HM/Ruelas et Greene - 2013 - An Integrated Overview of HIV-1 Latency.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/I5RUR9H2/S0092-8674(13)01218-X.html:text/html} -} - -@article{baze_gene_2010, - title = {Gene expression of the liver in response to chronic hypoxia}, - volume = {41}, - issn = {1094-8341}, - url = {http://www.ncbi.nlm.nih.gov/pmc/articles/PMC2869108/}, - doi = {10.1152/physiolgenomics.00075.2009}, - abstract = {Hypoxia is an important ecological, evolutionary, and biomedical stressor. While physiological acclimatization of mammals to hypoxia is well studied, the variation in gene expression that underlies acclimatization is not well studied. We acclimatized inbred mice for 32 days to hypoxic conditions that simulated altitudes of 1400, 3000, and 4500 m. We used oligonucleotide microarrays to measure changes in steady-state abundance of mRNA in the livers of these mice. Mice exposed to more severe hypoxia (simulated altitude of 4500 m) were smaller in mass and had higher hematocrit than mice exposed to less severe hypoxia. ANOVA and false discovery rate tests indicated that 580 genes were significantly differentially expressed in response to chronic hypoxia. Few of these 580 genes have previously been reported to respond to hypoxia. In contrast, many of these 580 genes belonged to same functional groups typically respond to acute hypoxia. That is, both chronic and acute hypoxia elicit changes in transcript abundance for genes involved in angiogenesis, glycolysis, lipid metabolism, carbohydrate metabolism, and protein amino acid phosphorylation, but the particular genes affected by the two types of hypoxia were mostly different. Numerous genes affecting the immune system were differentially expressed in response to chronic hypoxia, which supports recently proposed hypotheses that link immune function and hypoxia. Furthermore, our results discovered novel elevated mRNA abundance of genes involved in hematopoiesis and oxygen transport not reported previously, but consistent with extreme hematocrits found in hypoxic mice.}, - number = {3}, - urldate = {2014-03-25}, - journal = {Physiological Genomics}, - author = {Baze, Monica M. and Schlauch, Karen and Hayes, Jack P.}, - month = may, - year = {2010}, - pmid = {20103700}, - pmcid = {PMC2869108}, - pages = {275--288} -} - -@article{neil_tetherin_2008, - title = {Tetherin inhibits retrovirus release and is antagonized by {HIV}-1 {Vpu}}, - volume = {451}, - copyright = {© 2008 Nature Publishing Group}, - issn = {0028-0836}, - url = {http://www.nature.com/nature/journal/v451/n7177/full/nature06553.html}, - doi = {10.1038/nature06553}, - abstract = {Human cells possess an antiviral activity that inhibits the release of retrovirus particles, and other enveloped virus particles, and is antagonized by the HIV-1 accessory protein, Vpu. This antiviral activity can be constitutively expressed or induced by interferon-α, and it consists of protein-based tethers, which we term ‘tetherins’, that cause retention of fully formed virions on infected cell surfaces. Using deductive constraints and gene expression analyses, we identify CD317 (also called BST2 or HM1.24), a membrane protein of previously unknown function, as a tetherin. Specifically, CD317 expression correlated with, and induced, a requirement for Vpu during HIV-1 and murine leukaemia virus particle release. Furthermore, in cells where HIV-1 virion release requires Vpu expression, depletion of CD317 abolished this requirement. CD317 caused retention of virions on cell surfaces and, after endocytosis, in CD317-positive compartments. Vpu co-localized with CD317 and inhibited these effects. Inhibition of Vpu function and consequent mobilization of tetherin’s antiviral activity is a potential therapeutic strategy in HIV/AIDS.}, - language = {en}, - number = {7177}, - urldate = {2013-11-10}, - journal = {Nature}, - author = {Neil, Stuart J. D. and Zang, Trinity and Bieniasz, Paul D.}, - month = jan, - year = {2008}, - keywords = {DNA, RNA, astronomy, astrophysics, biochemistry, bioinformatics, biology, biotechnology, cancer, cell cycle, cell signalling, climate change, computational biology, development, developmental biology, drug discovery, earth science, ecology, environmental science, evolution, evolutionary biology, functional genomics, genetics, genomics, geophysics, immunology, interdisciplinary science, life, marine biology, materials science, medical research, medicine, metabolomics, molecular biology, molecular interactions, nanotechnology, nature, neurobiology, neuroscience, palaeobiology, pharmacology, physics, proteomics, quantum physics, science, science news, science policy, signal transduction, structural biology, systems biology, transcriptomics}, - pages = {425--430}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/2BFUMBAT/Neil et al. - 2008 - Tetherin inhibits retrovirus release and is antago.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/SQ66DBQC/nature06553.html:text/html} -} - -@article{boyle_high-resolution_2008, - title = {High-{Resolution} {Mapping} and {Characterization} of {Open} {Chromatin} across the {Genome}}, - volume = {132}, - issn = {0092-8674}, - url = {http://www.sciencedirect.com/science/article/pii/S0092867407016133}, - doi = {10.1016/j.cell.2007.12.014}, - abstract = {Summary -Mapping DNase I hypersensitive (HS) sites is an accurate method of identifying the location of genetic regulatory elements, including promoters, enhancers, silencers, insulators, and locus control regions. We employed high-throughput sequencing and whole-genome tiled array strategies to identify DNase I HS sites within human primary CD4+ T cells. Combining these two technologies, we have created a comprehensive and accurate genome-wide open chromatin map. Surprisingly, only 16\%–21\% of the identified 94,925 DNase I HS sites are found in promoters or first exons of known genes, but nearly half of the most open sites are in these regions. In conjunction with expression, motif, and chromatin immunoprecipitation data, we find evidence of cell-type-specific characteristics, including the ability to identify transcription start sites and locations of different chromatin marks utilized in these cells. In addition, and unexpectedly, our analyses have uncovered detailed features of nucleosome structure.}, - number = {2}, - urldate = {2015-09-11}, - journal = {Cell}, - author = {Boyle, Alan P. and Davis, Sean and Shulha, Hennady P. and Meltzer, Paul and Margulies, Elliott H. and Weng, Zhiping and Furey, Terrence S. and Crawford, Gregory E.}, - month = jan, - year = {2008}, - keywords = {DNA}, - pages = {311--322}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/AT3JAG9P/Boyle et al. - 2008 - High-Resolution Mapping and Characterization of Op.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/W2KDFIGZ/S0092867407016133.html:text/html} -} - -@article{barski_high-resolution_2007, - title = {High-{Resolution} {Profiling} of {Histone} {Methylations} in the {Human} {Genome}}, - volume = {129}, - issn = {0092-8674}, - url = {http://www.sciencedirect.com/science/article/pii/S0092867407006009}, - doi = {10.1016/j.cell.2007.05.009}, - abstract = {Histone modifications are implicated in influencing gene expression. We have generated high-resolution maps for the genome-wide distribution of 20 histone lysine and arginine methylations as well as histone variant H2A.Z, RNA polymerase II, and the insulator binding protein CTCF across the human genome using the Solexa 1G sequencing technology. Typical patterns of histone methylations exhibited at promoters, insulators, enhancers, and transcribed regions are identified. The monomethylations of H3K27, H3K9, H4K20, H3K79, and H2BK5 are all linked to gene activation, whereas trimethylations of H3K27, H3K9, and H3K79 are linked to repression. H2A.Z associates with functional regulatory elements, and CTCF marks boundaries of histone methylation domains. Chromosome banding patterns are correlated with unique patterns of histone modifications. Chromosome breakpoints detected in T cell cancers frequently reside in chromatin regions associated with H3K4 methylations. Our data provide new insights into the function of histone methylation and chromatin organization in genome function.}, - number = {4}, - urldate = {2014-03-05}, - journal = {Cell}, - author = {Barski, Artem and Cuddapah, Suresh and Cui, Kairong and Roh, Tae-Young and Schones, Dustin E. and Wang, Zhibin and Wei, Gang and Chepelev, Iouri and Zhao, Keji}, - month = may, - year = {2007}, - keywords = {DNA, PROTEINS, SYSBIO}, - pages = {823--837}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/QUNNP84A/Barski et al. - 2007 - High-Resolution Profiling of Histone Methylations .pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/AD6CEICR/S0092867407006009.html:text/html} -} - -@article{karn_transcriptional_2012-1, - title = {Transcriptional and {Posttranscriptional} {Regulation} of {HIV}-1 {Gene} {Expression}}, - volume = {2}, - issn = {2157-1422}, - url = {http://www.ncbi.nlm.nih.gov/pmc/articles/PMC3281586/}, - doi = {10.1101/cshperspect.a006916}, - abstract = {Control of HIV-1 gene expression depends on two viral regulatory proteins, Tat and Rev. Tat stimulates transcription elongation by directing the cellular transcriptional elongation factor P-TEFb to nascent RNA polymerases. Rev is required for the transport from the nucleus to the cytoplasm of the unspliced and incompletely spliced mRNAs that encode the structural proteins of the virus. Molecular studies of both proteins have revealed how they interact with the cellular machinery to control transcription from the viral LTR and regulate the levels of spliced and unspliced mRNAs. The regulatory feedback mechanisms driven by HIV-1 Tat and Rev ensure that HIV-1 transcription proceeds through distinct phases. In cells that are not fully activated, limiting levels of Tat and Rev act as potent blocks to premature virus production., HIV-1 gene expression is controlled by RNA-binding proteins Tat and Rev. They orchestrate complex interactions with the cellular transcription, RNA splicing, and RNA transport machinery, and are important targets for drug discovery.}, - number = {2}, - urldate = {2013-11-17}, - journal = {Cold Spring Harbor Perspectives in Medicine}, - author = {Karn, Jonathan and Stoltzfus, C. Martin}, - month = feb, - year = {2012}, - pmid = {22355797}, - pmcid = {PMC3281586}, - file = {PubMed Central Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/AX7PM55A/Karn et Stoltzfus - 2012 - Transcriptional and Posttranscriptional Regulation.pdf:application/pdf} -} - -@article{henikoff_assembly_2005, - title = {Assembly of {Variant} {Histones} into {Chromatin}}, - volume = {21}, - url = {http://www.annualreviews.org/doi/abs/10.1146/annurev.cellbio.21.012704.133518}, - doi = {10.1146/annurev.cellbio.21.012704.133518}, - abstract = {Abstract Chromatin can be differentiated by the deposition of variant histones at centromeres, active genes, and silent loci. Variant histones are assembled into nucleosomes in a replication-independent manner, in contrast to assembly of bulk chromatin that is coupled to replication. Recent in vitro studies have provided the first glimpses of protein machines dedicated to building and replacing alternative nucleosomes. They deposit variant H2A and H3 histones and are targeted to particular functional sites in the genome. Differences between variant and canonical histones can have profound consequences, either for delivery of the histones to sites of assembly or for their function after incorporation into chromatin. Recent studies have also revealed connections between assembly of variant nucleosomes, chromatin remodeling, and histone post-translational modification. Taken together, these findings indicate that chromosome architecture can be highly dynamic at the most fundamental level, with epigenetic consequences.}, - number = {1}, - urldate = {2014-02-18}, - journal = {Annual Review of Cell and Developmental Biology}, - author = {Henikoff, Steven and Ahmad, Kami}, - year = {2005}, - pmid = {16212490}, - keywords = {centromeric chromatin, chromatin remodeling, epigenetics, histone replacement, nucleosome}, - pages = {133--153}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RGX3D9KX/Henikoff et Ahmad - 2005 - Assembly of Variant Histones into Chromatin.pdf:application/pdf} -} - -@article{weiner_high-resolution_2010, - title = {High-resolution nucleosome mapping reveals transcription-dependent promoter packaging}, - volume = {20}, - issn = {1088-9051, 1549-5469}, - url = {http://genome.cshlp.org/content/20/1/90}, - doi = {10.1101/gr.098509.109}, - abstract = {Genome-wide mapping of nucleosomes has revealed a great deal about the relationships between chromatin structure and control of gene expression, and has led to mechanistic hypotheses regarding the rules by which chromatin structure is established. High-throughput sequencing has recently become the technology of choice for chromatin mapping studies, yet analysis of these experiments is still in its infancy. Here, we introduce a pipeline for analyzing deep sequencing maps of chromatin structure and apply it to data from S. cerevisiae. We analyze a digestion series where nucleosomes are isolated from under- and overdigested chromatin. We find that certain classes of nucleosomes are unusually susceptible or resistant to overdigestion, with promoter nucleosomes easily digested and mid-coding region nucleosomes being quite stable. We find evidence for highly sensitive nucleosomes located within “nucleosome-free regions,” suggesting that these regions are not always completely naked but instead are likely associated with easily digested nucleosomes. Finally, since RNA polymerase is the dominant energy-consuming machine that operates on the chromatin template, we analyze changes in chromatin structure when RNA polymerase is inactivated via a temperature-sensitive mutation. We find evidence that RNA polymerase plays a role in nucleosome eviction at promoters and is also responsible for retrograde shifts in nucleosomes during transcription. Loss of RNA polymerase results in a relaxation of chromatin structure to more closely match in vitro nucleosome positioning preferences. Together, these results provide analytical tools and experimental guidance for nucleosome mapping experiments, and help disentangle the interlinked processes of transcription and chromatin packaging.}, - language = {en}, - number = {1}, - urldate = {2014-04-03}, - journal = {Genome Research}, - author = {Weiner, Assaf and Hughes, Amanda and Yassour, Moran and Rando, Oliver J. and Friedman, Nir}, - month = jan, - year = {2010}, - pmid = {19846608}, - pages = {90--100}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/PHAUUI6G/Weiner et al. - 2010 - High-resolution nucleosome mapping reveals transcr.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XX7QD9UB/90.html:text/html} -} - -@article{triboulet_suppression_2007, - title = {Suppression of {MicroRNA}-{Silencing} {Pathway} by {HIV}-1 {During} {Virus} {Replication}}, - volume = {315}, - issn = {0036-8075, 1095-9203}, - url = {http://www.sciencemag.org/content/315/5818/1579}, - doi = {10.1126/science.1136319}, - abstract = {MicroRNAs (miRNAs) are single-stranded noncoding RNAs of 19 to 25 nucleotides that function as gene regulators and as a host cell defense against both RNA and DNA viruses. We provide evidence for a physiological role of the miRNA-silencing machinery in controlling HIV-1 replication. Type III RNAses Dicer and Drosha, responsible for miRNA processing, inhibited virus replication both in peripheral blood mononuclear cells from HIV-1–infected donors and in latently infected cells. In turn, HIV-1 actively suppressed the expression of the polycistronic miRNA cluster miR-17/92. This suppression was found to be required for efficient viral replication and was dependent on the histone acetyltransferase Tat cofactor PCAF. Our results highlight the involvement of the miRNA-silencing pathway in HIV-1 replication and latency.}, - language = {en}, - number = {5818}, - urldate = {2013-10-08}, - journal = {Science}, - author = {Triboulet, Robinson and Mari, Bernard and Lin, Yea-Lih and Chable-Bessia, Christine and Bennasser, Yamina and Lebrigand, Kevin and Cardinaud, Bruno and Maurin, Thomas and Barbry, Pascal and Baillat, Vincent and Reynes, Jacques and Corbeau, Pierre and Jeang, Kuan-Teh and Benkirane, Monsef}, - month = mar, - year = {2007}, - pmid = {17322031}, - pages = {1579--1582}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/DWR3576A/Triboulet et al. - 2007 - Suppression of MicroRNA-Silencing Pathway by HIV-1.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/K299R4RF/1579.html:text/html} -} - -@article{suhasini_cellular_2009, - title = {Cellular {Proteins} and {HIV}-1 {Rev} {Function}}, - volume = {7}, - issn = {1570162X}, - url = {http://www.eurekaselect.com/93072/article}, - doi = {10.2174/157016209787048474}, - number = {1}, - urldate = {2013-11-10}, - journal = {Current HIV Research}, - author = {Suhasini, Modem and Reddy, Thipparthi}, - month = jan, - year = {2009}, - pages = {91--100}, - file = {Cellular Proteins and HIV-1 Rev Function | BenthamScience:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/8WFZKT67/article.html:text/html} -} - -@article{cifuentes_novel_2010, - title = {A {Novel} {miRNA} {Processing} {Pathway} {Independent} of {Dicer} {Requires} {Argonaute}2 {Catalytic} {Activity}}, - volume = {328}, - issn = {0036-8075, 1095-9203}, - url = {http://www.sciencemag.org/content/328/5986/1694}, - doi = {10.1126/science.1190809}, - abstract = {Dicer is a central enzyme in microRNA (miRNA) processing. We identified a Dicer-independent miRNA biogenesis pathway that uses Argonaute2 (Ago2) slicer catalytic activity. In contrast to other miRNAs, miR-451 levels were refractory to dicer loss of function but were reduced in MZago2 (maternal-zygotic) mutants. We found that pre-miR-451 processing requires Ago2 catalytic activity in vivo. MZago2 mutants showed delayed erythropoiesis that could be rescued by wild-type Ago2 or miR-451-duplex but not by catalytically dead Ago2. Changing the secondary structure of Dicer-dependent miRNAs to mimic that of pre-miR-451 restored miRNA function and rescued developmental defects in MZdicer mutants, indicating that the pre-miRNA secondary structure determines the processing pathway in vivo. We propose that Ago2-mediated cleavage of pre-miRNAs, followed by uridylation and trimming, generates functional miRNAs independently of Dicer.}, - language = {en}, - number = {5986}, - urldate = {2013-10-27}, - journal = {Science}, - author = {Cifuentes, Daniel and Xue, Huiling and Taylor, David W. and Patnode, Heather and Mishima, Yuichiro and Cheloufi, Sihem and Ma, Enbo and Mane, Shrikant and Hannon, Gregory J. and Lawson, Nathan D. and Wolfe, Scot A. and Giraldez, Antonio J.}, - month = jun, - year = {2010}, - pmid = {20448148}, - pages = {1694--1698}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/5JZBD2NG/Cifuentes et al. - 2010 - A Novel miRNA Processing Pathway Independent of Di.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/BWUIUMKI/1694.html:text/html} -} - -@article{clarke_protein_2013, - title = {Protein methylation at the surface and buried deep: thinking outside the histone box}, - volume = {38}, - issn = {0968-0004}, - shorttitle = {Protein methylation at the surface and buried deep}, - url = {http://www.sciencedirect.com/science/article/pii/S096800041300025X}, - doi = {10.1016/j.tibs.2013.02.004}, - abstract = {Methylated lysine and arginine residues in histones represent a crucial part of the histone code, and recognition of these methylated residues by protein interaction domains modulates transcription. Although some methylating enzymes appear to be histone specific, many can modify histone and non-histone substrates and an increasing number are specific for non-histone substrates. Some of the non-histone substrates can also be involved in transcription, but a distinct subset of protein methylation reactions occurs at residues buried deeply in ribosomal proteins that may function in protein–RNA interactions rather than protein–protein interactions. Additionally, recent work has identified enzymes that catalyze protein methylation reactions at new sites in ribosomal and other proteins. These reactions include modifications of histidine and cysteine residues as well as the N terminus.}, - number = {5}, - urldate = {2014-02-28}, - journal = {Trends in Biochemical Sciences}, - author = {Clarke, Steven G.}, - month = may, - year = {2013}, - keywords = {PRMTs, SET-domain methyltransferases, histone methylation, ribosomal protein methylation}, - pages = {243--252}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/83NA87D7/Clarke - 2013 - Protein methylation at the surface and buried deep.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/J5WCR7JP/S096800041300025X.html:text/html} -} - -@article{pillai_repression_2007, - title = {Repression of protein synthesis by {miRNAs}: how many mechanisms?}, - volume = {17}, - issn = {0962-8924}, - shorttitle = {Repression of protein synthesis by {miRNAs}}, - url = {http://www.sciencedirect.com/science/article/pii/S096289240600359X}, - doi = {10.1016/j.tcb.2006.12.007}, - abstract = {MicroRNAs are ∼21-nucleotide-long regulators of gene expression that gain access to their target mRNAs by complementary base pairing. Recent studies have revealed that animal microRNAs might take diverse routes to repress gene expression, affecting both target mRNA levels and translation. Mechanistic details of microRNA-mediated repression are starting to emerge but a comprehensive picture of the inhibition, and particularly the effects on mRNA translation, is still lacking. Recent data support different microRNA mechanisms and a role for cytoplasmic processing bodies in the degradation and storage of mRNAs targeted by microRNA regulators.}, - number = {3}, - urldate = {2013-10-12}, - journal = {Trends in Cell Biology}, - author = {Pillai, Ramesh S. and Bhattacharyya, Suvendra N. and Filipowicz, Witold}, - month = mar, - year = {2007}, - pages = {118--126}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6SC25NBC/Pillai et al. - 2007 - Repression of protein synthesis by miRNAs how man.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/I35PSR34/S096289240600359X.html:text/html} -} - -@article{bassi_primer_2007, - title = {A {Primer} on {Python} for {Life} {Science} {Researchers}}, - volume = {3}, - url = {http://dx.doi.org/10.1371/journal.pcbi.0030199}, - doi = {10.1371/journal.pcbi.0030199}, - number = {11}, - urldate = {2014-05-23}, - journal = {PLoS Comput Biol}, - author = {Bassi, Sebastian}, - month = nov, - year = {2007}, - pages = {e199}, - file = {PLoS Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4HUI2K2E/Bassi - 2007 - A Primer on Python for Life Science Researchers.pdf:application/pdf;PLoS Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/PWP7C2VX/infodoi10.1371journal.pcbi.html:text/html} -} - -@article{chen_h3.3_2013, - title = {H3.3 actively marks enhancers and primes gene transcription via opening higher-ordered chromatin}, - volume = {27}, - issn = {0890-9369, 1549-5477}, - url = {http://genesdev.cshlp.org/content/27/19/2109}, - doi = {10.1101/gad.222174.113}, - abstract = {The histone variants H3.3 and H2A.Z have recently emerged as two of the most important features in transcriptional regulation, the molecular mechanism of which still remains poorly understood. In this study, we investigated the regulation of H3.3 and H2A.Z on chromatin dynamics during transcriptional activation. Our in vitro biophysical and biochemical investigation showed that H2A.Z promoted chromatin compaction and repressed transcriptional activity. Surprisingly, with only four to five amino acid differences from the canonical H3, H3.3 greatly impaired higher-ordered chromatin folding and promoted gene activation, although it has no significant effect on the stability of mononucleosomes. We further demonstrated that H3.3 actively marks enhancers and determines the transcriptional potential of retinoid acid (RA)-regulated genes via creating an open chromatin signature that enables the binding of RAR/RXR. Additionally, the H3.3-dependent recruitment of H2A.Z on promoter regions resulted in compaction of chromatin to poise transcription, while RA induction results in the incorporation of H3.3 on promoter regions to activate transcription via counteracting H2A.Z-mediated chromatin compaction. Our results provide key insights into the mechanism of how histone variants H3.3 and H2A.Z function together to regulate gene transcription via the modulation of chromatin dynamics over the enhancer and promoter regions.}, - language = {en}, - number = {19}, - urldate = {2014-02-17}, - journal = {Genes \& Development}, - author = {Chen, Ping and Zhao, Jicheng and Wang, Yan and Wang, Min and Long, Haizhen and Liang, Dan and Huang, Li and Wen, Zengqi and Li, Wei and Li, Xia and Feng, Hongli and Zhao, Haiyong and Zhu, Ping and Li, Ming and Wang, Qian-fei and Li, Guohong}, - month = oct, - year = {2013}, - pmid = {24065740}, - keywords = {H2A.Z, H3.3, Histone variants, chromatin dynamics, gene transcription, higher-ordered chromatin structure}, - pages = {2109--2124}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/AFE9ZXJN/Chen et al. - 2013 - H3.3 actively marks enhancers and primes gene tran.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/NV89I5GC/2109.html:text/html} -} - -@article{bailey_practical_2013, - title = {Practical {Guidelines} for the {Comprehensive} {Analysis} of {ChIP}-seq {Data}}, - volume = {9}, - url = {http://dx.doi.org/10.1371/journal.pcbi.1003326}, - doi = {10.1371/journal.pcbi.1003326}, - abstract = {Mapping the chromosomal locations of transcription factors, nucleosomes, histone modifications, chromatin remodeling enzymes, chaperones, and polymerases is one of the key tasks of modern biology, as evidenced by the Encyclopedia of DNA Elements (ENCODE) Project. To this end, chromatin immunoprecipitation followed by high-throughput sequencing (ChIP-seq) is the standard methodology. Mapping such protein-DNA interactions in vivo using ChIP-seq presents multiple challenges not only in sample preparation and sequencing but also for computational analysis. Here, we present step-by-step guidelines for the computational analysis of ChIP-seq data. We address all the major steps in the analysis of ChIP-seq data: sequencing depth selection, quality checking, mapping, data normalization, assessment of reproducibility, peak calling, differential binding analysis, controlling the false discovery rate, peak annotation, visualization, and motif analysis. At each step in our guidelines we discuss some of the software tools most frequently used. We also highlight the challenges and problems associated with each step in ChIP-seq data analysis. We present a concise workflow for the analysis of ChIP-seq data in Figure 1 that complements and expands on the recommendations of the ENCODE and modENCODE projects. Each step in the workflow is described in detail in the following sections.}, - number = {11}, - urldate = {2014-05-22}, - journal = {PLoS Comput Biol}, - author = {Bailey, Timothy and Krajewski, Pawel and Ladunga, Istvan and Lefebvre, Celine and Li, Qunhua and Liu, Tao and Madrigal, Pedro and Taslim, Cenny and Zhang, Jie}, - month = nov, - year = {2013}, - pages = {e1003326}, - file = {PLoS Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4FGJAV84/Bailey et al. - 2013 - Practical Guidelines for the Comprehensive Analysi.pdf:application/pdf;PLoS Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4SF6WQ4C/infodoi10.1371journal.pcbi.html:text/html} -} - -@article{compeau_how_2011, - title = {How to apply de {Bruijn} graphs to genome assembly}, - volume = {29}, - copyright = {© 2011 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, - issn = {1087-0156}, - url = {http://www.nature.com/nbt/journal/v29/n11/full/nbt.2023.html}, - doi = {10.1038/nbt.2023}, - abstract = {A mathematical concept known as a de Bruijn graph turns the formidable challenge of assembling a contiguous genome from billions of short sequencing reads into a tractable computational problem.}, - language = {en}, - number = {11}, - urldate = {2014-01-24}, - journal = {Nature Biotechnology}, - author = {Compeau, Phillip E. C. and Pevzner, Pavel A. and Tesler, Glenn}, - month = nov, - year = {2011}, - pages = {987--991}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GWGZQGSI/Compeau et al. - 2011 - How to apply de Bruijn graphs to genome assembly.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/VTC6B66P/nbt.2023.html:text/html} -} - -@article{hansen_immune_2013, - title = {Immune clearance of highly pathogenic {SIV} infection}, - volume = {advance online publication}, - copyright = {© 2013 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, - issn = {1476-4687}, - url = {http://www.nature.com/nature/journal/vaop/ncurrent/full/nature12519.html}, - doi = {10.1038/nature12519}, - abstract = {Established infections with the human and simian immunodeficiency viruses (HIV and SIV, respectively) are thought to be permanent with even the most effective immune responses and antiretroviral therapies only able to control, but not clear, these infections. Whether the residual virus that maintains these infections is vulnerable to clearance is a question of central importance to the future management of millions of HIV-infected individuals. We recently reported that approximately 50\% of rhesus macaques (RM; Macaca mulatta) vaccinated with SIV protein-expressing rhesus cytomegalovirus (RhCMV/SIV) vectors manifest durable, aviraemic control of infection with the highly pathogenic strain SIVmac239 (ref. 5). Here we show that regardless of the route of challenge, RhCMV/SIV vector-elicited immune responses control SIVmac239 after demonstrable lymphatic and haematogenous viral dissemination, and that replication-competent SIV persists in several sites for weeks to months. Over time, however, protected RM lost signs of SIV infection, showing a consistent lack of measurable plasma- or tissue-associated virus using ultrasensitive assays, and a loss of T-cell reactivity to SIV determinants not in the vaccine. Extensive ultrasensitive quantitative PCR and quantitative PCR with reverse transcription analyses of tissues from RhCMV/SIV vector-protected RM necropsied 69–172 weeks after challenge did not detect SIV RNA or DNA sequences above background levels, and replication-competent SIV was not detected in these RM by extensive co-culture analysis of tissues or by adoptive transfer of 60 million haematolymphoid cells to naive RM. These data provide compelling evidence for progressive clearance of a pathogenic lentiviral infection, and suggest that some lentiviral reservoirs may be susceptible to the continuous effector memory T-cell-mediated immune surveillance elicited and maintained by cytomegalovirus vectors.}, - language = {en}, - urldate = {2013-09-25}, - journal = {Nature}, - author = {Hansen, Scott G. and Jr, Michael Piatak and Ventura, Abigail B. and Hughes, Colette M. and Gilbride, Roxanne M. and Ford, Julia C. and Oswald, Kelli and Shoemaker, Rebecca and Li, Yuan and Lewis, Matthew S. and Gilliam, Awbrey N. and Xu, Guangwu and Whizin, Nathan and Burwitz, Benjamin J. and Planer, Shannon L. and Turner, John M. and Legasse, Alfred W. and Axthelm, Michael K. and Nelson, Jay A. and Früh, Klaus and Sacha, Jonah B. and Estes, Jacob D. and Keele, Brandon F. and Edlefsen, Paul T. and Lifson, Jeffrey D. and Picker, Louis J.}, - month = sep, - year = {2013}, - keywords = {Live attenuated vaccines, Pathogens, Vaccines}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/988PVJ9J/Hansen et al. - 2013 - Immune clearance of highly pathogenic SIV infectio.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/27I96AG7/nature12519.html:text/html} -} - -@article{andreux_systems_2012, - title = {Systems {Genetics} of {Metabolism}: {The} {Use} of the {BXD} {Murine} {Reference} {Panel} for {Multiscalar} {Integration} of {Traits}}, - volume = {150}, - issn = {0092-8674}, - shorttitle = {Systems {Genetics} of {Metabolism}}, - url = {http://www.sciencedirect.com/science/article/pii/S0092867412010070}, - doi = {10.1016/j.cell.2012.08.012}, - abstract = {Metabolic homeostasis is achieved by complex molecular and cellular networks that differ significantly among individuals and are difficult to model with genetically engineered lines of mice optimized to study single gene function. Here, we systematically acquired metabolic phenotypes by using the EUMODIC EMPReSS protocols across a large panel of isogenic but diverse strains of mice (BXD type) to study the genetic control of metabolism. We generated and analyzed 140 classical phenotypes and deposited these in an open-access web service for systems genetics (www.genenetwork.org). Heritability, influence of sex, and genetic modifiers of traits were examined singly and jointly by using quantitative-trait locus (QTL) and expression QTL-mapping methods. Traits and networks were linked to loci encompassing both known variants and novel candidate genes, including alkaline phosphatase (ALPL), here linked to hypophosphatasia. The assembled and curated phenotypes provide key resources and exemplars that can be used to dissect complex metabolic traits and disorders.}, - number = {6}, - urldate = {2014-03-30}, - journal = {Cell}, - author = {Andreux, Pénélope A. and Williams, Evan G. and Koutnikova, Hana and Houtkooper, Riekelt H. and Champy, Marie-France and Henry, Hugues and Schoonjans, Kristina and Williams, Robert W. and Auwerx, Johan}, - month = sep, - year = {2012}, - pages = {1287--1299}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/994RXI8U/Andreux et al. - 2012 - Systems Genetics of Metabolism The Use of the BXD.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HRCK7MBE/S0092867412010070.html:text/html} -} - -@article{henikoff_nucleosome_2008, - title = {Nucleosome destabilization in the epigenetic regulation of gene expression}, - volume = {9}, - copyright = {© 2008 Nature Publishing Group}, - issn = {1471-0056}, - url = {http://www.nature.com/nrg/journal/v9/n1/full/nrg2206.html#top}, - doi = {10.1038/nrg2206}, - abstract = {Assembly, mobilization and disassembly of nucleosomes can influence the regulation of gene expression and other processes that act on eukaryotic DNA. Distinct nucleosome-assembly pathways deposit dimeric subunits behind the replication fork or at sites of active processes that mobilize pre-existing nucleosomes. Replication-coupled nucleosome assembly appears to be the default process that maintains silent chromatin, counteracted by active processes that destabilize nucleosomes. Nucleosome stability is regulated by the combined effects of nucleosome-positioning sequences, histone chaperones, ATP-dependent nucleosome remodellers, post-translational modifications and histone variants. Recent studies suggest that histone turnover helps to maintain continuous access to sequence-specific DNA-binding proteins that regulate epigenetic inheritance, providing a dynamic alternative to histone-marking models for the propagation of active chromatin.}, - language = {en}, - number = {1}, - urldate = {2014-03-11}, - journal = {Nature Reviews Genetics}, - author = {Henikoff, Steven}, - month = jan, - year = {2008}, - pages = {15--26}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/BJQ7JWZD/Henikoff - 2008 - Nucleosome destabilization in the epigenetic regul.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6KSQPXIB/nrg2206.html:text/html} -} - -@article{yang_histone_2012, - title = {Histone {Methyltransferase} {NSD}2/{MMSET} {Mediates} {Constitutive} {NF}-κ{B} {Signaling} for {Cancer} {Cell} {Proliferation}, {Survival}, and {Tumor} {Growth} via a {Feed}-{Forward} {Loop}}, - volume = {32}, - issn = {0270-7306, 1098-5549}, - url = {http://mcb.asm.org/content/32/15/3121}, - doi = {10.1128/MCB.00204-12}, - abstract = {Constitutive NF-κB activation by proinflammatory cytokines plays a major role in cancer progression. However, the underlying mechanism is still unclear. We report here that histone methyltransferase NSD2 (also known as MMSET or WHSC1), a target of bromodomain protein ANCCA/ATAD2, acts as a strong coactivator of NF-κB by directly interacting with NF-κB for activation of target genes, including those for interleukin-6 (IL-6), IL-8, vascular endothelial growth factor A (VEGFA), cyclin D, Bcl-2, and survivin, in castration-resistant prostate cancer (CRPC) cells. NSD2 is recruited to the target gene promoters upon induction and mediates NF-κB activation-associated elevation of histone H3K36me2 and H3K36me3 marks at the promoter, which involves its methylase activity. Interestingly, we found that NSD2 is also critical for cytokine-induced recruitment of NF-κB and acetyltransferase p300 and histone hyperacetylation. Importantly, NSD2 is overexpressed in prostate cancer tumors, and its overexpression correlates with NF-κB activation. Furthermore, NSD2 expression is strongly induced by tumor necrosis factor alpha (TNF-α) and IL-6 via NF-κB and plays a crucial role in tumor growth. These results identify NSD2 to be a key chromatin regulator of NF-κB and mediator of the cytokine autocrine loop for constitutive NF-κB activation and emphasize the important roles played by NSD2 in cancer cell proliferation and survival and tumor growth.}, - language = {en}, - number = {15}, - urldate = {2014-03-18}, - journal = {Molecular and Cellular Biology}, - author = {Yang, Ping and Guo, Linlang and Duan, Zhijian J. and Tepper, Clifford G. and Xue, Ling and Chen, Xinbin and Kung, Hsing-Jien and Gao, Allen C. and Zou, June X. and Chen, Hong-Wu}, - month = aug, - year = {2012}, - pmid = {22645312}, - pages = {3121--3131}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/3SSXZ9CJ/Yang et al. - 2012 - Histone Methyltransferase NSD2MMSET Mediates Cons.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ERNJSACC/3121.html:text/html} -} - -@article{mavrich_nucleosome_2008, - title = {Nucleosome organization in the {Drosophila} genome}, - volume = {453}, - copyright = {© 2008 Nature Publishing Group}, - issn = {0028-0836}, - url = {http://www.nature.com/nature/journal/v453/n7193/full/nature06929.html}, - doi = {10.1038/nature06929}, - abstract = {Comparative genomics of nucleosome positions provides a powerful means for understanding how the organization of chromatin and the transcription machinery co-evolve. Here we produce a high-resolution reference map of H2A.Z and bulk nucleosome locations across the genome of the fly Drosophila melanogaster and compare it to that from the yeast Saccharomyces cerevisiae. Like Saccharomyces, Drosophila nucleosomes are organized around active transcription start sites in a canonical -1, nucleosome-free region, +1 arrangement. However, Drosophila does not incorporate H2A.Z into the -1 nucleosome and does not bury its transcriptional start site in the +1 nucleosome. At thousands of genes, RNA polymerase II engages the +1 nucleosome and pauses. How the transcription initiation machinery contends with the +1 nucleosome seems to be fundamentally different across major eukaryotic lines.}, - language = {en}, - number = {7193}, - urldate = {2014-03-13}, - journal = {Nature}, - author = {Mavrich, Travis N. and Jiang, Cizhong and Ioshikhes, Ilya P. and Li, Xiaoyong and Venters, Bryan J. and Zanton, Sara J. and Tomsho, Lynn P. and Qi, Ji and Glaser, Robert L. and Schuster, Stephan C. and Gilmour, David S. and Albert, Istvan and Pugh, B. Franklin}, - month = may, - year = {2008}, - pages = {358--362}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7HPWIZQN/Mavrich et al. - 2008 - Nucleosome organization in the Drosophila genome.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Q9ZDK9UX/nature06929.html:text/html} -} - -@article{obri_anp32e_2014, - title = {{ANP}32E is a histone chaperone that removes {H}2A.{Z} from chromatin}, - volume = {505}, - copyright = {© 2014 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, - issn = {0028-0836}, - url = {http://www.nature.com/nature/journal/v505/n7485/full/nature12922.html}, - doi = {10.1038/nature12922}, - abstract = {H2A.Z is an essential histone variant implicated in the regulation of key nuclear events. However, the metazoan chaperones responsible for H2A.Z deposition and its removal from chromatin remain unknown. Here we report the identification and characterization of the human protein ANP32E as a specific H2A.Z chaperone. We show that ANP32E is a member of the presumed H2A.Z histone-exchange complex p400/TIP60. ANP32E interacts with a short region of the docking domain of H2A.Z through a new motif termed H2A.Z interacting domain (ZID). The 1.48 Å resolution crystal structure of the complex formed between the ANP32E-ZID and the H2A.Z/H2B dimer and biochemical data support an underlying molecular mechanism for H2A.Z/H2B eviction from the nucleosome and its stabilization by ANP32E through a specific extension of the H2A.Z carboxy-terminal α-helix. Finally, analysis of H2A.Z localization in ANP32E−/− cells by chromatin immunoprecipitation followed by sequencing shows genome-wide enrichment, redistribution and accumulation of H2A.Z at specific chromatin control regions, in particular at enhancers and insulators.}, - language = {en}, - number = {7485}, - urldate = {2014-02-17}, - journal = {Nature}, - author = {Obri, Arnaud and Ouararhni, Khalid and Papin, Christophe and Diebold, Marie-Laure and Padmanabhan, Kiran and Marek, Martin and Stoll, Isabelle and Roy, Ludovic and Reilly, Patrick T. and Mak, Tak W. and Dimitrov, Stefan and Romier, Christophe and Hamiche, Ali}, - month = jan, - year = {2014}, - keywords = {Histone variants, biochemistry}, - pages = {648--653}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/E8ASS9VF/Obri et al. - 2014 - ANP32E is a histone chaperone that removes H2A.Z f.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ABBGMVHE/nature12922.html:text/html} -} - -@article{gaffney_controls_2012, - title = {Controls of {Nucleosome} {Positioning} in the {Human} {Genome}}, - volume = {8}, - url = {http://dx.doi.org/10.1371/journal.pgen.1003036}, - doi = {10.1371/journal.pgen.1003036}, - abstract = {Author SummaryWithin the nucleus of the cell, the genome of eukaryotic organisms is tightly packaged into chromatin. Chromatin is composed of a repeating series of bead-like nucleosomes, each of which is encircled 1.7 times by a string of DNA. The organization of nucleosomes on the genome is fundamentally important because they can prevent other proteins from accessing the DNA. Previous studies of human nucleosomes concluded that most nucleosomes have fuzzy positioning and tend to occupy different locations in different cells. This interpretation, however, may be a consequence of the low resolution of existing data. Here we revisit the question of nucleosome positioning by generating the most precise map of nucleosome positions that has ever been created for a human cell line. We find that 8.7\% of nucleosomes have very consistent positioning, and most nucleosomes are more consistently positioned than expected by chance. Additionally, we estimate that almost half of the genome contains regularly spaced arrays of nucleosomes. Much of this positioning is due to the intrinsic preference of nucleosomes for some DNA sequences over others; but in some regions of the genome, the sequence preferences of nucleosomes are overridden by proteins that out-compete them for binding or displace them using energy from ATP.}, - number = {11}, - urldate = {2015-04-20}, - journal = {PLoS Genet}, - author = {Gaffney, Daniel J. and McVicker, Graham and Pai, Athma A. and Fondufe-Mittendorf, Yvonne N. and Lewellen, Noah and Michelini, Katelyn and Widom, Jonathan and Gilad, Yoav and Pritchard, Jonathan K.}, - month = nov, - year = {2012}, - pages = {e1003036}, - file = {PLoS Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ZHPIVPHX/Gaffney et al. - 2012 - Controls of Nucleosome Positioning in the Human Ge.pdf:application/pdf} -} - -@article{freaney_high-density_2014-1, - title = {High-{Density} {Nucleosome} {Occupancy} {Map} of {Human} {Chromosome} 9p21–22 {Reveals} {Chromatin} {Organization} of the {Type} {I} {Interferon} {Gene} {Cluster}}, - issn = {1079-9907, 1557-7465}, - url = {http://online.liebertpub.com/doi/full/10.1089/jir.2013.0118}, - doi = {10.1089/jir.2013.0118}, - language = {en}, - urldate = {2014-04-02}, - journal = {Journal of Interferon \& Cytokine Research}, - author = {Freaney, Jonathan E. and Zhang, Quanwei and Yigit, Erbay and Kim, Rebecca and Widom, Jonathan and Wang, Ji-Ping and Horvath, Curt M.}, - month = mar, - year = {2014}, - pages = {140327155152002}, - file = {High-Density Nucleosome Occupancy Map of Human Chromosome 9p21–\;22 Reveals Chromatin Organization of the Type I Interferon Gene Cluster:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/JGB4EBSI/jir.2013.html:text/html} -} - -@article{kraushaar_genome-wide_2013, - title = {Genome-wide incorporation dynamics reveal distinct categories of turnover for the histone variant {H}3.3}, - volume = {14}, - copyright = {2013 Kraushaar et al.; licensee BioMed Central Ltd.}, - issn = {1465-6906}, - url = {http://genomebiology.com/2013/14/10/R121/abstract}, - doi = {10.1186/gb-2013-14-10-r121}, - abstract = {Nucleosomes are present throughout the genome and must be dynamically regulated to accommodate binding of transcription factors and RNA polymerase machineries by various mechanisms. Despite the development of protocols and techniques that have enabled us to map nucleosome occupancy genome-wide, the dynamic properties of nucleosomes remain poorly understood, particularly in mammalian cells. The histone variant H3.3 is incorporated into chromatin independently of DNA replication and requires displacement of existing nucleosomes for its deposition. Here, we measure H3.3 turnover at high resolution in the mammalian genome in order to present a genome-wide characterization of replication-independent H3.3-nucleosome dynamics. -PMID: 24176123}, - language = {en}, - number = {10}, - urldate = {2014-03-05}, - journal = {Genome Biology}, - author = {Kraushaar, Daniel C. and Jin, Wenfei and Maunakea, Alika and Abraham, Brian and Ha, Misook and Zhao, Keji}, - month = oct, - year = {2013}, - pmid = {24176123}, - pages = {R121}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/VGMR8DN9/Kraushaar et al. - 2013 - Genome-wide incorporation dynamics reveal distinct.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/85RAQECT/R121.html:text/html} -} - -@article{meer_evolution_1998, - title = {Evolution of a {Pathway} for {Chlorobenzene} {Metabolism} {Leads} to {Natural} {Attenuation} in {Contaminated} {Groundwater}}, - volume = {64}, - issn = {0099-2240, 1098-5336}, - url = {http://aem.asm.org/content/64/11/4185}, - abstract = {Complete metabolism of chlorinated benzenes is not a feature that is generally found in aerobic bacteria but is thought to be due to a novel recombination of two separate gene clusters. Such a recombination could be responsible for adaptation of a natural microbial community in response to contamination with synthetic chemicals. This hypothesis was tested in a chlorobenzene (CB)-contaminated aquifer. CB-degrading bacteria from a contaminated site were characterized for a number of years by examining a combination of growth characteristics and DNA-DNA hybridization, PCR, and DNA sequence data. The genetic information obtained for the CB pathway of the predominant microorganism, Ralstonia sp. strain JS705, revealed a unique combination of (partially duplicated) genes for chlorocatechol degradation and genes for a benzene-toluene type of aromatic ring dioxygenase. The organism was detected in CB-polluted groundwater by hybridizing colonies cultivated on low-strength heterotrophic media with probes for the CB pathway. Southern hybridizations performed to determine the organization of the CB pathway genes and the 16S ribosomal DNA indicated that CB-degrading organisms isolated from different wells at the site were identical to JS705. Physiological characterization by the Biolog test system revealed some differences. The genes for the aromatic ring dioxygenase and dihydrodiol dehydrogenase of JS705 were detected in toluene and benzene degraders from the same site. Our results suggest that recent horizontal gene transfer and genetic recombination of existing genes between indigenous microorganisms were the mechanisms for evolution of the catabolic pathway. Evolution of the CB pathway seems to have created the capacity for natural attenuation of CB at the contaminated site.}, - language = {en}, - number = {11}, - urldate = {2014-05-25}, - journal = {Applied and Environmental Microbiology}, - author = {Meer, Jan Roelof van der and Werlen, Christoph and Nishino, Shirley F. and Spain, Jim C.}, - month = nov, - year = {1998}, - pmid = {9797264}, - pages = {4185--4193}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/IZP2BEI3/Meer et al. - 1998 - Evolution of a Pathway for Chlorobenzene Metabolis.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/729ZIE4M/4185.html:text/html} -} - -@article{gevry_histone_2009, - title = {Histone {H}2A.{Z} is essential for estrogen receptor signaling}, - volume = {23}, - issn = {0890-9369, 1549-5477}, - url = {http://genesdev.cshlp.org/content/23/13/1522}, - doi = {10.1101/gad.1787109}, - abstract = {Incorporation of H2A.Z into the chromatin of inactive promoters has been shown to poise genes for their expression. Here we provide strong evidence that H2A.Z is incorporated into the promoter regions of estrogen receptor (ERα) target genes only upon gene induction, and that, in a cyclic pattern. Moreover, members of the human H2A.Z-depositing complex, p400, also follow the same gene recruitment kinetics as H2A.Z. Importantly, cellular depletion of H2A.Z or p400 leads to a severe defect in estrogen signaling, including loss of estrogen-specific cell proliferation. We find that incorporation of H2A.Z within TFF1 promoter chromatin allows nucleosomes to adopt preferential positions along the DNA translational axis. Finally, we provide evidence that H2A.Z is essential to allow estrogen-responsive enhancer function. Taken together, our results provide strong mechanistic insight into how H2A.Z regulates ERα-mediated gene expression and provide a novel link between H2A.Z–p400 and ERα-dependent gene regulation and enhancer function.}, - language = {en}, - number = {13}, - urldate = {2014-03-19}, - journal = {Genes \& Development}, - author = {Gévry, Nicolas and Hardy, Sara and Jacques, Pierre-Étienne and Laflamme, Liette and Svotelis, Amy and Robert, François and Gaudreau, Luc}, - month = jul, - year = {2009}, - pmid = {19515975}, - keywords = {Chromatin, ER, FoxA1, H2A.Z, p400}, - pages = {1522--1533}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/VVSPMKWZ/Gévry et al. - 2009 - Histone H2A.Z is essential for estrogen receptor s.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4AE4WBIG/1522.html:text/html} -} - -@article{placek_histone_2009, - title = {The {Histone} {Variant} {H}3.3 {Regulates} {Gene} {Expression} during {Lytic} {Infection} with {Herpes} {Simplex} {Virus} {Type} 1}, - volume = {83}, - issn = {0022-538X}, - url = {http://www.ncbi.nlm.nih.gov/pmc/articles/PMC2620911/}, - doi = {10.1128/JVI.01276-08}, - abstract = {It has been proposed that incorporation of the histone variant H3.3 within actively transcribed regions of a genome helps to facilitate transcription. In this report we use lytic infection by herpes simplex virus type 1 (HSV-1) as a model to examine the temporal profile of histone H3 incorporation and to determine whether the variant histone H3.3 has a direct effect on transcription. We find that canonical H3.1 and variant H3.3 exhibit distinct temporal associations with the genome in cell lines expressing equal amounts of epitope-tagged H3 variants. At the earliest times examined after infection, the HSV-1 genome is incorporated into chromatin that predominantly contains the variant H3.3, whereas incorporation of canonical H3.1 occurs later in infection and is dependent on replication of the HSV-1 genome. Further, inhibition of H3.3 association, via reduced expression of the H3.3 chaperone HIRA, significantly reduces the levels of HSV-1 mRNA. These findings show that incorporation of H3.3 facilitates transcription, and they provide new evidence for a regulatory role of chromatin composition during HSV-1 acute infection.}, - number = {3}, - urldate = {2014-03-06}, - journal = {Journal of Virology}, - author = {Placek, Brandon J. and Huang, Jing and Kent, Jennifer R. and Dorsey, Jean and Rice, Lyndi and Fraser, Nigel W. and Berger, Shelley L.}, - month = feb, - year = {2009}, - pmid = {19004946}, - pmcid = {PMC2620911}, - pages = {1416--1421}, - file = {PubMed Central Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UVGU9RPW/Placek et al. - 2009 - The Histone Variant H3.3 Regulates Gene Expression.pdf:application/pdf} -} - -@article{iglesias-ussel_hiv_2011, - title = {{HIV} reservoirs: the new frontier}, - volume = {13}, - issn = {1698-6997}, - shorttitle = {{HIV} reservoirs}, - abstract = {Current antiretroviral therapies suppress viremia to very low levels, but are ineffective in eliminating reservoirs of persistent HIV infection. Efforts toward the development of therapies aimed at HIV reservoirs are complicated by the evidence that HIV establishes persistent productive and nonproductive infection in a number of cell types and through a variety of mechanisms. Moreover, immunologically privileged sites such as the brain also act as HIV sanctuaries. To facilitate the advancement of our knowledge in this new area of research, in vitro models of HIV persistence in different cellular reservoirs have been developed, particularly in CD4+ T-cells that represent the largest pool of persistently infected cells in the body. Whereas each model presents clear advantages, they all share one common limitation: they are systems attempting to recapitulate extremely complex virus-cell interactions occurring in vivo, which we know very little about. Potentially conflicting results arising from different models may be difficult to interpret without validation with clinical samples. Addressing these issues, among others, merits careful consideration for the identification of valid targets and the design of effective strategies for therapy, which may increase the success of efforts toward HIV eradication.}, - language = {eng}, - number = {1}, - journal = {AIDS reviews}, - author = {Iglesias-Ussel, Maria D and Romerio, Fabio}, - month = mar, - year = {2011}, - pmid = {21412386}, - keywords = {Anti-HIV Agents, HIV, HIV Infections, Humans, Proviruses, Virus Latency}, - pages = {13--29} -} - -@article{toedling_analyzing_2008, - title = {Analyzing {ChIP}-chip {Data} {Using} {Bioconductor}}, - volume = {4}, - url = {http://dx.doi.org/10.1371/journal.pcbi.1000227}, - doi = {10.1371/journal.pcbi.1000227}, - number = {11}, - urldate = {2014-05-23}, - journal = {PLoS Comput Biol}, - author = {Toedling, Joern and Huber, Wolfgang}, - month = nov, - year = {2008}, - pages = {e1000227}, - file = {PLoS Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/3NNDRGSW/Toedling et Huber - 2008 - Analyzing ChIP-chip Data Using Bioconductor.pdf:application/pdf;PLoS Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/M8UDJD9T/infodoi10.1371journal.pcbi.html:text/html} -} - -@article{kuo_nsd2_2011, - title = {{NSD}2 {Links} {Dimethylation} of {Histone} {H}3 at {Lysine} 36 to {Oncogenic} {Programming}}, - volume = {44}, - issn = {1097-2765}, - url = {http://www.sciencedirect.com/science/article/pii/S1097276511008136}, - doi = {10.1016/j.molcel.2011.08.042}, - abstract = {The histone lysine methyltransferase NSD2 (MMSET/WHSC1) is implicated in diverse diseases and commonly overexpressed in multiple myeloma due to a recurrent t(4;14) chromosomal translocation. However, the precise catalytic activity of NSD2 is obscure, preventing progress in understanding how this enzyme influences chromatin biology and myeloma pathogenesis. Here, we show that dimethylation of histone H3 at lysine 36 (H3K36me2) is the principal chromatin-regulatory activity of NSD2. Catalysis of H3K36me2 by NSD2 is sufficient for gene activation. In t(4;14)-positive myeloma cells, the normal genome-wide and gene-specific distribution of H3K36me2 is obliterated, creating a chromatin landscape that selects for a transcription profile favorable for myelomagenesis. Catalytically active NSD2 confers xenograft tumor formation upon t(4;14)-negative cells and promotes oncogenic transformation of primary cells in an H3K36me2-dependent manner. Together, our findings establish H3K36me2 as the primary product generated by NSD2 and demonstrate that genomic disorganization of this canonical chromatin mark by NSD2 initiates oncogenic programming.}, - number = {4}, - urldate = {2014-03-10}, - journal = {Molecular Cell}, - author = {Kuo, Alex J. and Cheung, Peggie and Chen, Kaifu and Zee, Barry M. and Kioi, Mitomu and Lauring, Josh and Xi, Yuanxin and Park, Ben Ho and Shi, Xiaobing and Garcia, Benjamin A. and Li, Wei and Gozani, Or}, - month = nov, - year = {2011}, - pages = {609--620}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/PGVZ9EZF/Kuo et al. - 2011 - NSD2 Links Dimethylation of Histone H3 at Lysine 3.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/2C2GEZWZ/S1097276511008136.html:text/html} -} - -@article{ryan_snf2-family_2011, - title = {Snf2-family proteins: chromatin remodellers for any occasion}, - volume = {15}, - issn = {1367-5931}, - shorttitle = {Snf2-family proteins}, - url = {http://www.sciencedirect.com/science/article/pii/S1367593111001293}, - doi = {10.1016/j.cbpa.2011.07.022}, - abstract = {Chromatin facilitates the housing of eukaryotic DNA within the nucleus and restricts access to the underlying sequences. Thus, the regulation of chromatin structure provides an excellent platform for regulating processes that require information stored within genomic DNA. Snf2 proteins are a family of helicase-like proteins that direct energy derived from ATP hydrolysis into the mechanical remodelling of chromatin structure. Here, we highlight some of the recent discoveries regarding this family of proteins and show Snf2 proteins have roles in many aspects of genetic metabolism. Recent developments include new insights into the mechanism for nucleosome spacing and histone dimer exchange; together with growing evidence for the involvement of Snf2 proteins in DNA repair.}, - number = {5}, - urldate = {2014-02-28}, - journal = {Current Opinion in Chemical Biology}, - author = {Ryan, Daniel P and Owen-Hughes, Tom}, - month = oct, - year = {2011}, - pages = {649--656}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GRPMT82G/Ryan et Owen-Hughes - 2011 - Snf2-family proteins chromatin remodellers for an.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/32TWSA5S/S1367593111001293.html:text/html} -} - -@article{loftis_brief_2000, - title = {Brief hypoxic stress suppresses postbacteremic {NF}-κ{B} activation and {TNF}-α bioactivity in perfused liver}, - volume = {279}, - copyright = {Copyright © 2000 the American Physiological Society}, - url = {http://ajpregu.physiology.org/content/279/1/R99}, - abstract = {Reductions in hepatic O2 delivery are common early after gram-negative bacteremic sepsis owing to cardiopulmonary dysfunction and derangements in sinusoidal perfusion. Although gram-negative endotoxin and cellular hypoxia independently enhance activation of nuclear factor-κB (NF-κB) via generation of reactive O2 species (ROS), the combination of these stimuli downregulates hepatic TNF-α gene expression. Here we tested the hypothesis that hypoxic suppression of postbacteremic TNF-α gene expression is transcriptionally mediated by reduced activation of NF-κB. Buffer-perfused rat livers (n = 52) were studied over 180 min after intraportal infection at t = 0 with 109 liveEscherichia coli (EC), serotype O55:B5, or 0.9\% NaCl controls under normoxic conditions, compared with 0.5 h of constant-flow hypoxia (Po 2 ∼41 ± 7 Torr) beginning at t = 30 min, followed by 120 min of reoxygenation. In parallel studies, tissue was obtained at peak hypoxia (t = 60 min). To determine the role of xanthine oxidase (XO)-induced ROS in modulating NF-κB activity after hypoxia/reoxygenation (H/R), livers were pretreated with the XO inhibitor allopurinol, with results confirmed in organs of tungstate-fed animals. Electrophoretic mobility shift assays were performed on nuclear extracts of whole liver lysates using32P-labeled oligonucleotides specific for NF-κB. Compared with normoxic EC controls, hypoxia reduced postbacteremic NF-κB nuclear translocation and TNF-α bioactivity, independent of reoxygenation, tissue levels of reduced glutathione, or posthypoxic O2 consumption. XO inhibition reversed the hypoxic suppression of NF-κB nuclear translocation and ameliorated decreases in cell-associated TNF-α. Thus decreases in hepatic O2delivery reduce postbacteremic nuclear translocation of NF-κB and hepatic TNF-α biosynthesis by signaling mechanisms involving low-level generation of XO-mediated ROS.}, - language = {en}, - number = {1}, - urldate = {2014-03-20}, - journal = {American Journal of Physiology - Regulatory, Integrative and Comparative Physiology}, - author = {Loftis, Laura L. and Johanns, Cheryl A. and Lechner, Andrew J. and Matuschak, George M.}, - month = jul, - year = {2000}, - pmid = {10896870}, - note = {Reductions in hepatic O2 delivery are common early after gram-negative bacteremic sepsis owing to cardiopulmonary dysfunction and derangements in sinusoidal perfusion. Although gram-negative endotoxin and cellular hypoxia independently enhance activation of nuclear factor-κB (NF-κB) via generation of reactive O2 species (ROS), the combination of these stimuli downregulates hepatic TNF-α gene expression. Here we tested the hypothesis that hypoxic suppression of postbacteremic TNF-α gene expression is transcriptionally mediated by reduced activation of NF-κB. Buffer-perfused rat livers ( n = 52) were studied over 180 min after intraportal infection at t = 0 with 109 live Escherichia coli (EC), serotype O55:B5, or 0.9\% NaCl controls under normoxic conditions, compared with 0.5 h of constant-flow hypoxia (Po 2 ∼41 ± 7 Torr) beginning at t = 30 min, followed by 120 min of reoxygenation. In parallel studies, tissue was obtained at peak hypoxia ( t = 60 min). To determine the role of xanthine oxidase (XO)-induced ROS in modulating NF-κB activity after hypoxia/reoxygenation (H/R), livers were pretreated with the XO inhibitor allopurinol, with results confirmed in organs of tungstate-fed animals. Electrophoretic mobility shift assays were performed on nuclear extracts of whole liver lysates using32P-labeled oligonucleotides specific for NF-κB. Compared with normoxic EC controls, hypoxia reduced postbacteremic NF-κB nuclear translocation and TNF-α bioactivity, independent of reoxygenation, tissue levels of reduced glutathione, or posthypoxic O2 consumption. XO inhibition reversed the hypoxic suppression of NF-κB nuclear translocation and ameliorated decreases in cell-associated TNF-α. Thus decreases in hepatic O2delivery reduce postbacteremic nuclear translocation of NF-κB and hepatic TNF-α biosynthesis by signaling mechanisms involving low-level generation of XO-mediated ROS.}, - pages = {R99--R108}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/TEEWAM3A/Loftis et al. - 2000 - Brief hypoxic stress suppresses postbacteremic NF-.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/83488U3N/R99.html:text/html} -} - -@article{hutter_long-term_2009, - title = {Long-{Term} {Control} of {HIV} by {CCR}5 {Delta}32/{Delta}32 {Stem}-{Cell} {Transplantation}}, - volume = {360}, - issn = {0028-4793}, - url = {http://www.nejm.org/doi/full/10.1056/NEJMoa0802905}, - doi = {10.1056/NEJMoa0802905}, - abstract = {HIV-1 enters host cells by binding to a CD4 receptor and then interacting with either CCR5 or the CXC chemokine receptor (CXCR4). Homozygosity for a 32-bp deletion (delta32/delta32) in the CCR5 allele results in an inactive CCR5 gene product and consequently confers high resistance against HIV-1 acquisition.1 Allogeneic stem-cell transplantation from an HLA-matched donor is a feasible option for patients with hematologic neoplasms, but it has not been established as a therapeutic option for patients who are also infected with HIV.2 Survival of patients with HIV infection has improved considerably since the introduction of highly active antiretroviral therapy (HAART),3 and . . .}, - number = {7}, - urldate = {2013-11-09}, - journal = {New England Journal of Medicine}, - author = {Hütter, Gero and Nowak, Daniel and Mossner, Maximilian and Ganepola, Susanne and Müßig, Arne and Allers, Kristina and Schneider, Thomas and Hofmann, Jörg and Kücherer, Claudia and Blau, Olga and Blau, Igor W. and Hofmann, Wolf K. and Thiel, Eckhard}, - year = {2009}, - pmid = {19213682}, - pages = {692--698}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/AQP66AKW/Hütter et al. - 2009 - Long-Term Control of HIV by CCR5 Delta32Delta32 S.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ZRJZWKUJ/NEJMoa0802905.html:text/html} -} - -@article{soboleva_unique_2012, - title = {A unique {H}2A histone variant occupies the transcriptional start site of active genes}, - volume = {19}, - copyright = {© 2011 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, - issn = {1545-9993}, - url = {http://www.nature.com/nsmb/journal/v19/n1/full/nsmb.2161.html}, - doi = {10.1038/nsmb.2161}, - abstract = {Transcriptional activation is controlled by chromatin, which needs to be unfolded and remodeled to ensure access to the transcription start site (TSS). However, the mechanisms that yield such an 'open' chromatin structure, and how these processes are coordinately regulated during differentiation, are poorly understood. We identify the mouse (Mus musculus) H2A histone variant H2A.Lap1 as a previously undescribed component of the TSS of active genes expressed during specific stages of spermatogenesis. This unique chromatin landscape also includes a second histone variant, H2A.Z. In the later stages of round spermatid development, H2A.Lap1 dynamically loads onto the inactive X chromosome, enabling the transcriptional activation of previously repressed genes. Mechanistically, we show that H2A.Lap1 imparts unique unfolding properties to chromatin. We therefore propose that H2A.Lap1 coordinately regulates gene expression by directly opening the chromatin structure of the TSS at genes regulated during spermatogenesis.}, - language = {en}, - number = {1}, - urldate = {2014-03-06}, - journal = {Nature Structural \& Molecular Biology}, - author = {Soboleva, Tatiana A. and Nekrasov, Maxim and Pahwa, Anuj and Williams, Rohan and Huttley, Gavin A. and Tremethick, David J.}, - month = jan, - year = {2012}, - pages = {25--30}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6MMNZGF5/Soboleva et al. - 2012 - A unique H2A histone variant occupies the transcri.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GCEE7AFV/nsmb.2161.html:text/html} -} - -@article{katlama_barriers_2013, - title = {Barriers to a cure for {HIV}: new ways to target and eradicate {HIV}-1 reservoirs}, - volume = {381}, - issn = {1474-547X}, - shorttitle = {Barriers to a cure for {HIV}}, - doi = {10.1016/S0140-6736(13)60104-X}, - abstract = {Antiretroviral therapy for HIV infection needs lifelong access and strict adherence to regimens that are both expensive and associated with toxic effects. A curative intervention will be needed to fully stop the epidemic. The failure to eradicate HIV infection during long-term antiretroviral therapy shows the intrinsic stability of the viral genome in latently infected CD4T cells and other cells, and possibly a sustained low-level viral replication. Heterogeneity in latently infected cell populations and homoeostatic proliferation of infected cells might affect the dynamics of virus production and persistence. Despite potent antiretroviral therapy, chronic immune activation, inflammation, and immune dysfunction persist, and are likely to have important effects on the size and distribution of the viral reservoir. The inability of the immune system to recognise cells harbouring latent virus and to eliminate cells actively producing virus is the biggest challenge to finding a cure. We look at new approaches to unravelling the complex virus-host interactions that lead to persistent infection and latency, and discuss the rationale for combination of novel treatment strategies with available antiretroviral treatment options to cure HIV.}, - language = {eng}, - number = {9883}, - journal = {Lancet}, - author = {Katlama, Christine and Deeks, Steven G and Autran, Brigitte and Martinez-Picado, Javier and van Lunzen, Jan and Rouzioux, Christine and Miller, Michael and Vella, Stefano and Schmitz, Joern E and Ahlers, Jeffrey and Richman, Douglas D and Sekaly, Rafick P}, - month = jun, - year = {2013}, - pmid = {23541541}, - keywords = {Anti-HIV Agents, CD4-Positive T-Lymphocytes, CD8-Positive T-Lymphocytes, Drug Therapy, Combination, HIV Infections, HIV-1, Humans, RNA, Viral, Receptors, CCR5, Virus Latency, Virus Replication}, - pages = {2109--2117} -} - -@article{nekrasov_histone_2012, - title = {Histone {H}2A.{Z} inheritance during the cell cycle and its impact on promoter organization and dynamics}, - volume = {19}, - copyright = {© 2012 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, - issn = {1545-9993}, - url = {http://www.nature.com/nsmb/journal/v19/n11/full/nsmb.2424.html}, - doi = {10.1038/nsmb.2424}, - abstract = {Although it has been clearly established that well-positioned histone H2A.Z–containing nucleosomes flank the nucleosome-depleted region (NDR) at the transcriptional start site (TSS) of active mammalian genes, how this chromatin-based information is transmitted through the cell cycle is unknown. We show here that in mouse trophoblast stem cells, the amount of histone H2A.Z at promoters decreased during S phase, coinciding with homotypic (H2A.Z–H2A.Z) nucleosomes flanking the TSS becoming heterotypic (H2A.Z–H2A). To our surprise these nucleosomes remained heterotypic at M phase. At the TSS, we identified an unstable heterotypic histone H2A.Z–containing nucleosome in G1 phase that was lost after DNA replication. These dynamic changes at the TSS mirror a global expansion of the NDR at S and M phases, which, unexpectedly, is unrelated to transcriptional activity. Coincident with the loss of histone H2A.Z at promoters, histone H2A.Z is targeted to the centromere when mitosis begins.}, - language = {en}, - number = {11}, - urldate = {2014-03-06}, - journal = {Nature Structural \& Molecular Biology}, - author = {Nekrasov, Maxim and Amrichova, Jana and Parker, Brian J. and Soboleva, Tatiana A. and Jack, Cameron and Williams, Rohan and Huttley, Gavin A. and Tremethick, David J.}, - month = nov, - year = {2012}, - pages = {1076--1083}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/M8HHCT58/Nekrasov et al. - 2012 - Histone H2A.Z inheritance during the cell cycle an.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/JDJP7H6T/nsmb.2424.html:text/html} -} - -@article{ponia_arginine_2013, - title = {Arginine rich short linear motif of {HIV}-1 regulatory proteins inhibits {Dicer} dependent {RNA} interference}, - volume = {10}, - copyright = {2013 Ponia et al.; licensee BioMed Central Ltd.}, - issn = {1742-4690}, - url = {http://www.retrovirology.com/content/10/1/97/abstract}, - doi = {10.1186/1742-4690-10-97}, - abstract = {Arginine Rich Motif (ARM) of HIV-1 Tat and Rev are extensively studied linear motifs (LMs). They are already established as an inefficient bipartite nuclear localisation signal (NLS). The unusual passive diffusion of HIV-1 NLS tagged reporter proteins across the nucleus is due to an unknown competing functionality of ARM. Recent findings about the role of retroviral proteins as a suppressor of RNA interference (RNAi) involving their basic residues hint an interesting answer to this alternate functionality. The present work explores the role of HIV-1 ARM as a uniquely evolved viral motif to combat Dicer dependent RNAi.}, - language = {en}, - number = {1}, - urldate = {2013-10-22}, - journal = {Retrovirology}, - author = {Ponia, Sanket S. and Arora, Sakshi and Kumar, Binod and Banerjea, Akhil C.}, - month = sep, - year = {2013}, - pmid = {24025624}, - pages = {97}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/MNS6N546/Ponia et al. - 2013 - Arginine rich short linear motif of HIV-1 regulato.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/T8FVTX7G/97.html:text/html} -} - -@article{subramanian_h2a.z_2013, - title = {H2A.{Z} {Acidic} {Patch} {Couples} {Chromatin} {Dynamics} to {Regulation} of {Gene} {Expression} {Programs} during {ESC} {Differentiation}}, - volume = {9}, - url = {http://dx.doi.org/10.1371/journal.pgen.1003725}, - doi = {10.1371/journal.pgen.1003725}, - abstract = {Author SummaryElucidating how regulation of chromatin structure modulates gene expression patterns is fundamental for understanding mammalian development. Replacement of core histones with histone variants has recently emerged as a key mechanism for regulating chromatin states. The histone H2A variant H2A.Z is of particular interest because it is essential for embryonic development and for proper execution of developmental gene expression programs during cellular specification. ESCs provide a good model for investigating the function of H2A.Z during lineage commitment because these cells can generate an unlimited number of equivalent descendants while maintaining the capacity to differentiate into any cell type in the organism. Divergent regions in H2A.Z are likely key for functional specialization, but we know little about how these differences contribute to chromatin regulation. Here, we show that the unique H2A.Z acidic patch domain is necessary for regulation of lineage commitment during ESC differentiation by linking transcription to chromatin dynamics. Our work provides a critical foundation for elucidating how H2A.Z incorporation is key to cell fate determination. These findings are particularly important given that H2A.Z has been implicated in many diseased conditions, including cancer.}, - number = {8}, - urldate = {2014-04-18}, - journal = {PLoS Genet}, - author = {Subramanian, Vidya and Mazumder, Aprotim and Surface, Lauren E. and Butty, Vincent L. and Fields, Paul A. and Alwan, Allison and Torrey, Lillian and Thai, Kevin K. and Levine, Stuart S. and Bathe, Mark and Boyer, Laurie A.}, - month = aug, - year = {2013}, - pages = {e1003725}, - file = {PLoS Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/VG3DZW37/Subramanian et al. - 2013 - H2A.Z Acidic Patch Couples Chromatin Dynamics to R.pdf:application/pdf;PLoS Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/S6K8JWXP/infodoi10.1371journal.pgen.html:text/html} -} - -@article{jin_nucleosome_2007, - title = {Nucleosome stability mediated by histone variants {H}3.3 and {H}2A.{Z}}, - volume = {21}, - issn = {0890-9369, 1549-5477}, - url = {http://genesdev.cshlp.org/content/21/12/1519}, - doi = {10.1101/gad.1547707}, - abstract = {Nucleosomes containing the histone variant H3.3 tend to be clustered in vivo in the neighborhood of transcriptionally active genes and over regulatory elements. It has not been clear, however, whether H3.3-containing nucleosomes possess unique properties that would affect transcription. We report here that H3.3 nucleosomes isolated from vertebrates, regardless of whether they are partnered with H2A or H2A.Z, are unusually sensitive to salt-dependent disruption, losing H2A/H2B or H2A.Z/H2B dimers. Immunoprecipitation studies of nucleosome core particles (NCPs) show that NCPs that contain both H3.3 and H2A.Z are even less stable than NCPs containing H3.3 and H2A. Intriguingly, NCPs containing H3 and H2A.Z are at least as stable as H3/H2A NCPs. These results establish an hierarchy of stabilities for native nucleosomes carrying different complements of variants, and suggest how H2A.Z could play different roles depending on its partners within the NCP. They also are consistent with the idea that H3.3 plays an active role in maintaining accessible chromatin structures in enhancer regions and transcribed regions. Consistent with this idea, promoters and enhancers at transcriptionally active genes and coding regions at highly expressed genes have nucleosomes that simultaneously carry both H3.3 and H2A.Z, and should therefore be extremely sensitive to disruption.}, - language = {en}, - number = {12}, - urldate = {2014-03-11}, - journal = {Genes \& Development}, - author = {Jin, Chunyuan and Felsenfeld, Gary}, - month = jun, - year = {2007}, - pmid = {17575053}, - keywords = {Histone H2A.Z, histone H3.3, nucleosome structure}, - pages = {1519--1529}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/MJRMEA3B/Jin et Felsenfeld - 2007 - Nucleosome stability mediated by histone variants .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/NIJCSPWZ/1519.html:text/html} -} - -@article{yuen_histone_2013, - title = {Histone {H}3.3 {Mutations}: {A} {Variant} {Path} to {Cancer}}, - volume = {24}, - issn = {1535-6108}, - shorttitle = {Histone {H}3.3 {Mutations}}, - url = {http://www.sciencedirect.com/science/article/pii/S1535610813004224}, - doi = {10.1016/j.ccr.2013.09.015}, - abstract = {A host of cancer types exhibit aberrant histone modifications. Recently, distinct and recurrent mutations in a specific histone variant, histone H3.3, have been implicated in a high proportion of malignant pediatric brain cancers. The presence of mutant H3.3 histone disrupts epigenetic posttranslational modifications near genes involved in cancer processes and in brain function. Here, we review possible mechanisms by which mutant H3.3 histones may act to promote tumorigenesis. Furthermore, we discuss how perturbations in normal H3.3 chromatin-related and epigenetic functions may more broadly contribute to the formation of human cancers.}, - number = {5}, - urldate = {2014-03-18}, - journal = {Cancer Cell}, - author = {Yuen, Benjamin T. K. and Knoepfler, Paul S.}, - month = nov, - year = {2013}, - pages = {567--574}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Q36N644D/Yuen et Knoepfler - 2013 - Histone H3.3 Mutations A Variant Path to Cancer.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9TQ4H46H/S1535610813004224.html:text/html} -} - -@article{santisteban_histone_2011, - title = {Histone {Variant} {H}2A.{Z} and {RNA} {Polymerase} {II} {Transcription} {Elongation} ▿}, - volume = {31}, - issn = {0270-7306}, - url = {http://www.ncbi.nlm.nih.gov/pmc/articles/PMC3133230/}, - doi = {10.1128/MCB.01346-10}, - abstract = {Nucleosomes containing histone variant H2A.Z (Htz1) serve to poise quiescent genes for activation and transcriptional initiation. However, little is known about their role in transcription elongation. Here we show that dominant mutations in the elongation genes SPT5 and SPT16 suppress the hypersensitivity of htz1Δ strains to drugs that inhibit elongation, indicating that Htz1 functions at the level of transcription elongation. Direct kinetic measurements of RNA polymerase II (Pol II) movement across the 9.5-kb GAL10p-VPS13 gene revealed that the elongation rate of polymerase is 24\% slower in the absence of Htz1. We provide evidence for two nonexclusive mechanisms. First, we observed that both the phospho-Ser2 levels in the elongating isoform of Pol II and the loading of Spt5 and Elongator over the GAL1 open reading frame (ORF) depend on Htz1. Second, in the absence of Htz1, the density of nucleosome occupancy is increased over the GAL10p-VPS13 ORF and the chromatin is refractory to remodeling during active transcription. These results establish a mechanistic role for Htz1 in transcription elongation and suggest that Htz1-containing nucleosomes facilitate Pol II passage by affecting the correct assembly and modification status of Pol II elongation complexes and by favoring efficient nucleosome remodeling over the gene.}, - number = {9}, - urldate = {2014-03-05}, - journal = {Molecular and Cellular Biology}, - author = {Santisteban, Maria Soledad and Hang, Mingda and Smith, M. Mitchell}, - month = may, - year = {2011}, - pmid = {21357739}, - pmcid = {PMC3133230}, - pages = {1848--1860}, - file = {PubMed Central Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ZPSG29UK/Santisteban et al. - 2011 - Histone Variant H2A.Z and RNA Polymerase II Transc.pdf:application/pdf} -} - -@article{noauthor_notitle_nodate -} - -@article{oh_genome-scale_2007, - title = {Genome-scale {Reconstruction} of {Metabolic} {Network} in {Bacillus} subtilis {Based} on {High}-throughput {Phenotyping} and {Gene} {Essentiality} {Data}}, - volume = {282}, - issn = {0021-9258, 1083-351X}, - url = {http://www.jbc.org/content/282/39/28791}, - doi = {10.1074/jbc.M703759200}, - abstract = {In this report, a genome-scale reconstruction of Bacillus subtilis metabolism and its iterative development based on the combination of genomic, biochemical, and physiological information and high-throughput phenotyping experiments is presented. The initial reconstruction was converted into an in silico model and expanded in a four-step iterative fashion. First, network gap analysis was used to identify 48 missing reactions that are needed for growth but were not found in the genome annotation. Second, the computed growth rates under aerobic conditions were compared with high-throughput phenotypic screen data, and the initial in silico model could predict the outcomes qualitatively in 140 of 271 cases considered. Detailed analysis of the incorrect predictions resulted in the addition of 75 reactions to the initial reconstruction, and 200 of 271 cases were correctly computed. Third, in silico computations of the growth phenotypes of knock-out strains were found to be consistent with experimental observations in 720 of 766 cases evaluated. Fourth, the integrated analysis of the large-scale substrate utilization and gene essentiality data with the genome-scale metabolic model revealed the requirement of 80 specific enzymes (transport, 53; intracellular reactions, 27) that were not in the genome annotation. Subsequent sequence analysis resulted in the identification of genes that could be putatively assigned to 13 intracellular enzymes. The final reconstruction accounted for 844 open reading frames and consisted of 1020 metabolic reactions and 988 metabolites. Hence, the in silico model can be used to obtain experimentally verifiable hypothesis on the metabolic functions of various genes.}, - language = {en}, - number = {39}, - urldate = {2014-04-14}, - journal = {Journal of Biological Chemistry}, - author = {Oh, You-Kwan and Palsson, Bernhard O. and Park, Sung M. and Schilling, Christophe H. and Mahadevan, Radhakrishnan}, - month = sep, - year = {2007}, - pmid = {17573341}, - pages = {28791--28799}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/5HM5ZAU3/Oh et al. - 2007 - Genome-scale Reconstruction of Metabolic Network i.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/U43XD35H/28791.html:text/html} -} - -@article{matsuo_control_2003, - title = {Control {Mechanism} of the {Circadian} {Clock} for {Timing} of {Cell} {Division} in {Vivo}}, - volume = {302}, - issn = {0036-8075, 1095-9203}, - url = {http://www.sciencemag.org/content/302/5643/255}, - doi = {10.1126/science.1086271}, - abstract = {Cell division in many mammalian tissues is associated with specific times of day, but just how the circadian clock controls this timing has not been clear. Here, we show in the regenerating liver (of mice) that the circadian clock controls the expression of cell cycle–related genes that in turn modulate the expression of active Cyclin B1-Cdc2 kinase, a key regulator of mitosis. Among these genes, expression of wee1 was directly regulated by the molecular components of the circadian clockwork. In contrast, the circadian clockwork oscillated independently of the cell cycle in single cells. Thus, the intracellular circadian clockwork can control the cell-division cycle directly and unidirectionally in proliferating cells.}, - language = {en}, - number = {5643}, - urldate = {2014-03-14}, - journal = {Science}, - author = {Matsuo, Takuya and Yamaguchi, Shun and Mitsui, Shigeru and Emi, Aki and Shimoda, Fukuko and Okamura, Hitoshi}, - month = oct, - year = {2003}, - pmid = {12934012}, - pages = {255--259}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6CZ322AZ/Matsuo et al. - 2003 - Control Mechanism of the Circadian Clock for Timin.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/B9K8HK7V/255.html:text/html} -} - -@article{sutcliffe_dynamic_2009, - title = {Dynamic {Histone} {Variant} {Exchange} {Accompanies} {Gene} {Induction} in {T} {Cells}}, - volume = {29}, - issn = {0270-7306, 1098-5549}, - url = {http://mcb.asm.org/content/29/7/1972}, - doi = {10.1128/MCB.01590-08}, - abstract = {Changes in chromatin composition are often a prerequisite for gene induction. Nonallelic histone variants have recently emerged as key players in transcriptional control and chromatin modulation. While the changes in chromatin accessibility and histone posttranslational modification (PTM) distribution that accompany gene induction are well documented, the dynamics of histone variant exchange that parallel these events are still poorly defined. In this study, we have examined the changes in histone variant distribution that accompany activation of the inducible CD69 and heparanase genes in T cells. We demonstrate that the chromatin accessibility increases that accompany the induction of both of these genes are not associated with nucleosome loss but instead are paralleled by changes in histone variant distribution. Specifically, induction of these genes was paralleled by depletion of the H2A.Z histone variant and concomitant deposition of H3.3. Furthermore, H3.3 deposition was accompanied by changes in PTM patterns consistent with H3.3 enriching or depleting different PTMs upon incorporation into chromatin. Nevertheless, we present evidence that these H3.3-borne PTMs can be negated by recruited enzymatic activities. From these observations, we propose that H3.3 deposition may both facilitate chromatin accessibility increases by destabilizing nucleosomes and compete with recruited histone modifiers to alter PTM patterns upon gene induction.}, - language = {en}, - number = {7}, - urldate = {2014-03-19}, - journal = {Molecular and Cellular Biology}, - author = {Sutcliffe, Elissa L. and Parish, Ian A. and He, Yi Qing and Juelich, Torsten and Tierney, M. Louise and Rangasamy, Danny and Milburn, Peter J. and Parish, Christopher R. and Tremethick, David J. and Rao, Sudha}, - month = apr, - year = {2009}, - pmid = {19158270}, - pages = {1972--1986}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GQIWM2IM/Sutcliffe et al. - 2009 - Dynamic Histone Variant Exchange Accompanies Gene .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7W9HF8EG/1972.html:text/html} -} - -@article{edwards_beginners_2013, - title = {Beginner’s guide to comparative bacterial genome analysis using next-generation sequence data}, - volume = {3}, - copyright = {2013 Edwards and Holt; licensee BioMed Central Ltd.}, - issn = {2042-5783}, - url = {http://www.microbialinformaticsj.com/content/3/1/2/abstract}, - doi = {10.1186/2042-5783-3-2}, - abstract = {High throughput sequencing is now fast and cheap enough to be considered part of the toolbox for investigating bacteria, and there are thousands of bacterial genome sequences available for comparison in the public domain. Bacterial genome analysis is increasingly being performed by diverse groups in research, clinical and public health labs alike, who are interested in a wide array of topics related to bacterial genetics and evolution. Examples include outbreak analysis and the study of pathogenicity and antimicrobial resistance. In this beginner’s guide, we aim to provide an entry point for individuals with a biology background who want to perform their own bioinformatics analysis of bacterial genome data, to enable them to answer their own research questions. We assume readers will be familiar with genetics and the basic nature of sequence data, but do not assume any computer programming skills. The main topics covered are assembly, ordering of contigs, annotation, genome comparison and extracting common typing information. Each section includes worked examples using publicly available E. coli data and free software tools, all which can be performed on a desktop computer. -PMID: 23575213}, - language = {en}, - number = {1}, - urldate = {2014-05-25}, - journal = {Microbial Informatics and Experimentation}, - author = {Edwards, David J. and Holt, Kathryn E.}, - month = apr, - year = {2013}, - pmid = {23575213}, - keywords = {Analysis, Bacterial, Comparative, Methods, Microbial, Next generation sequencing, genomics}, - pages = {2}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/VTGNU89C/Edwards et Holt - 2013 - Beginner’s guide to comparative bacterial genome a.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/V9FG8VW9/2.html:text/html} -} - -@article{sundquist_hiv-1_2012, - title = {{HIV}-1 {Assembly}, {Budding}, and {Maturation}}, - volume = {2}, - issn = {2157-1422}, - url = {http://www.ncbi.nlm.nih.gov/pmc/articles/PMC3385941/}, - doi = {10.1101/cshperspect.a006924}, - abstract = {A defining property of retroviruses is their ability to assemble into particles that can leave producer cells and spread infection to susceptible cells and hosts. Virion morphogenesis can be divided into three stages: assembly, wherein the virion is created and essential components are packaged; budding, wherein the virion crosses the plasma membrane and obtains its lipid envelope; and maturation, wherein the virion changes structure and becomes infectious. All of these stages are coordinated by the Gag polyprotein and its proteolytic maturation products, which function as the major structural proteins of the virus. Here, we review our current understanding of the mechanisms of HIV-1 assembly, budding, and maturation, starting with a general overview and then providing detailed descriptions of each of the different stages of virion morphogenesis., The Gag polyprotein and its proteolytic maturation products coordinate all stages of HIV virion morphogenesis.}, - number = {7}, - urldate = {2013-11-10}, - journal = {Cold Spring Harbor Perspectives in Medicine}, - author = {Sundquist, Wesley I. and Krausslich, Hans-Georg}, - month = jul, - year = {2012}, - pmid = {22762019}, - pmcid = {PMC3385941}, - file = {PubMed Central Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/J4DZ7NU5/Sundquist et Krausslich - 2012 - HIV-1 Assembly, Budding, and Maturation.pdf:application/pdf} -} - -@article{usami_escrt_2009, - title = {The {ESCRT} pathway and {HIV}-1 budding}, - volume = {37}, - issn = {0300-5127, 1470-8752}, - url = {http://www.biochemsoctrans.org/bst/037/0181/bst0370181.htm}, - doi = {10.1042/BST0370181}, - number = {1}, - urldate = {2013-11-10}, - journal = {Biochemical Society Transactions}, - author = {Usami, Yoshiko and Popov, Sergei and Popova, Elena and Inoue, Michio and Weissenhorn, Winfried and G. Göttlinger, Heinrich}, - month = feb, - year = {2009}, - pages = {181}, - file = {Biochem. Soc. Trans (2009) 37, 181-184 - Yoshiko Usami and others - ESCRTs\: from Cell Biology to Pathogenesis:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/PCK242SX/bst0370181.html:text/html} -} - -@article{hardy_euchromatic_2009, - title = {The {Euchromatic} and {Heterochromatic} {Landscapes} {Are} {Shaped} by {Antagonizing} {Effects} of {Transcription} on {H}2A.{Z} {Deposition}}, - volume = {5}, - url = {http://dx.doi.org/10.1371/journal.pgen.1000687}, - doi = {10.1371/journal.pgen.1000687}, - abstract = {Author Summary -DNA in living cells is packaged into chromatin by histones and non-histone proteins. This packaging is very dynamic, allowing the controlled access of regulatory proteins such as transcription factors to DNA. Most chromatin is packaged with so-called canonical histones; namely H2A, H2B, H3, and H4. In some regions, however, variant histones replace canonical histones, creating special chromatin regions. Here we show that the variant histone H2A.Z is dynamically recruited to promoter regions where it helps in the recruitment of RNA polymerase II, the enzyme responsible for the first step of gene expression. In addition, we show that H2A.Z also associates randomly in the genome, but these molecules are removed during the passage of RNA polymerase II. In non-transcribed regions, H2A.Z accumulates in large domains called heterochromatin. We propose that a battle between random H2A.Z deposition and RNAPII-dependent H2A.Z eviction shapes the chromatin landscape.}, - number = {10}, - urldate = {2014-03-05}, - journal = {PLoS Genet}, - author = {Hardy, Sara and Jacques, Pierre-Étienne and Gévry, Nicolas and Forest, Audrey and Fortin, Marie-Ève and Laflamme, Liette and Gaudreau, Luc and Robert, François}, - month = oct, - year = {2009}, - pages = {e1000687}, - file = {PLoS Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ZEXKFPEU/Hardy et al. - 2009 - The Euchromatic and Heterochromatic Landscapes Are.pdf:application/pdf;PLoS Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ARIX4RI6/infodoi10.1371journal.pgen.html:text/html} -} - -@article{ishibashi_acetylation_2009, - title = {Acetylation of {Vertebrate} {H}2A.{Z} and {Its} {Effect} on the {Structure} of the {Nucleosome}}, - volume = {48}, - issn = {0006-2960}, - url = {http://www.ncbi.nlm.nih.gov/pmc/articles/PMC2850812/}, - doi = {10.1021/bi900196c}, - abstract = {Purified histone H2A.Z from chicken erythrocytes and a sodium butyrate-treated chicken erythroleukemic cell line was used as a model system to identify the acetylation sites (K4, K7, K11, K13, and K15) and quantify their distribution in this vertebrate histone variant. To understand the role played by acetylation in the modulation of the H2A.Z nucleosome core particle (NCP) stability and conformation, an extensive analysis was conducted on NCPs reconstituted from acetylated forms of histones, including H2A.Z and recombinant H2A.Z (K/Q) acetylation mimic mutants. Although the overall global acetylation of core histones destabilizes the NCP, we found that H2A.Z stabilizes the NCP regardless of its state of acetylation. Interestingly and quite unexpectedly, we found that the change in NCP conformation induced by global histone acetylation is dependent on H2A/H2A.Z acetylation. This suggests that acetylated H2A variants act synergistically with the acetylated forms of the core histone complement to alter the particle conformation. Furthermore, the simultaneous occurrence of H2A.Z and H2A in heteromorphic NCPs that most likely occurs in vivo slightly destabilizes the NCP, but only in the presence of acetylation.}, - number = {22}, - urldate = {2014-04-14}, - journal = {Biochemistry}, - author = {Ishibashi, Toyotaka and Dryhurst, Deanna and Rose, Kristie L. and Shabanowitz, Jeffrey and Hunt, Donald F. and Ausio, Juan}, - month = jun, - year = {2009}, - pmid = {19385636}, - pmcid = {PMC2850812}, - pages = {5007--5017}, - file = {PubMed Central Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/CRZI98CW/Ishibashi et al. - 2009 - Acetylation of Vertebrate H2A.Z and Its Effect on .pdf:application/pdf} -} - -@article{frankel_hiv-1:_1998, - title = {{HIV}-1: {Fifteen} {Proteins} and an {RNA}}, - volume = {67}, - shorttitle = {{HIV}-1}, - url = {http://www.annualreviews.org/doi/abs/10.1146/annurev.biochem.67.1.1}, - doi = {10.1146/annurev.biochem.67.1.1}, - abstract = {Human immunodeficiency virus type 1 is a complex retrovirus encoding 15 distinct proteins. Substantial progress has been made toward understanding the function of each protein, and three-dimensional structures of many components, including portions of the RNA genome, have been determined. This review describes the function of each component in the context of the viral life cycle: the Gag and Env structural proteins MA (matrix), CA (capsid), NC (nucleocapsid), p6, SU (surface), and TM (transmembrane); the Pol enzymes PR (protease), RT (reverse transcriptase), and IN (integrase); the gene regulatory proteins Tat and Rev; and the accessory proteins Nef, Vif, Vpr, and Vpu. The review highlights recent biochemical and structural studies that help clarify the mechanisms of viral assembly, infection, and replication.}, - number = {1}, - urldate = {2013-11-17}, - journal = {Annual Review of Biochemistry}, - author = {Frankel, Alan D. and Young, John A. T.}, - year = {1998}, - pmid = {9759480}, - keywords = {AIDS, Human Immunodeficiency Virus, retrovirus, viral RNA, viral proteins}, - pages = {1--25}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7H59VSJU/Frankel et Young - 1998 - HIV-1 Fifteen Proteins and an RNA.pdf:application/pdf} -} - -@article{brogaard_map_2012, - title = {A map of nucleosome positions in yeast at base-pair resolution}, - volume = {advance online publication}, - copyright = {© 2012 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, - issn = {1476-4687}, - url = {http://www.nature.com/nature/journal/vaop/ncurrent/full/nature11142.html}, - doi = {10.1038/nature11142}, - abstract = {The exact positions of nucleosomes along genomic DNA can influence many aspects of chromosome function. However, existing methods for mapping nucleosomes do not provide the necessary single-base-pair accuracy to determine these positions. Here we develop and apply a new approach for direct mapping of nucleosome centres on the basis of chemical modification of engineered histones. The resulting map locates nucleosome positions genome-wide in unprecedented detail and accuracy. It shows new aspects of the in vivo nucleosome organization that are linked to transcription factor binding, RNA polymerase pausing and the higher-order structure of the chromatin fibre.}, - language = {en}, - urldate = {2014-04-02}, - journal = {Nature}, - author = {Brogaard, Kristin and Xi, Liqun and Wang, Ji-Ping and Widom, Jonathan}, - month = jun, - year = {2012}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/MXTBTQNB/Brogaard et al. - 2012 - A map of nucleosome positions in yeast at base-pai.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/NVGPHXC6/nature11142.html:text/html} -} - -@article{stuart_gene-coexpression_2003, - title = {A {Gene}-{Coexpression} {Network} for {Global} {Discovery} of {Conserved} {Genetic} {Modules}}, - volume = {302}, - issn = {0036-8075, 1095-9203}, - url = {http://www.sciencemag.org/content/302/5643/249}, - doi = {10.1126/science.1087447}, - abstract = {To elucidate gene function on a global scale, we identified pairs of genes that are coexpressed over 3182 DNA microarrays from humans, flies, worms, and yeast. We found 22,163 such coexpression relationships, each of which has been conserved across evolution. This conservation implies that the coexpression of these gene pairs confers a selective advantage and therefore that these genes are functionally related. Manyof these relationships provide strong evidence for the involvement of new genes in core biological functions such as the cell cycle, secretion, and protein expression. We experimentallyconfirmed the predictions implied bysome of these links and identified cell proliferation functions for several genes. By assembling these links into a gene-coexpression network, we found several components that were animal-specific as well as interrelationships between newly evolved and ancient modules.}, - language = {en}, - number = {5643}, - urldate = {2013-12-02}, - journal = {Science}, - author = {Stuart, Joshua M. and Segal, Eran and Koller, Daphne and Kim, Stuart K.}, - month = oct, - year = {2003}, - pmid = {12934013}, - pages = {249--255}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XUXGA5H3/Stuart et al. - 2003 - A Gene-Coexpression Network for Global Discovery o.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/R4S7SIRW/249.html:text/html} -} - -@article{suva_epigenetic_2013, - title = {Epigenetic {Reprogramming} in {Cancer}}, - volume = {339}, - issn = {0036-8075, 1095-9203}, - url = {http://www.sciencemag.org/content/339/6127/1567}, - doi = {10.1126/science.1230184}, - abstract = {The demonstration of induced pluripotency and direct lineage conversion has led to remarkable insights regarding the roles of transcription factors and chromatin regulators in mediating cell state transitions. Beyond its considerable implications for regenerative medicine, this body of work is highly relevant to multiple stages of oncogenesis, from the initial cellular transformation to the hierarchical organization of established malignancies. Here, we review conceptual parallels between the respective biological phenomena, highlighting important interrelationships among transcription factors, chromatin regulators, and preexisting epigenetic states. The shared mechanisms provide insights into oncogenic transformation, tumor heterogeneity, and cancer stem cell models.}, - language = {en}, - number = {6127}, - urldate = {2014-03-11}, - journal = {Science}, - author = {Suvà, Mario L. and Riggi, Nicolo and Bernstein, Bradley E.}, - month = mar, - year = {2013}, - pmid = {23539597}, - pages = {1567--1570}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/AWB7KTNZ/Suvà et al. - 2013 - Epigenetic Reprogramming in Cancer.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/DKI972T7/1567.html:text/html} -} - -@article{ouellet_emergence_2009, - title = {Emergence of a complex relationship between {HIV}-1 and the {microRNA} pathway}, - volume = {487}, - issn = {1064-3745}, - url = {http://www.ncbi.nlm.nih.gov/pmc/articles/PMC2911478/}, - abstract = {Recent experimental evidences support the existence of an increasingly complex and multifaceted interaction between viruses and the microRNA-guided RNA silencing machinery of human cells. The discovery of small interfering RNAs (siRNAs), which are designed to mediate cleavage of specific messenger RNAs (mRNAs), prompted virologists to establish therapeutic strategies based on siRNAs with the aim to suppress replication of several viruses, including human immunodeficiency virus type 1 (HIV-1). It has been appreciated only recently that viral RNAs can also be processed endogenously by the microRNA-generating enzyme Dicer or recognized by cellular miRNAs, in processes that could be viewed as an adapted antiviral defense mechanism. Known to repress mRNA translation through recognition of specific binding sites usually located in their 3′ untranslated region, miRNAs of host or viral origin may exert regulatory effects towards host and/or viral genes and influence viral replication and/or the host response to viral infection. This article summarizes our current state of knowledge on the relationship between HIV-1 and miRNA-guided RNA silencing, and discusses the different aspects of their interaction.}, - urldate = {2013-10-26}, - journal = {Methods in molecular biology (Clifton, N.J.)}, - author = {Ouellet, Dominique L. and Plante, Isabelle and Barat, Corinne and Tremblay, Michel J. and Provost, Patrick}, - year = {2009}, - pmid = {19301659}, - pmcid = {PMC2911478}, - pages = {415--433} -} - -@article{persaud_absence_2013, - title = {Absence of {Detectable} {HIV}-1 {Viremia} after {Treatment} {Cessation} in an {Infant}}, - volume = {369}, - issn = {0028-4793}, - url = {http://www.nejm.org/doi/full/10.1056/NEJMoa1302976}, - doi = {10.1056/NEJMoa1302976}, - abstract = {Nearly 70 million persons have acquired HIV-1 infection since the epidemic was recognized,1 but a “cure” has been documented in one person, known as “the Berlin Patient.”2,3 A cure for HIV-1 infection occurred in this person after he underwent treatment for acute myelogenous leukemia with total ablative chemotherapy, radiation therapy, and stem-cell transplantation with donor cells homozygous for chemokine receptor 5 (CCR5) delta32, with associated graft-versus-host disease. The case of the Berlin Patient shows that long-lived, replication-competent HIV-1 reservoirs can be reduced or cleared sufficiently to permit the discontinuation of ART without subsequent viral rebound. We report data from . . .}, - number = {19}, - urldate = {2013-11-10}, - journal = {New England Journal of Medicine}, - author = {Persaud, Deborah and Gay, Hannah and Ziemniak, Carrie and Chen, Ya Hui and Piatak, Michael and Chun, Tae-Wook and Strain, Matthew and Richman, Douglas and Luzuriaga, Katherine}, - year = {2013}, - pmid = {24152233}, - pages = {1828--1835}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GTF82E2G/Persaud et al. - 2013 - Absence of Detectable HIV-1 Viremia after Treatmen.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/SRNS98KN/NEJMoa1302976.html:text/html} -} - -@article{hamiche_chaperoning_2012, - title = {Chaperoning the histone {H}3 family}, - volume = {1819}, - issn = {1874-9399}, - url = {http://www.sciencedirect.com/science/article/pii/S1874939911001623}, - doi = {10.1016/j.bbagrm.2011.08.009}, - abstract = {Chromatin is a highly dynamic nucleoprotein structure, which orchestrates all nuclear process from DNA replication to DNA repair, from transcription to recombination. The proper in vivo assembly of nucleosome, the basic repeating unit of chromatin, requires the deposition of two H3–H4 dimer pairs followed by the addition of two dimers of H2A and H2B. Histone chaperones are responsible for delivery of histones to the site of chromatin assembly and histone deposition onto DNA, histone exchange and removal. Distinct factors have been found associated with different histone H3 variants, which facilitate their deposition. Unraveling the mechanism of histone deposition by specific chaperones is of key importance to epigenetic regulation. In this review, we focus on histone H3 variants and their deposition mechanisms. This article is part of a Special Issue entitled:Histone chaperones and Chromatin assembly.}, - number = {3–4}, - urldate = {2014-02-18}, - journal = {Biochimica et Biophysica Acta (BBA) - Gene Regulatory Mechanisms}, - author = {Hamiche, Ali and Shuaib, Muhammad}, - month = mar, - year = {2012}, - keywords = {Histone chaperones, chromatin assembly, Histone variants}, - pages = {230--237}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UP4HFUFS/Hamiche et Shuaib - 2012 - Chaperoning the histone H3 family.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/IBMFB4SK/S1874939911001623.html:text/html} -} - -@article{chen_systematic_2012, - title = {Systematic evaluation of factors influencing {ChIP}-seq fidelity}, - volume = {9}, - copyright = {© 2012 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, - issn = {1548-7091}, - url = {http://www.nature.com/nmeth/journal/v9/n6/full/nmeth.1985.html}, - doi = {10.1038/nmeth.1985}, - abstract = {We evaluated how variations in sequencing depth and other parameters influence interpretation of chromatin immunoprecipitation–sequencing (ChIP-seq) experiments. Using Drosophila melanogaster S2 cells, we generated ChIP-seq data sets for a site-specific transcription factor (Suppressor of Hairy-wing) and a histone modification (H3K36me3). We detected a chromatin-state bias: open chromatin regions yielded higher coverage, which led to false positives if not corrected. This bias had a greater effect on detection specificity than any base-composition bias. Paired-end sequencing revealed that single-end data underestimated ChIP-library complexity at high coverage. Removal of reads originating at the same base reduced false-positives but had little effect on detection sensitivity. Even at mappable-genome coverage depth of {\textasciitilde}1 read per base pair, {\textasciitilde}1\% of the narrow peaks detected on a tiling array were missed by ChIP-seq. Evaluation of widely used ChIP-seq analysis tools suggests that adjustments or algorithm improvements are required to handle data sets with deep coverage.}, - language = {en}, - number = {6}, - urldate = {2014-02-24}, - journal = {Nature Methods}, - author = {Chen, Yiwen and Negre, Nicolas and Li, Qunhua and Mieczkowska, Joanna O. and Slattery, Matthew and Liu, Tao and Zhang, Yong and Kim, Tae-Kyung and He, Housheng Hansen and Zieba, Jennifer and Ruan, Yijun and Bickel, Peter J. and Myers, Richard M. and Wold, Barbara J. and White, Kevin P. and Lieb, Jason D. and Liu, X. Shirley}, - month = jun, - year = {2012}, - pages = {609--614}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/FIGGZKFQ/Chen et al. - 2012 - Systematic evaluation of factors influencing ChIP-.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/AJC9XCQC/nmeth.1985.html:text/html} -} - -@article{coiras_understanding_2009, - title = {Understanding {HIV}-1 latency provides clues for the eradication of long-term reservoirs}, - volume = {7}, - copyright = {© 2009 Nature Publishing Group}, - issn = {1740-1526}, - url = {http://www.nature.com/nrmicro/journal/v7/n11/full/nrmicro2223.html}, - doi = {10.1038/nrmicro2223}, - abstract = {HIV-1 can infect both activated and resting, non-dividing cells, following which the viral genome can be permanently integrated into a host cell chromosome. Latent HIV-1 reservoirs are established early during primary infection and constitute a major barrier to eradication, even in the presence of highly active antiretroviral therapy. This Review analyses the molecular mechanisms that are necessary for the establishment of HIV-1 latency and their relationships with different cellular and anatomical reservoirs, and discusses the current treatment strategies for targeting viral persistence in reservoirs, their main limitations and future perspectives.}, - language = {en}, - number = {11}, - urldate = {2013-10-12}, - journal = {Nature Reviews Microbiology}, - author = {Coiras, Mayte and López-Huertas, María Rosa and Pérez-Olmeda, Mayte and Alcamí, José}, - month = nov, - year = {2009}, - pages = {798--812}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/FIBKTQKD/Coiras et al. - 2009 - Understanding HIV-1 latency provides clues for the.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/X5X3FZ62/nrmicro2223.html:text/html} -} - -@article{tamura_inducible_2009, - title = {Inducible {Deposition} of the {Histone} {Variant} {H}3.3 in {Interferon}-stimulated {Genes}}, - volume = {284}, - issn = {0021-9258, 1083-351X}, - url = {http://www.jbc.org/content/284/18/12217}, - doi = {10.1074/jbc.M805651200}, - abstract = {The H3.3 histone variant is synthesized throughout cell cycle and deposited onto chromatin in a replication-independent manner. It is enriched in transcriptionally active regions of chromatin and is implicated in epigenetic memory. The dynamics of H3.3 deposition during transcriptional activation, however, have not been fully studied so far. Here we examined H3.3 incorporation into interferon (IFN)-stimulated genes in confluent mouse NIH3T3 cells expressing H3.3 fused to the yellow fluorescent protein (YFP). Following IFN stimulation, H3.3-YFP was rapidly incorporated into all four IFN-activated genes tested, with the highest enrichment seen in the distal end of the coding region. Surprisingly, H3.3 enrichment in the coding region continued for an extended period of time, long after transcription ceased. The promoter region, although constitutively enriched with H3.3-YFP, did not show an increase in its deposition in response to IFN stimulation. Further, although H3.3-YFP deposition stably remained in non-dividing cells for days after IFN stimulation, it was rapidly diminished in dividing cells. Lastly, we examined the role of H3.3 in IFN-stimulated transcription by a short hairpin RNA approach and found that IFN-stimulated transcription was significantly impaired in H3.3 knockdown cells. Results indicate that H3.3 plays a role in IFN-mediated transcription, and its deposition leaves a prolonged post-transcriptional mark in these genes.}, - language = {en}, - number = {18}, - urldate = {2014-03-06}, - journal = {Journal of Biological Chemistry}, - author = {Tamura, Tomohiko and Smith, Matthew and Kanno, Tomohiko and Dasenbrock, Hormuzdiyer and Nishiyama, Akira and Ozato, Keiko}, - month = may, - year = {2009}, - pmid = {19244243}, - pages = {12217--12225}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6VI5U5CN/Tamura et al. - 2009 - Inducible Deposition of the Histone Variant H3.3 i.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/PBFMKC2I/12217.html:text/html} -} - -@article{noble_quick_2009, - title = {A {Quick} {Guide} to {Organizing} {Computational} {Biology} {Projects}}, - volume = {5}, - url = {http://dx.doi.org/10.1371/journal.pcbi.1000424}, - doi = {10.1371/journal.pcbi.1000424}, - number = {7}, - urldate = {2014-05-23}, - journal = {PLoS Comput Biol}, - author = {Noble, William Stafford}, - month = jul, - year = {2009}, - pages = {e1000424}, - file = {PLoS Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/IMHDIBQE/Noble - 2009 - A Quick Guide to Organizing Computational Biology .pdf:application/pdf;PLoS Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/BMD72C8E/infodoi10.1371journal.pcbi.html:text/html} -} - -@article{billon_precise_2012, - title = {Precise deposition of histone {H}2A.{Z} in chromatin for genome expression and maintenance}, - volume = {1819}, - issn = {1874-9399}, - url = {http://www.sciencedirect.com/science/article/pii/S1874939911001805}, - doi = {10.1016/j.bbagrm.2011.10.004}, - abstract = {Histone variant H2A.Z is essential in higher eukaryotes and has different functions in the cell. Several studies indicate that H2A.Z is found at specific loci in the genome such as regulatory-gene regions, where it poises genes for transcription. Its deposition creates chromatin regions with particular structural characteristics which could favor rapid transcription activation. This review focuses on the highly regulated mechanism of H2A.Z deposition in chromatin which is essential for genome integrity. Chaperones escort H2A.Z to large ATP-dependent chromatin remodeling enzymes which are responsible for its deposition/eviction. Over the last ten years, biochemical, genetic and genomic studies helped us understand the precise role of these complexes in this process. It has been suggested that a cooperation occurs between histone acetyltransferase and chromatin remodeling activities to incorporate H2A.Z in chromatin. Its regulated deposition near centromeres and telomeres also shows its implication in chromosomal structure integrity and parallels a role in DNA damage response. The dynamics of H2A.Z deposition/eviction at specific loci was shown to be critical for genome expression and maintenance, thus cell fate. Altogether, recent findings reassert the importance of the regulated deposition of this histone variant. This article is part of a Special Issue entitled: Histone chaperones and Chromatin assembly.}, - number = {3–4}, - urldate = {2014-02-24}, - journal = {Biochimica et Biophysica Acta (BBA) - Gene Regulatory Mechanisms}, - author = {Billon, Pierre and Côté, Jacques}, - month = mar, - year = {2012}, - keywords = {Chz1, H2A.Z, Histone variant, Htz1, INO80, NuA4, SRCAP, SWR1, p400}, - pages = {290--302}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/K4VKDUAF/Billon et Côté - 2012 - Precise deposition of histone H2A.Z in chromatin f.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9B4SCGRM/S1874939911001805.html:text/html} -} - -@article{ivashkiv_regulation_2014, - title = {Regulation of type {I} interferon responses}, - volume = {14}, - copyright = {© 2014 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, - issn = {1474-1733}, - url = {http://www.nature.com/nri/journal/v14/n1/full/nri3581.html}, - doi = {10.1038/nri3581}, - abstract = {Type I interferons (IFNs) activate intracellular antimicrobial programmes and influence the development of innate and adaptive immune responses. Canonical type I IFN signalling activates the Janus kinase (JAK)–signal transducer and activator of transcription (STAT) pathway, leading to transcription of IFN-stimulated genes (ISGs). Host, pathogen and environmental factors regulate the responses of cells to this signalling pathway and thus calibrate host defences while limiting tissue damage and preventing autoimmunity. Here, we summarize the signalling and epigenetic mechanisms that regulate type I IFN-induced STAT activation and ISG transcription and translation. These regulatory mechanisms determine the biological outcomes of type I IFN responses and whether pathogens are cleared effectively or chronic infection or autoimmune disease ensues.}, - language = {en}, - number = {1}, - urldate = {2014-03-29}, - journal = {Nature Reviews Immunology}, - author = {Ivashkiv, Lionel B. and Donlin, Laura T.}, - month = jan, - year = {2014}, - pages = {36--49}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/AWN8I5QK/Ivashkiv et Donlin - 2014 - Regulation of type I interferon responses.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4KBG8W8S/nri3581.html:text/html} -} - -@article{feist_reconstruction_2009, - title = {Reconstruction of biochemical networks in microorganisms}, - volume = {7}, - copyright = {© 2008 Nature Publishing Group}, - issn = {1740-1526}, - url = {http://www.nature.com/nrmicro/journal/v7/n2/full/nrmicro1949.html}, - doi = {10.1038/nrmicro1949}, - abstract = {Systems analysis of metabolic and growth functions in microbial organisms is rapidly developing and maturing. Such studies are enabled by reconstruction, at the genomic scale, of the biochemical reaction networks that underlie cellular processes. The network reconstruction process is organism specific and is based on an annotated genome sequence, high-throughput network-wide data sets and bibliomic data on the detailed properties of individual network components. Here we describe the process that is currently used to achieve comprehensive network reconstructions and discuss how these reconstructions are curated and validated. This Review should aid the growing number of researchers who are carrying out reconstructions for particular target organisms.}, +@article{nozaki_tight_2011, + title = {Tight associations between transcription promoter type and epigenetic variation in histone positioning and modification}, + volume = {12}, + copyright = {2011 Nozaki et al; licensee BioMed Central Ltd.}, + issn = {1471-2164}, + url = {http://www.biomedcentral.com/1471-2164/12/416/abstract}, + doi = {10.1186/1471-2164-12-416}, + abstract = {PMID: 21846408}, language = {en}, - number = {2}, - urldate = {2014-05-19}, - journal = {Nature Reviews Microbiology}, - author = {Feist, Adam M. and Herrgård, Markus J. and Thiele, Ines and Reed, Jennie L. and Palsson, Bernhard Ø}, - month = feb, - year = {2009}, - pages = {129--143}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ECKV3S8Q/Feist et al. - 2009 - Reconstruction of biochemical networks in microorg.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/482KCXMF/nrmicro1949.html:text/html} -} - -@article{brickner_transcriptional_2010, - title = {Transcriptional {Memory}: {Staying} in the {Loop}}, - volume = {20}, - issn = {0960-9822}, - shorttitle = {Transcriptional {Memory}}, - url = {http://www.sciencedirect.com/science/article/pii/S0960982209019885}, - doi = {10.1016/j.cub.2009.11.013}, - abstract = {Actively transcribed genes are organized into loops in which the 5′ and 3′ ends of the gene physically associate. Two new papers show that gene looping can persist after genes are repressed, promoting rapid reactivation of transcription, a phenomenon known as transcriptional memory.}, number = {1}, - urldate = {2014-02-24}, - journal = {Current Biology}, - author = {Brickner, Jason H.}, - month = jan, - year = {2010}, - pages = {R20--R21}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/H54ZINRP/Brickner - 2010 - Transcriptional Memory Staying in the Loop.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/BSBHJAR6/S0960982209019885.html:text/html} -} - -@article{xiao_discovering_2012, - title = {Discovering {Dysfunction} of {Multiple} {MicroRNAs} {Cooperation} in {Disease} by a {Conserved} {MicroRNA} {Co}-{Expression} {Network}}, - volume = {7}, - url = {http://dx.doi.org/10.1371/journal.pone.0032201}, - doi = {10.1371/journal.pone.0032201}, - abstract = {MicroRNAs, a new class of key regulators of gene expression, have been shown to be involved in diverse biological processes and linked to many human diseases. To elucidate miRNA function from a global perspective, we constructed a conserved miRNA co-expression network by integrating multiple human and mouse miRNA expression data. We found that these conserved co-expressed miRNA pairs tend to reside in close genomic proximity, belong to common families, share common transcription factors, and regulate common biological processes by targeting common components of those processes based on miRNA targets and miRNA knockout/transfection expression data, suggesting their strong functional associations. We also identified several co-expressed miRNA sub-networks. Our analysis reveals that many miRNAs in the same sub-network are associated with the same diseases. By mapping known disease miRNAs to the network, we identified three cancer-related miRNA sub-networks. Functional analyses based on targets and miRNA knockout/transfection data consistently show that these sub-networks are significantly involved in cancer-related biological processes, such as apoptosis and cell cycle. Our results imply that multiple co-expressed miRNAs can cooperatively regulate a given biological process by targeting common components of that process, and the pathogenesis of disease may be associated with the abnormality of multiple functionally cooperative miRNAs rather than individual miRNAs. In addition, many of these co-expression relationships provide strong evidence for the involvement of new miRNAs in important biological processes, such as apoptosis, differentiation and cell cycle, indicating their potential disease links.}, - number = {2}, - urldate = {2013-12-02}, - journal = {PLoS ONE}, - author = {Xiao, Yun and Xu, Chaohan and Guan, Jinxia and Ping, Yanyan and Fan, Huihui and Li, Yiqun and Zhao, Hongying and Li, Xia}, - month = feb, - year = {2012}, - pages = {e32201}, - file = {PLoS Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HTPB84QM/Xiao et al. - 2012 - Discovering Dysfunction of Multiple MicroRNAs Coop.pdf:application/pdf;PLoS Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/W5P68JZ6/infodoi10.1371journal.pone.html:text/html} -} - -@article{zeng_principles_2006, - title = {Principles of micro-{RNA} production and maturation}, - volume = {25}, - copyright = {© 2006 Nature Publishing Group}, - issn = {0950-9232}, - url = {http://www.nature.com/onc/journal/v25/n46/full/1209908a.html}, - doi = {10.1038/sj.onc.1209908}, - abstract = {Micro-RNAs (miRNAs) are a class of approximately 22-nucleotide non-coding RNAs expressed in multicellular organisms. They are first transcribed in a similar manner to pre-mRNAs. The transcripts then go through a series of processing steps, including endonucleolytic cleavage, nuclear export and a strand selection procedure, to yield the single-stranded mature miRNA products. The transcription and processing of miRNAs determines the abundance and the sequence of mature miRNAs and has important implications for the function of miRNAs.}, - language = {en}, - number = {46}, - urldate = {2013-10-27}, - journal = {Oncogene}, - author = {Zeng, Y.}, - year = {2006}, - keywords = {Drosha, micro-RNA, micro-RNA processing, precursor miRNAs}, - pages = {6156--6162}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/8JWTU8UN/Zeng - 2006 - Principles of micro-RNA production and maturation.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/TU3UG5BB/1209908a.html:text/html} -} - -@article{szenker_double_2011, - title = {The double face of the histone variant {H}3.3}, - volume = {21}, - issn = {1001-0602}, - url = {http://www.ncbi.nlm.nih.gov/pmc/articles/PMC3193428/}, - doi = {10.1038/cr.2011.14}, - abstract = {Histone proteins wrap DNA to form nucleosome particles that compact eukaryotic genomes while still allowing access for cellular processes such as transcription, replication and DNA repair. Histones exist as different variants that have evolved crucial roles in specialized functions in addition to their fundamental role in packaging DNA. H3.3 – a conserved histone variant that is structurally very close to the canonical histone H3 – has been associated with active transcription. Furthermore, its role in histone replacement at active genes and promoters is highly conserved and has been proposed to participate in the epigenetic transmission of active chromatin states. Unexpectedly, recent data have revealed accumulation of this specific variant at silent loci in pericentric heterochromatin and telomeres, raising questions concerning the actual function of H3.3. In this review, we describe the known properties of H3.3 and the current view concerning its incorporation modes involving particular histone chaperones. Finally, we discuss the functional significance of the use of this H3 variant, in particular during germline formation and early development in different species.}, - number = {3}, - urldate = {2014-02-18}, - journal = {Cell Research}, - author = {Szenker, Emmanuelle and Ray-Gallet, Dominique and Almouzni, Genevieve}, - month = mar, - year = {2011}, - pmid = {21263457}, - pmcid = {PMC3193428}, - pages = {421--434}, - file = {PubMed Central Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/MED88XHV/Szenker et al. - 2011 - The double face of the histone variant H3.3.pdf:application/pdf} -} - -@article{donahue_cellular_2013, - title = {Cellular and molecular mechanisms involved in the establishment of {HIV}-1 latency}, - volume = {10}, - issn = {1742-4690}, - doi = {10.1186/1742-4690-10-11}, - abstract = {Latently infected cells represent the major barrier to either a sterilizing or a functional HIV-1 cure. Multiple approaches to reactivation and depletion of the latent reservoir have been attempted clinically, but full depletion of this compartment remains a long-term goal. Compared to the mechanisms involved in the maintenance of HIV-1 latency and the pathways leading to viral reactivation, less is known about the establishment of latent infection. This review focuses on how HIV-1 latency is established at the cellular and molecular levels. We first discuss how latent infection can be established following infection of an activated CD4 T-cell that undergoes a transition to a resting memory state and also how direct infection of a resting CD4 T-cell can lead to latency. Various animal, primary cell, and cell line models also provide insights into this process and are discussed with respect to the routes of infection that result in latency. A number of molecular mechanisms that are active at both transcriptional and post-transcriptional levels have been associated with HIV-1 latency. Many, but not all of these, help to drive the establishment of latent infection, and we review the evidence in favor of or against each mechanism specifically with regard to the establishment of latency. We also discuss the role of immediate silent integration of viral DNA versus silencing of initially active infections. Finally, we discuss potential approaches aimed at limiting the establishment of latent infection.}, - language = {eng}, - journal = {Retrovirology}, - author = {Donahue, Daniel A and Wainberg, Mark A}, - year = {2013}, - pmid = {23375003}, - keywords = {CD4-Positive T-Lymphocytes, Epigenesis, Genetic, HIV-1, Host-Pathogen Interactions, Humans, Models, Biological, Transcription, Genetic, Virus Latency}, - pages = {11} -} - -@article{kile_art_2005, - title = {The art and design of genetic screens: mouse}, - volume = {6}, - copyright = {© 2005 Nature Publishing Group}, - issn = {1471-0056}, - shorttitle = {The art and design of genetic screens}, - url = {http://www.nature.com/nrg/journal/v6/n7/full/nrg1636.html}, - doi = {10.1038/nrg1636}, - abstract = {Humans are mammals, not bacteria or plants, yeast or nematodes, insects or fish. Mice are also mammals, but unlike gorilla and goat, fox and ferret, giraffe and jackal, they are suited perfectly to the laboratory environment and genetic experimentation. In this review, we will summarize the tools, tricks and techniques for executing forward genetic screens in the mouse and argue that this approach is now accessible to most biologists, rather than being the sole domain of large national facilities and specialized genetics laboratories.}, - language = {en}, - number = {7}, - urldate = {2014-03-30}, - journal = {Nature Reviews Genetics}, - author = {Kile, Benjamin T. and Hilton, Douglas J.}, - month = jul, - year = {2005}, - pages = {557--567}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Z9ZWDCZW/Kile et Hilton - 2005 - The art and design of genetic screens mouse.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/BC5GKG9A/nrg1636.html:text/html} -} - -@article{brawand_evolution_2011, - title = {The evolution of gene expression levels in mammalian organs}, - volume = {478}, - copyright = {© 2011 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, - issn = {0028-0836}, - url = {http://www.nature.com/nature/journal/v478/n7369/full/nature10532.html}, - doi = {10.1038/nature10532}, - abstract = {Changes in gene expression are thought to underlie many of the phenotypic differences between species. However, large-scale analyses of gene expression evolution were until recently prevented by technological limitations. Here we report the sequencing of polyadenylated RNA from six organs across ten species that represent all major mammalian lineages (placentals, marsupials and monotremes) and birds (the evolutionary outgroup), with the goal of understanding the dynamics of mammalian transcriptome evolution. We show that the rate of gene expression evolution varies among organs, lineages and chromosomes, owing to differences in selective pressures: transcriptome change was slow in nervous tissues and rapid in testes, slower in rodents than in apes and monotremes, and rapid for the X chromosome right after its formation. Although gene expression evolution in mammals was strongly shaped by purifying selection, we identify numerous potentially selectively driven expression switches, which occurred at different rates across lineages and tissues and which probably contributed to the specific organ biology of various mammals.}, - language = {en}, - number = {7369}, - urldate = {2013-12-13}, - journal = {Nature}, - author = {Brawand, David and Soumillon, Magali and Necsulea, Anamaria and Julien, Philippe and Csárdi, Gábor and Harrigan, Patrick and Weier, Manuela and Liechti, Angélica and Aximu-Petri, Ayinuer and Kircher, Martin and Albert, Frank W. and Zeller, Ulrich and Khaitovich, Philipp and Grützner, Frank and Bergmann, Sven and Nielsen, Rasmus and Pääbo, Svante and Kaessmann, Henrik}, - month = oct, + urldate = {2015-04-17}, + journal = {BMC Genomics}, + author = {Nozaki, Tadasu and Yachie, Nozomu and Ogawa, Ryu and Kratz, Anton and Saito, Rintaro and Tomita, Masaru}, + month = aug, year = {2011}, - keywords = {Genetics and genomics, evolution}, - pages = {343--348}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6DK5GSIU/Brawand et al. - 2011 - The evolution of gene expression levels in mammali.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/MDIF5DKV/nature10532.html:text/html} + pmid = {21846408}, + pages = {416}, + file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/5NVIJMZH/Nozaki et al. - 2011 - Tight associations between transcription promoter .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4R8FAQ3F/416.html:text/html} } -@article{gorry_diminished_1999, - title = {Diminished {Production} of {Human} {Immunodeficiency} {Virus} {Type} 1 in {Astrocytes} {Results} from {Inefficient} {Translation} ofgag, env, and nef {mRNAs} despite {Efficient} {Expression} of {Tat} and {Rev}}, - volume = {73}, - issn = {0022-538X, 1098-5514}, - url = {http://jvi.asm.org/content/73/1/352}, - abstract = {Astrocytes infected with human immunodeficiency virus type 1 (HIV-1) produce only minimal quantities of virus. The molecular events that limit acute-phase HIV-1 infection of astrocytes were examined after inducing acute-phase replication by transfection with the pNL4-3 proviral plasmid. The levels of HIV-1 mRNA were similarly high in both astrocytes and HeLa cells, but astrocytes produced approximately 50-fold less supernatant p24 than HeLa cells. We found that diminished HIV-1 production in astrocytes resulted from inefficient translation ofgag, env, and nef mRNAs that were efficiently transported to the cytoplasm. Tat- or Rev-dependent reporter constructs showed no defect in Tat or Rev function in astrocytes compared with HeLa cells. HIV-1 mRNAs were correctly spliced, but only Rev and Tat proteins were efficiently translated from their native mRNAs. Pulse-chase labelling and immunoblot experiments revealed no defect in protein processing, but levels of Gag, Env, or Nef protein expressed were dramatically reduced in astrocytes compared to HeLa cells. These results demonstrate that inefficient translation of HIV-1 structural proteins underlies the restricted infection of astrocytes. The efficient expression of functional Tat and Rev by astrocytes may contribute to HIV-1 neuropathogenesis.}, - language = {en}, - number = {1}, - urldate = {2013-11-05}, - journal = {Journal of Virology}, - author = {Gorry, Paul R. and Howard, Jane L. and Churchill, Melissa J. and Anderson, Jenny L. and Cunningham, Anthony and Adrian, Deborah and McPhee, Dale A. and Purcell, Damian F. J.}, +@article{boyle_high-resolution_2008, + title = {High-{Resolution} {Mapping} and {Characterization} of {Open} {Chromatin} across the {Genome}}, + volume = {132}, + issn = {0092-8674}, + url = {http://www.sciencedirect.com/science/article/pii/S0092867407016133}, + doi = {10.1016/j.cell.2007.12.014}, + abstract = {Summary +Mapping DNase I hypersensitive (HS) sites is an accurate method of identifying the location of genetic regulatory elements, including promoters, enhancers, silencers, insulators, and locus control regions. We employed high-throughput sequencing and whole-genome tiled array strategies to identify DNase I HS sites within human primary CD4+ T cells. Combining these two technologies, we have created a comprehensive and accurate genome-wide open chromatin map. Surprisingly, only 16\%–21\% of the identified 94,925 DNase I HS sites are found in promoters or first exons of known genes, but nearly half of the most open sites are in these regions. In conjunction with expression, motif, and chromatin immunoprecipitation data, we find evidence of cell-type-specific characteristics, including the ability to identify transcription start sites and locations of different chromatin marks utilized in these cells. In addition, and unexpectedly, our analyses have uncovered detailed features of nucleosome structure.}, + number = {2}, + urldate = {2015-09-11}, + journal = {Cell}, + author = {Boyle, Alan P. and Davis, Sean and Shulha, Hennady P. and Meltzer, Paul and Margulies, Elliott H. and Weng, Zhiping and Furey, Terrence S. and Crawford, Gregory E.}, month = jan, - year = {1999}, - pmid = {9847339}, - pages = {352--361}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RT4SSRH5/Gorry et al. - 1999 - Diminished Production of Human Immunodeficiency Vi.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RBF48PI4/352.html:text/html} + year = {2008}, + keywords = {DNA}, + pages = {311--322}, + file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/AT3JAG9P/Boyle et al. - 2008 - High-Resolution Mapping and Characterization of Op.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/W2KDFIGZ/S0092867407016133.html:text/html} } -@article{creyghton_h2az_2008, - title = {H2AZ {Is} {Enriched} at {Polycomb} {Complex} {Target} {Genes} in {ES} {Cells} and {Is} {Necessary} for {Lineage} {Commitment}}, - volume = {135}, +@article{barski_high-resolution_2007, + title = {High-{Resolution} {Profiling} of {Histone} {Methylations} in the {Human} {Genome}}, + volume = {129}, issn = {0092-8674}, - url = {http://www.sciencedirect.com/science/article/pii/S009286740801252X}, - doi = {10.1016/j.cell.2008.09.056}, - abstract = {Elucidating how chromatin influences gene expression patterns and ultimately cell fate is fundamental to understanding development and disease. The histone variant H2AZ has emerged as a key regulator of chromatin function and plays an essential but unknown role during mammalian development. Here, genome-wide analysis reveals that H2AZ occupies the promoters of developmentally important genes in a manner that is remarkably similar to that of the Polycomb group (PcG) protein Suz12. By using RNAi, we demonstrate a role for H2AZ in regulating target gene expression, find that H2AZ and PcG protein occupancy is interdependent at promoters, and further show that H2AZ is necessary for ES cell differentiation. Notably, H2AZ occupies a different subset of genes in lineage-committed cells, suggesting that its dynamic redistribution is necessary for cell fate transitions. Thus, H2AZ, together with PcG proteins, may establish specialized chromatin states in ES cells necessary for the proper execution of developmental gene expression programs.}, + url = {http://www.sciencedirect.com/science/article/pii/S0092867407006009}, + doi = {10.1016/j.cell.2007.05.009}, + abstract = {Histone modifications are implicated in influencing gene expression. We have generated high-resolution maps for the genome-wide distribution of 20 histone lysine and arginine methylations as well as histone variant H2A.Z, RNA polymerase II, and the insulator binding protein CTCF across the human genome using the Solexa 1G sequencing technology. Typical patterns of histone methylations exhibited at promoters, insulators, enhancers, and transcribed regions are identified. The monomethylations of H3K27, H3K9, H4K20, H3K79, and H2BK5 are all linked to gene activation, whereas trimethylations of H3K27, H3K9, and H3K79 are linked to repression. H2A.Z associates with functional regulatory elements, and CTCF marks boundaries of histone methylation domains. Chromosome banding patterns are correlated with unique patterns of histone modifications. Chromosome breakpoints detected in T cell cancers frequently reside in chromatin regions associated with H3K4 methylations. Our data provide new insights into the function of histone methylation and chromatin organization in genome function.}, number = {4}, - urldate = {2014-03-07}, + urldate = {2014-03-05}, journal = {Cell}, - author = {Creyghton, Menno P. and Markoulaki, Styliani and Levine, Stuart S. and Hanna, Jacob and Lodato, Michael A. and Sha, Ky and Young, Richard A. and Jaenisch, Rudolf and Boyer, Laurie A.}, - month = nov, - year = {2008}, - keywords = {DNA, STEMCELL}, - pages = {649--661}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/H7862I5Q/Creyghton et al. - 2008 - H2AZ Is Enriched at Polycomb Complex Target Genes .pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7QH9JMNB/S009286740801252X.html:text/html} + author = {Barski, Artem and Cuddapah, Suresh and Cui, Kairong and Roh, Tae-Young and Schones, Dustin E. and Wang, Zhibin and Wei, Gang and Chepelev, Iouri and Zhao, Keji}, + month = may, + year = {2007}, + keywords = {DNA, PROTEINS, SYSBIO}, + pages = {823--837}, + file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/QUNNP84A/Barski et al. - 2007 - High-Resolution Profiling of Histone Methylations .pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/AD6CEICR/S0092867407006009.html:text/html} } -@article{althaus_tailored_2012, - title = {Tailored enrichment strategy detects low abundant small noncoding {RNAs} in {HIV}-1 infected cells}, +@article{bailey_practical_2013, + title = {Practical {Guidelines} for the {Comprehensive} {Analysis} of {ChIP}-seq {Data}}, volume = {9}, - issn = {1742-4690}, - url = {http://www.ncbi.nlm.nih.gov/pmc/articles/PMC3341194/}, - doi = {10.1186/1742-4690-9-27}, - abstract = {Background -The various classes of small noncoding RNAs (sncRNAs) are important regulators of gene expression across divergent types of organisms. While a rapidly increasing number of sncRNAs has been identified over recent years, the isolation of sncRNAs of low abundance remains challenging. Virally encoded sncRNAs, particularly those of RNA viruses, can be expressed at very low levels. This is best illustrated by HIV-1 where virus encoded sncRNAs represent approximately 0.1-1.0\% of all sncRNAs in HIV-1 infected cells or were found to be undetected. Thus, we applied a novel, sequence targeted enrichment strategy to capture HIV-1 derived sncRNAs in HIV-1 infected primary CD4+ T-lymphocytes and macrophages that allows a greater than 100-fold enrichment of low abundant sncRNAs. - -Results -Eight hundred and ninety-two individual HIV-1 sncRNAs were cloned and sequenced from nine different sncRNA libraries derived from five independent experiments. These clones represent up to 90\% of all sncRNA clones in the generated libraries. Two hundred and sixteen HIV-1 sncRNAs were distinguishable as unique clones. They are spread throughout the HIV-1 genome, however, forming certain clusters, and almost 10\% show an antisense orientation. The length of HIV-1 sncRNAs varies between 16 and 89 nucleotides with an unexpected peak at 31 to 50 nucleotides, thus, longer than cellular microRNAs or short-interfering RNAs (siRNAs). Exemplary HIV-1 sncRNAs were also generated in cells infected with different primary HIV-1 isolates and can inhibit HIV-1 replication. - -Conclusions -HIV-1 infected cells generate virally encoded sncRNAs, which might play a role in the HIV-1 life cycle. Furthermore, the enormous capacity to enrich low abundance sncRNAs in a sequence specific manner highly recommends our selection strategy for any type of investigation where origin or target sequences of the sought-after sncRNAs are known.}, - urldate = {2013-10-29}, - journal = {Retrovirology}, - author = {Althaus, Claudia F and Vongrad, Valentina and Niederost, Barbara and Joos, Beda and Di Giallonardo, Francesca and Rieder, Philip and Pavlovic, Jovan and Trkola, Alexandra and Gunthard, Huldrych F and Metzner, Karin J and Fischer, Marek}, - month = mar, - year = {2012}, - pmid = {22458358}, - pmcid = {PMC3341194}, - pages = {27}, - file = {PubMed Central Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HPJAHU6E/Althaus et al. - 2012 - Tailored enrichment strategy detects low abundant .pdf:application/pdf} -} - -@article{lassen_nuclear_2006, - title = {Nuclear {Retention} of {Multiply} {Spliced} {HIV}-1 {RNA} in {Resting} {CD}4+ {T} {Cells}}, - volume = {2}, - issn = {1553-7366}, - url = {http://www.ncbi.nlm.nih.gov/pmc/articles/PMC1487174/}, - doi = {10.1371/journal.ppat.0020068}, - abstract = {HIV-1 latency in resting CD4+ T cells represents a major barrier to virus eradication in patients on highly active antiretroviral therapy (HAART). We describe here a novel post-transcriptional block in HIV-1 gene expression in resting CD4+ T cells from patients on HAART. This block involves the aberrant localization of multiply spliced (MS) HIV-1 RNAs encoding the critical positive regulators Tat and Rev. Although these RNAs had no previously described export defect, we show that they exhibit strict nuclear localization in resting CD4+ T cells from patients on HAART. Overexpression of the transcriptional activator Tat from non-HIV vectors allowed virus production in these cells. Thus, the nuclear retention of MS HIV-1 RNA interrupts a positive feedback loop and contributes to the non-productive nature of infection of resting CD4+ T cells. To define the mechanism of nuclear retention, proteomic analysis was used to identify proteins that bind MS HIV-1 RNA. Polypyrimidine tract binding protein (PTB) was identified as an HIV-1 RNA-binding protein differentially expressed in resting and activated CD4+ T cells. Overexpression of PTB in resting CD4+ T cells from patients on HAART allowed cytoplasmic accumulation of HIV-1 RNAs. PTB overexpression also induced virus production by resting CD4+ T cells. Virus culture experiments showed that overexpression of PTB in resting CD4+ T cells from patients on HAART allowed release of replication-competent virus, while preserving a resting cellular phenotype. Whether through effects on RNA export or another mechanism, the ability of PTB to reverse latency without inducing cellular activation is a result with therapeutic implications., HIV-1 has the ability to establish a state of latent infection in resting memory CD4+ T cells. These latently infected cells represent a stable reservoir for the virus that is a major barrier to viral eradication. Understanding how this reservoir is established, maintained, and reactivated is essential for developing methods to target and eliminate these cells. Currently, many proposed mechanisms of HIV-1 latency involve a dramatic reduction in ongoing HIV-1 transcription. However, some HIV-1 mRNAs are made, and it has been unclear why the cells are unable to produce virus. This study describes the surprising observation that mRNAs encoding the viral regulatory proteins Tat and Rev are retained in the nucleus of infected resting CD4+ T cells. A cellular HIV-1 RNA-binding protein called polypyrimidine tract binding protein was shown to reverse latency when overexpressed in resting CD4+ T cells. This overexpression of polypyrimidine tract binding protein was sufficient to allow release of replication-competent HIV-1 from latently infected cells without inducing cellular stimulation. These experiments suggest that multiple factors contribute to the maintenance of HIV-1 latency in vivo; however, perturbation of the level of a specific cellular protein is sufficient to overcome these blocks and allow for virus production.}, - number = {7}, - urldate = {2013-11-10}, - journal = {PLoS Pathogens}, - author = {Lassen, Kara G and Ramyar, Kasra X and Bailey, Justin R and Zhou, Yan and Siliciano, Robert F}, - month = jul, - year = {2006}, - pmid = {16839202}, - pmcid = {PMC1487174}, - file = {PubMed Central Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/2FIQQE8X/Lassen et al. - 2006 - Nuclear Retention of Multiply Spliced HIV-1 RNA in.pdf:application/pdf} -} - -@article{hammond_dicing_2005-1, - title = {Dicing and slicing: {The} core machinery of the {RNA} interference pathway}, - volume = {579}, - issn = {0014-5793}, - shorttitle = {Dicing and slicing}, - url = {http://www.sciencedirect.com/science/article/pii/S0014579305010884}, - doi = {10.1016/j.febslet.2005.08.079}, - abstract = {RNA interference (RNAi) is broadly defined as a gene silencing pathway that is triggered by double-stranded RNA (dsRNA). Many variations have been described on this theme. The dsRNA trigger can be supplied exogenously, as an experimental tool, or can derive from the genome in the form of microRNAs. Gene silencing can be the result of nucleolytic degradation of the mRNA, or by translational suppression. At the heart of the pathway are two ribonuclease machines. The ribonuclease III enzyme Dicer initiates the RNAi pathway by generating the active short interfering RNA trigger. Silencing is effected by the RNA-induced silencing complex and its RNaseH core enzyme Argonaute. This review describes the discovery of these machines and discusses future lines of work on this amazing biochemical pathway.}, - number = {26}, - urldate = {2013-10-13}, - journal = {FEBS Letters}, - author = {Hammond, Scott M.}, - month = oct, - year = {2005}, - keywords = {Argonaute, Dicer, Drosha, RNA interference, RNA-induced silencing complex, Slicer, miRNA, microRNA}, - pages = {5822--5829}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/JM4WDE8C/Hammond - 2005 - Dicing and slicing The core machinery of the RNA .pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9CZKPSUJ/S0014579305010884.html:text/html} -} - -@article{nair_probabilistic_2014, - title = {Probabilistic partitioning methods to find significant patterns in {ChIP}-{Seq} data}, - volume = {30}, - issn = {1367-4803, 1460-2059}, - url = {http://bioinformatics.oxfordjournals.org/content/30/17/2406}, - doi = {10.1093/bioinformatics/btu318}, - abstract = {Motivation: We have witnessed an enormous increase in ChIP-Seq data for histone modifications in the past few years. Discovering significant patterns in these data is an important problem for understanding biological mechanisms. -Results: We propose probabilistic partitioning methods to discover significant patterns in ChIP-Seq data. Our methods take into account signal magnitude, shape, strand orientation and shifts. We compare our methods with some current methods and demonstrate significant improvements, especially with sparse data. Besides pattern discovery and classification, probabilistic partitioning can serve other purposes in ChIP-Seq data analysis. Specifically, we exemplify its merits in the context of peak finding and partitioning of nucleosome positioning patterns in human promoters. -Availability and implementation: The software and code are available in the supplementary material. -Contact: Philipp.Bucher@isb-sib.ch -Supplementary information: Supplementary data are available at Bioinformatics online.}, - language = {en}, - number = {17}, - urldate = {2015-04-20}, - journal = {Bioinformatics}, - author = {Nair, Nishanth Ulhas and Kumar, Sunil and Moret, Bernard M. E. and Bucher, Philipp}, - month = sep, - year = {2014}, - pmid = {24812341}, - pages = {2406--2413}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/DWWCTKW2/Nair et al. - 2014 - Probabilistic partitioning methods to find signifi.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7UEHMJ9U/2406.html:text/html} + url = {http://dx.doi.org/10.1371/journal.pcbi.1003326}, + doi = {10.1371/journal.pcbi.1003326}, + abstract = {Mapping the chromosomal locations of transcription factors, nucleosomes, histone modifications, chromatin remodeling enzymes, chaperones, and polymerases is one of the key tasks of modern biology, as evidenced by the Encyclopedia of DNA Elements (ENCODE) Project. To this end, chromatin immunoprecipitation followed by high-throughput sequencing (ChIP-seq) is the standard methodology. Mapping such protein-DNA interactions in vivo using ChIP-seq presents multiple challenges not only in sample preparation and sequencing but also for computational analysis. Here, we present step-by-step guidelines for the computational analysis of ChIP-seq data. We address all the major steps in the analysis of ChIP-seq data: sequencing depth selection, quality checking, mapping, data normalization, assessment of reproducibility, peak calling, differential binding analysis, controlling the false discovery rate, peak annotation, visualization, and motif analysis. At each step in our guidelines we discuss some of the software tools most frequently used. We also highlight the challenges and problems associated with each step in ChIP-seq data analysis. We present a concise workflow for the analysis of ChIP-seq data in Figure 1 that complements and expands on the recommendations of the ENCODE and modENCODE projects. Each step in the workflow is described in detail in the following sections.}, + number = {11}, + urldate = {2014-05-22}, + journal = {PLoS Comput Biol}, + author = {Bailey, Timothy and Krajewski, Pawel and Ladunga, Istvan and Lefebvre, Celine and Li, Qunhua and Liu, Tao and Madrigal, Pedro and Taslim, Cenny and Zhang, Jie}, + month = nov, + year = {2013}, + pages = {e1003326}, + file = {PLoS Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4FGJAV84/Bailey et al. - 2013 - Practical Guidelines for the Comprehensive Analysi.pdf:application/pdf;PLoS Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4SF6WQ4C/infodoi10.1371journal.pcbi.html:text/html} } @article{do_what_2008, title = {What is the expectation maximization algorithm?}, volume = {26}, copyright = {© 2008 Nature Publishing Group}, issn = {1087-0156}, url = {http://www.nature.com/nbt/journal/v26/n8/full/nbt1406.html#close}, doi = {10.1038/nbt1406}, abstract = {The expectation maximization algorithm arises in many computational biology applications that involve probabilistic models. What is it good for, and how does it work?}, language = {en}, number = {8}, urldate = {2015-04-21}, journal = {Nature Biotechnology}, author = {Do, Chuong B. and Batzoglou, Serafim}, month = aug, year = {2008}, pages = {897--899}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/5FGUS8D9/Do et Batzoglou - 2008 - What is the expectation maximization algorithm.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/FBND2UBT/nbt1406.html:text/html} } @article{tran_survey_2014, title = {A survey of motif finding {Web} tools for detecting binding site motifs in {ChIP}-{Seq} data}, volume = {9}, issn = {1745-6150}, url = {http://www.ncbi.nlm.nih.gov/pmc/articles/PMC4022013/}, doi = {10.1186/1745-6150-9-4}, abstract = {Abstract ChIP-Seq (chromatin immunoprecipitation sequencing) has provided the advantage for finding motifs as ChIP-Seq experiments narrow down the motif finding to binding site locations. Recent motif finding tools facilitate the motif detection by providing user-friendly Web interface. In this work, we reviewed nine motif finding Web tools that are capable for detecting binding site motifs in ChIP-Seq data. We showed each motif finding Web tool has its own advantages for detecting motifs that other tools may not discover. We recommended the users to use multiple motif finding Web tools that implement different algorithms for obtaining significant motifs, overlapping resemble motifs, and non-overlapping motifs. Finally, we provided our suggestions for future development of motif finding Web tool that better assists researchers for finding motifs in ChIP-Seq data. Reviewers This article was reviewed by Prof. Sandor Pongor, Dr. Yuriy Gusev, and Dr. Shyam Prabhakar (nominated by Prof. Limsoon Wong).}, urldate = {2015-04-09}, journal = {Biology Direct}, author = {Tran, Ngoc Tam L and Huang, Chun-Hsi}, month = feb, year = {2014}, pmid = {24555784}, pmcid = {PMC4022013}, pages = {4}, file = {PubMed Central Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/IWAQUBVS/Tran et Huang - 2014 - A survey of motif finding Web tools for detecting .pdf:application/pdf} } @article{deng_yin_2010, title = {Yin {Yang} 1}, volume = {1}, issn = {2154-1264}, url = {http://dx.doi.org/10.4161/trns.1.2.12375}, doi = {10.4161/trns.1.2.12375}, abstract = {As a transcription factor, Yin Yang 1 (YY1) regulates the transcription of a dazzling list of genes and the number of its targets still mounts. Recent studies revealed that YY1 possesses functions independent of its DNA binding activity and its regulatory role in tumorigenesis has started to emerge.}, number = {2}, urldate = {2015-04-09}, journal = {Transcription}, author = {Deng, Zhiyong and Cao, Paul and Wan, Mei Mei and Sui, Guangchao}, month = sep, year = {2010}, pages = {81--84}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/NX4NGAC2/Deng et al. - 2010 - Yin Yang 1.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UXX3CF2A/trns.1.2.html:text/html} } @article{wang_sequence_2012, title = {Sequence features and chromatin structure around the genomic regions bound by 119 human transcription factors}, volume = {22}, issn = {1088-9051, 1549-5469}, url = {http://genome.cshlp.org/content/22/9/1798}, doi = {10.1101/gr.139105.112}, abstract = {Chromatin immunoprecipitation coupled with high-throughput sequencing (ChIP-seq) has become the dominant technique for mapping transcription factor (TF) binding regions genome-wide. We performed an integrative analysis centered around 457 ChIP-seq data sets on 119 human TFs generated by the ENCODE Consortium. We identified highly enriched sequence motifs in most data sets, revealing new motifs and validating known ones. The motif sites (TF binding sites) are highly conserved evolutionarily and show distinct footprints upon DNase I digestion. We frequently detected secondary motifs in addition to the canonical motifs of the TFs, indicating tethered binding and cobinding between multiple TFs. We observed significant position and orientation preferences between many cobinding TFs. Genes specifically expressed in a cell line are often associated with a greater occurrence of nearby TF binding in that cell line. We observed cell-line–specific secondary motifs that mediate the binding of the histone deacetylase HDAC2 and the enhancer-binding protein EP300. TF binding sites are located in GC-rich, nucleosome-depleted, and DNase I sensitive regions, flanked by well-positioned nucleosomes, and many of these features show cell type specificity. The GC-richness may be beneficial for regulating TF binding because, when unoccupied by a TF, these regions are occupied by nucleosomes in vivo. We present the results of our analysis in a TF-centric web repository Factorbook (http://factorbook.org) and will continually update this repository as more ENCODE data are generated.}, language = {en}, number = {9}, urldate = {2015-04-21}, journal = {Genome Research}, author = {Wang, Jie and Zhuang, Jiali and Iyer, Sowmya and Lin, XinYing and Whitfield, Troy W. and Greven, Melissa C. and Pierce, Brian G. and Dong, Xianjun and Kundaje, Anshul and Cheng, Yong and Rando, Oliver J. and Birney, Ewan and Myers, Richard M. and Noble, William S. and Snyder, Michael and Weng, Zhiping}, month = sep, year = {2012}, pmid = {22955990}, pages = {1798--1812}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ZG5GCSXZ/Wang et al. - 2012 - Sequence features and chromatin structure around t.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/FDW4W9EP/1798.html:text/html;Wang et al. 2012 - Supplemental_materials.pdf:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/BKCK28GC/Wang et al. 2012 - Supplemental_materials.pdf:application/pdf} } @article{stormo_determining_2010, title = {Determining the specificity of protein–{DNA} interactions}, volume = {11}, copyright = {© 2010 Nature Publishing Group}, issn = {1471-0056}, url = {http://www.nature.com/nrg/journal/v11/n11/full/nrg2845.html}, doi = {10.1038/nrg2845}, abstract = {Proteins, such as many transcription factors, that bind to specific DNA sequences are essential for the proper regulation of gene expression. Identifying the specific sequences that each factor binds can help to elucidate regulatory networks within cells and how genetic variation can cause disruption of normal gene expression, which is often associated with disease. Traditional methods for determining the specificity of DNA-binding proteins are slow and laborious, but several new high-throughput methods can provide comprehensive binding information much more rapidly. Combined with in vivo determinations of transcription factor binding locations, this information provides more detailed views of the regulatory circuitry of cells and the effects of variation on gene expression.}, language = {en}, number = {11}, urldate = {2015-04-09}, journal = {Nature Reviews Genetics}, author = {Stormo, Gary D. and Zhao, Yue}, month = nov, year = {2010}, pages = {751--760}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/WTQGGPQU/Stormo et Zhao - 2010 - Determining the specificity of protein–DNA interac.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/KURBDEHF/nrg2845.html:text/html} } @article{pepke_computation_2009, title = {Computation for {ChIP}-seq and {RNA}-seq studies}, volume = {6}, copyright = {© 2009 Nature Publishing Group}, issn = {1548-7091}, url = {http://www.nature.com/nmeth/journal/v6/n11s/full/nmeth.1371.html}, doi = {10.1038/nmeth.1371}, abstract = {Genome-wide measurements of protein-DNA interactions and transcriptomes are increasingly done by deep DNA sequencing methods (ChIP-seq and RNA-seq). The power and richness of these counting-based measurements comes at the cost of routinely handling tens to hundreds of millions of reads. Whereas early adopters necessarily developed their own custom computer code to analyze the first ChIP-seq and RNA-seq datasets, a new generation of more sophisticated algorithms and software tools are emerging to assist in the analysis phase of these projects. Here we describe the multilayered analyses of ChIP-seq and RNA-seq datasets, discuss the software packages currently available to perform tasks at each layer and describe some upcoming challenges and features for future analysis tools. We also discuss how software choices and uses are affected by specific aspects of the underlying biology and data structure, including genome size, positional clustering of transcription factor binding sites, transcript discovery and expression quantification.}, language = {en}, number = {11s}, urldate = {2015-04-09}, journal = {Nature Methods}, author = {Pepke, Shirley and Wold, Barbara and Mortazavi, Ali}, month = nov, year = {2009}, pages = {S22--S32}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/NUI26MUX/Pepke et al. - 2009 - Computation for ChIP-seq and RNA-seq studies.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/TDGAAFHM/nmeth.1371.html:text/html} } @article{wilbanks_evaluation_2010, title = {Evaluation of {Algorithm} {Performance} in {ChIP}-{Seq} {Peak} {Detection}}, volume = {5}, url = {http://dx.doi.org/10.1371/journal.pone.0011471}, doi = {10.1371/journal.pone.0011471}, abstract = {Next-generation DNA sequencing coupled with chromatin immunoprecipitation (ChIP-seq) is revolutionizing our ability to interrogate whole genome protein-DNA interactions. Identification of protein binding sites from ChIP-seq data has required novel computational tools, distinct from those used for the analysis of ChIP-Chip experiments. The growing popularity of ChIP-seq spurred the development of many different analytical programs (at last count, we noted 31 open source methods), each with some purported advantage. Given that the literature is dense and empirical benchmarking challenging, selecting an appropriate method for ChIP-seq analysis has become a daunting task. Herein we compare the performance of eleven different peak calling programs on common empirical, transcription factor datasets and measure their sensitivity, accuracy and usability. Our analysis provides an unbiased critical assessment of available technologies, and should assist researchers in choosing a suitable tool for handling ChIP-seq data.}, number = {7}, urldate = {2015-04-22}, journal = {PLoS ONE}, author = {Wilbanks, Elizabeth G. and Facciotti, Marc T.}, month = jul, year = {2010}, pages = {e11471}, file = {PLoS Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RWE7B96I/Wilbanks et Facciotti - 2010 - Evaluation of Algorithm Performance in ChIP-Seq Pe.pdf:application/pdf} } -@article{yu_nfatc2_2015, - title = {{NFATc}2 mediates epigenetic modification of dendritic cell cytokine and chemokine responses to dectin-1 stimulation}, - volume = {43}, - issn = {0305-1048, 1362-4962}, - url = {http://nar.oxfordjournals.org/content/43/2/836}, - doi = {10.1093/nar/gku1369}, - abstract = {The transcription factor NFATc2 regulates dendritic cell (DC) responses to microbial stimulation through the C-type lectin receptor dectin-1. But the genetic targets of NFATc2 and their effects on DC function remain largely unknown. Therefore we used ChIP-seq to conduct genome-wide mapping of NFATc2 target sites in dectin-1-activated DCs. By combining binding-site data with a comprehensive gene expression profile, we found that NFATc2 occupancy regulates the expression of a subset of dectin-1-activated genes. Surprisingly, NFATc2 targeted an extensive range of DC-derived cytokines and chemokines, including regulatory cytokines such as IL2, IL23a and IL12b. Furthermore, we demonstrated that NFATc2 binding is required to induce the histone 3 lysine 4 trimethylation (H3K4me3) epigenetic mark, which is associated with enhanced gene expression. Together, these data show that the transcription factor NFATc2 mediates epigenetic modification of DC cytokine and chemokine genes leading to activation of their expression.}, - language = {en}, - number = {2}, - urldate = {2015-06-02}, - journal = {Nucleic Acids Research}, - author = {Yu, Hong-Bing and Yurieva, Marina and Balachander, Akhila and Foo, Ivy and Leong, Xiangrong and Zelante, Teresa and Zolezzi, Francesca and Poidinger, Michael and Ricciardi-Castagnoli, Paola}, - month = jan, - year = {2015}, - pmid = {25550437}, - pages = {836--847}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HDJFWRSR/Yu et al. - 2015 - NFATc2 mediates epigenetic modification of dendrit.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9DXTFQ7Z/836.html:text/html} -} - @article{landt_chip-seq_2012, title = {{ChIP}-seq guidelines and practices of the {ENCODE} and {modENCODE} consortia}, volume = {22}, issn = {1088-9051, 1549-5469}, url = {http://genome.cshlp.org/content/22/9/1813}, doi = {10.1101/gr.136184.111}, abstract = {Chromatin immunoprecipitation (ChIP) followed by high-throughput DNA sequencing (ChIP-seq) has become a valuable and widely used approach for mapping the genomic location of transcription-factor binding and histone modifications in living cells. Despite its widespread use, there are considerable differences in how these experiments are conducted, how the results are scored and evaluated for quality, and how the data and metadata are archived for public use. These practices affect the quality and utility of any global ChIP experiment. Through our experience in performing ChIP-seq experiments, the ENCODE and modENCODE consortia have developed a set of working standards and guidelines for ChIP experiments that are updated routinely. The current guidelines address antibody validation, experimental replication, sequencing depth, data and metadata reporting, and data quality assessment. We discuss how ChIP quality, assessed in these ways, affects different uses of ChIP-seq data. All data sets used in the analysis have been deposited for public viewing and downloading at the ENCODE (http://encodeproject.org/ENCODE/) and modENCODE (http://www.modencode.org/) portals.}, language = {en}, number = {9}, urldate = {2015-04-16}, journal = {Genome Research}, author = {Landt, Stephen G. and Marinov, Georgi K. and Kundaje, Anshul and Kheradpour, Pouya and Pauli, Florencia and Batzoglou, Serafim and Bernstein, Bradley E. and Bickel, Peter and Brown, James B. and Cayting, Philip and Chen, Yiwen and DeSalvo, Gilberto and Epstein, Charles and Fisher-Aylor, Katherine I. and Euskirchen, Ghia and Gerstein, Mark and Gertz, Jason and Hartemink, Alexander J. and Hoffman, Michael M. and Iyer, Vishwanath R. and Jung, Youngsook L. and Karmakar, Subhradip and Kellis, Manolis and Kharchenko, Peter V. and Li, Qunhua and Liu, Tao and Liu, X. Shirley and Ma, Lijia and Milosavljevic, Aleksandar and Myers, Richard M. and Park, Peter J. and Pazin, Michael J. and Perry, Marc D. and Raha, Debasish and Reddy, Timothy E. and Rozowsky, Joel and Shoresh, Noam and Sidow, Arend and Slattery, Matthew and Stamatoyannopoulos, John A. and Tolstorukov, Michael Y. and White, Kevin P. and Xi, Simon and Farnham, Peggy J. and Lieb, Jason D. and Wold, Barbara J. and Snyder, Michael}, month = sep, year = {2012}, pmid = {22955991}, - pages = {1813--1831}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4JW5NMSR/Landt et al. - 2012 - ChIP-seq guidelines and practices of the ENCODE an.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9IPS4QVU/1813.html:text/html} -} - -@article{li_measuring_2011, - title = {Measuring reproducibility of high-throughput experiments}, - volume = {5}, - issn = {1932-6157, 1941-7330}, - url = {http://projecteuclid.org/euclid.aoas/1318514284}, - doi = {10.1214/11-AOAS466}, - abstract = {Reproducibility is essential to reliable scientific discovery in high-throughput experiments. In this work we propose a unified approach to measure the reproducibility of findings identified from replicate experiments and identify putative discoveries using reproducibility. Unlike the usual scalar measures of reproducibility, our approach creates a curve, which quantitatively assesses when the findings are no longer consistent across replicates. Our curve is fitted by a copula mixture model, from which we derive a quantitative reproducibility score, which we call the “irreproducible discovery rate” (IDR) analogous to the FDR. This score can be computed at each set of paired replicate ranks and permits the principled setting of thresholds both for assessing reproducibility and combining replicates. Since our approach permits an arbitrary scale for each replicate, it provides useful descriptive measures in a wide variety of situations to be explored. We study the performance of the algorithm using simulations and give a heuristic analysis of its theoretical properties. We demonstrate the effectiveness of our method in a ChIP-seq experiment.}, - language = {EN}, - number = {3}, - urldate = {2015-04-16}, - journal = {The Annals of Applied Statistics}, - author = {Li, Qunhua and Brown, James B. and Huang, Haiyan and Bickel, Peter J.}, - month = sep, - year = {2011}, - mrnumber = {MR2884921}, - zmnumber = {1231.62124}, - keywords = {genomics, Reproducibility, association, mixture model, copula, iterative algorithm, irreproducible discovery rate, high-throughput experiment}, - pages = {1752--1779}, - file = {Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/X7878PMG/1318514284.html:text/html} -} - -@article{oh_interaction_2012, - title = {Interaction between {BZR}1 and {PIF}4 integrates brassinosteroid and environmental responses}, - volume = {14}, - copyright = {© 2012 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, - issn = {1465-7392}, - url = {http://www.nature.com/ncb/journal/v14/n8/full/ncb2545.html}, - doi = {10.1038/ncb2545}, - abstract = {Plant growth is coordinately regulated by environmental and hormonal signals. Brassinosteroid (BR) plays essential roles in growth regulation by light and temperature, but the interactions between BR and these environmental signals remain poorly understood at the molecular level. Here, we show that direct interaction between the dark- and heat-activated transcription factor phytochrome-interacting factor 4 (PIF4) and the BR-activated transcription factor BZR1 integrates the hormonal and environmental signals. BZR1 and PIF4 interact with each other in vitro and in vivo, bind to nearly 2,000 common target genes, and synergistically regulate many of these target genes, including the PRE family helix–loop–helix factors required for promoting cell elongation. Genetic analysis indicates that BZR1 and PIFs are interdependent in promoting cell elongation in response to BR, darkness or heat. These results show that the BZR1–PIF4 interaction controls a core transcription network, enabling plant growth co-regulation by the steroid and environmental signals.}, - language = {en}, - number = {8}, - urldate = {2015-06-02}, - journal = {Nature Cell Biology}, - author = {Oh, Eunkyoo and Zhu, Jia-Ying and Wang, Zhi-Yong}, - month = aug, - year = {2012}, - pages = {802--809}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/59U4SJRE/Oh et al. - 2012 - Interaction between BZR1 and PIF4 integrates brass.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XDHBFPAC/ncb2545.html:text/html} -} - -@article{darmostuk_current_nodate, - title = {Current approaches in {SELEX}: {An} update to aptamer selection technology}, - issn = {0734-9750}, - shorttitle = {Current approaches in {SELEX}}, - url = {http://www.sciencedirect.com/science/article/pii/S0734975015000336}, - doi = {10.1016/j.biotechadv.2015.02.008}, - abstract = {Systematic evolution of ligands by exponential enrichment (SELEX) is a well-established and efficient technology for the generation of oligonucleotides with a high target affinity. These SELEX-derived single stranded DNA and RNA molecules, called aptamers, were selected against various targets, such as proteins, cells, microorganisms, chemical compounds etc. They have a great potential in the use as novel antibodies, in cancer theragnostics and in biomedical research. Vast interest in aptamers stimulated continuous development of SELEX, which underwent numerous modifications since its first application in 1990. Novel modifications made the selection process more efficient, cost-effective and significantly less time-consuming. This article brings a comprehensive and up-to-date review of recent advances in SELEX methods and pinpoints advantages, main obstacles and limitations. The post-SELEX strategies and examples of application are also briefly outlined in this review.}, - urldate = {2015-06-25}, - journal = {Biotechnology Advances}, - author = {Darmostuk, Mariia and Rimpelová, Silvie and Gbelcová, Helena and Ruml, Tomáš}, - keywords = {Aptamers, In silico selection, Oligonucleotide library, PCR, Post-SELEX, SELEX}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/57DBC7BD/Darmostuk et al. - Current approaches in SELEX An update to aptamer .pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/R6QTCAEJ/S0734975015000336.html:text/html} + pages = {1813--1831}, + file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4JW5NMSR/Landt et al. - 2012 - ChIP-seq guidelines and practices of the ENCODE an.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9IPS4QVU/1813.html:text/html} } @article{zimmermann_genomic_2010, series = {{RNA}: {From} {Sequence} to {Structure} and {Dynamics}}, title = {Genomic {SELEX}: {A} discovery tool for genomic aptamers}, volume = {52}, issn = {1046-2023}, shorttitle = {Genomic {SELEX}}, url = {http://www.sciencedirect.com/science/article/pii/S1046202310001581}, doi = {10.1016/j.ymeth.2010.06.004}, abstract = {Genomic SELEX is a discovery tool for genomic aptamers, which are genomically encoded functional domains in nucleic acid molecules that recognize and bind specific ligands. When combined with genomic libraries and using RNA-binding proteins as baits, Genomic SELEX used with high-throughput sequencing enables the discovery of genomic RNA aptamers and the identification of RNA–protein interaction networks. Here we describe how to construct and analyze genomic libraries, how to choose baits for selections, how to perform the selection procedure and finally how to analyze the enriched sequences derived from deep sequencing. As a control procedure, we recommend performing a “Neutral” SELEX experiment in parallel to the selection, omitting the selection step. This control experiment provides a background signal for comparison with the positively selected pool. We also recommend deep sequencing the initial library in order to facilitate the final in silico analysis of enrichment with respect to the initial levels. Counter selection procedures, using modified or inactive baits, allow strengthening the binding specificity of the winning selected sequences.}, number = {2}, urldate = {2015-06-25}, journal = {Methods}, author = {Zimmermann, Bob and Bilusic, Ivana and Lorenz, Christina and Schroeder, Renée}, month = oct, year = {2010}, pages = {125--132}, file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Z8JU4VG9/Zimmermann et al. - 2010 - Genomic SELEX A discovery tool for genomic aptame.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/WD9VZP7G/S1046202310001581.html:text/html} } @article{schwalie_co-binding_2013, title = {Co-binding by {YY}1 identifies the transcriptionally active, highly conserved set of {CTCF}-bound regions in primate genomes}, volume = {14}, copyright = {2013 Schwalie et al.; licensee BioMed Central Ltd.}, issn = {1465-6906}, url = {http://genomebiology.com/2013/14/12/R148/abstract}, doi = {10.1186/gb-2013-14-12-r148}, abstract = {PMID: 24380390}, language = {en}, number = {12}, urldate = {2015-06-26}, journal = {Genome Biology}, author = {Schwalie, Petra C. and Ward, Michelle C. and Cain, Carolyn E. and Faure, Andre J. and Gilad, Yoav and Odom, Duncan T. and Flicek, Paul}, month = dec, year = {2013}, pmid = {24380390}, pages = {R148}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/F284DM3W/Schwalie et al. - 2013 - Co-binding by YY1 identifies the transcriptionally.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/G3RIKXKT/R148.html:text/html} } -@article{stormo_determining_2010-1, - title = {Determining the specificity of protein–{DNA} interactions}, - volume = {11}, - copyright = {© 2010 Nature Publishing Group}, - issn = {1471-0056}, - url = {http://www.nature.com/nrg/journal/v11/n11/full/nrg2845.html}, - doi = {10.1038/nrg2845}, - abstract = {Proteins, such as many transcription factors, that bind to specific DNA sequences are essential for the proper regulation of gene expression. Identifying the specific sequences that each factor binds can help to elucidate regulatory networks within cells and how genetic variation can cause disruption of normal gene expression, which is often associated with disease. Traditional methods for determining the specificity of DNA-binding proteins are slow and laborious, but several new high-throughput methods can provide comprehensive binding information much more rapidly. Combined with in vivo determinations of transcription factor binding locations, this information provides more detailed views of the regulatory circuitry of cells and the effects of variation on gene expression.}, - language = {en}, - number = {11}, - urldate = {2015-04-09}, - journal = {Nature Reviews Genetics}, - author = {Stormo, Gary D. and Zhao, Yue}, - month = nov, - year = {2010}, - pages = {751--760} -} - @article{giraud_parallel_2011, series = {Follow-on of {ISPDC}'2009 and {HeteroPar}'2009}, title = {Parallel {Position} {Weight} {Matrices} algorithms}, volume = {37}, issn = {0167-8191}, url = {http://www.sciencedirect.com/science/article/pii/S0167819110001389}, doi = {10.1016/j.parco.2010.10.001}, abstract = {Position Weight Matrices (PWMs) are broadly used in computational biology. The basic problems, Scan and MultipleScan, aim to find all the occurrences of a given PWM or a set of PWMs in long sequences. Some other PWM tasks share a common NP-hard subproblem, ScoreDistribution. The existing algorithms rely on the enumeration on a large set of scores or words, and they are mostly not suitable for parallelization. We propose a new algorithm, BucketScoreDistribution, that is both very efficient and suitable for parallelization. We bound the error induced by this algorithm. We realized a GPU prototype for Scan, MultipleScan and BucketScoreDistribution with the CUDA libraries, and report for the different problems speedups larger than 10× on several Nvidia cards.}, number = {8}, urldate = {2015-07-09}, journal = {Parallel Computing}, author = {Giraud, Mathieu and Varré, Jean-Stéphane}, month = aug, year = {2011}, keywords = {Position Weight Matrices, P-value estimation, Pattern matching, Score distribution, Many-core architectures, GPU, bioinformatics}, pages = {466--478}, file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7RG5J9PV/Giraud et Varré - 2011 - Parallel Position Weight Matrices algorithms.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HHPD6IGI/S0167819110001389.html:text/html} } @article{wu_fast_2000, title = {Fast probabilistic analysis of sequence function using scoring matrices}, volume = {16}, issn = {1367-4803, 1460-2059}, url = {http://bioinformatics.oxfordjournals.org/content/16/3/233}, doi = {10.1093/bioinformatics/16.3.233}, abstract = {Motivation: We present techniques for increasing the speed of sequence analysis using scoring matrices. Our techniques are based on calculating, for a given scoring matrix, the quantile function, which assigns a probability, or p, value to each segmental score. Our techniques also permit the user to specify a p threshold to indicate the desired trade-off between sensitivity and speed for a particular sequence analysis. The resulting increase in speed should allow scoring matrices to be used more widely in large-scale sequencing and annotation projects. Results: We develop three techniques for increasing the speed of sequence analysis: probability filtering, lookahead scoring, and permuted lookahead scoring. In probability filtering, we compute the score threshold that corresponds to the user-specified p threshold. We use the score threshold to limit the number of segments that are retained in the search process. In lookahead scoring, we test intermediate scores to determine whether they will possibly exceed the score threshold. In permuted lookahead scoring, we score each segment in a particular order designed to maximize the likelihood of early termination. Our two lookahead scoring techniques reduce substantially the number of residues that must be examined. The fraction of residues examined ranges from 62 to 6\%, depending on the p threshold chosen by the user. These techniques permit sequence analysis with scoring matrices at speeds that are several times faster than existing programs. On a database of 12 177 alignment blocks, our techniques permit sequence analysis at a speed of 225 residues/s for a p threshold of 10−6, and 541 residues/s for a p threshold of 10−20. In order to compute the quantile function, we may use either an independence assumption or a Markov assumption. We measure the effect of first- and second-order Markov assumptions and find that they tend to raise the p value of segments, when compared with the independence assumption, by average ratios of 1.30 and 1.69, respectively. We also compare our technique with the empirical 99.5th percentile scores compiled in the BLOCKSPLUS database, and find that they correspond on average to a p value of 1.5 × 10−5. Availability: The techniques described above are implemented in a software package called EMATRIX. This package is available from the authors for free academic use or for licensed commercial use. The EMATRIX set of programs is also available on the Internet at http://motif.stanford.edu/ematrix.}, language = {en}, number = {3}, urldate = {2015-07-24}, journal = {Bioinformatics}, author = {Wu, Thomas D. and Nevill-Manning, Craig G. and Brutlag, Douglas L.}, month = mar, year = {2000}, pmid = {10869016}, pages = {233--244}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/TBQ8WNZW/Wu et al. - 2000 - Fast probabilistic analysis of sequence function u.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GHRVXN4S/233.html:text/html} } @article{ioshikhes_nucleosome_2006, title = {Nucleosome positions predicted through comparative genomics}, volume = {38}, copyright = {© 2006 Nature Publishing Group}, issn = {1061-4036}, url = {http://www.nature.com/ng/journal/v38/n10/full/ng1878.html}, doi = {10.1038/ng1878}, abstract = {DNA sequence has long been recognized as an important contributor to nucleosome positioning, which has the potential to regulate access to genes. The extent to which the nucleosomal architecture at promoters is delineated by the underlying sequence is now being worked out. Here we use comparative genomics to report a genome-wide map of nucleosome positioning sequences (NPSs) located in the vicinity of all Saccharomyces cerevisiae genes. We find that the underlying DNA sequence provides a very good predictor of nucleosome locations that have been experimentally mapped to a small fraction of the genome. Notably, distinct classes of genes possess characteristic arrangements of NPSs that may be important for their regulation. In particular, genes that have a relatively compact NPS arrangement over the promoter region tend to have a TATA box buried in an NPS and tend to be highly regulated by chromatin modifying and remodeling factors.}, language = {en}, number = {10}, urldate = {2015-07-24}, journal = {Nature Genetics}, author = {Ioshikhes, Ilya P. and Albert, Istvan and Zanton, Sara J. and Pugh, B. Franklin}, month = oct, year = {2006}, pages = {1210--1215}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/MRIMS7MH/Ioshikhes et al. - 2006 - Nucleosome positions predicted through comparative.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/KCSRRJC8/ng1878.html:text/html} } @article{thurman_accessible_2012, title = {The accessible chromatin landscape of the human genome}, volume = {489}, copyright = {© 2012 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {0028-0836}, url = {http://www.nature.com/nature/journal/v489/n7414/full/nature11232.html}, doi = {10.1038/nature11232}, abstract = {DNase I hypersensitive sites (DHSs) are markers of regulatory DNA and have underpinned the discovery of all classes of cis-regulatory elements including enhancers, promoters, insulators, silencers and locus control regions. Here we present the first extensive map of human DHSs identified through genome-wide profiling in 125 diverse cell and tissue types. We identify {\textasciitilde}2.9 million DHSs that encompass virtually all known experimentally validated cis-regulatory sequences and expose a vast trove of novel elements, most with highly cell-selective regulation. Annotating these elements using ENCODE data reveals novel relationships between chromatin accessibility, transcription, DNA methylation and regulatory factor occupancy patterns. We connect {\textasciitilde}580,000 distal DHSs with their target promoters, revealing systematic pairing of different classes of distal DHSs and specific promoter types. Patterning of chromatin accessibility at many regulatory regions is organized with dozens to hundreds of co-activated elements, and the transcellular DNase I sensitivity pattern at a given region can predict cell-type-specific functional behaviours. The DHS landscape shows signatures of recent functional evolutionary constraint. However, the DHS compartment in pluripotent and immortalized cells exhibits higher mutation rates than that in highly differentiated cells, exposing an unexpected link between chromatin accessibility, proliferative potential and patterns of human variation.}, language = {en}, number = {7414}, urldate = {2015-09-11}, journal = {Nature}, author = {Thurman, Robert E. and Rynes, Eric and Humbert, Richard and Vierstra, Jeff and Maurano, Matthew T. and Haugen, Eric and Sheffield, Nathan C. and Stergachis, Andrew B. and Wang, Hao and Vernot, Benjamin and Garg, Kavita and John, Sam and Sandstrom, Richard and Bates, Daniel and Boatman, Lisa and Canfield, Theresa K. and Diegel, Morgan and Dunn, Douglas and Ebersol, Abigail K. and Frum, Tristan and Giste, Erika and Johnson, Audra K. and Johnson, Ericka M. and Kutyavin, Tanya and Lajoie, Bryan and Lee, Bum-Kyu and Lee, Kristen and London, Darin and Lotakis, Dimitra and Neph, Shane and Neri, Fidencio and Nguyen, Eric D. and Qu, Hongzhu and Reynolds, Alex P. and Roach, Vaughn and Safi, Alexias and Sanchez, Minerva E. and Sanyal, Amartya and Shafer, Anthony and Simon, Jeremy M. and Song, Lingyun and Vong, Shinny and Weaver, Molly and Yan, Yongqi and Zhang, Zhancheng and Zhang, Zhuzhu and Lenhard, Boris and Tewari, Muneesh and Dorschner, Michael O. and Hansen, R. Scott and Navas, Patrick A. and Stamatoyannopoulos, George and Iyer, Vishwanath R. and Lieb, Jason D. and Sunyaev, Shamil R. and Akey, Joshua M. and Sabo, Peter J. and Kaul, Rajinder and Furey, Terrence S. and Dekker, Job and Crawford, Gregory E. and Stamatoyannopoulos, John A.}, month = sep, year = {2012}, keywords = {evolution, genetics, genomics, molecular biology}, pages = {75--82}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/FXGKAKFH/Thurman et al. - 2012 - The accessible chromatin landscape of the human ge.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/NIVF6S5G/nature11232.html:text/html} } -@article{pepke_computation_2009-1, - title = {Computation for {ChIP}-seq and {RNA}-seq studies}, - volume = {6}, - copyright = {© 2009 Nature Publishing Group}, - issn = {1548-7091}, - url = {http://www.nature.com/nmeth/journal/v6/n11s/full/nmeth.1371.html}, - doi = {10.1038/nmeth.1371}, - abstract = {Genome-wide measurements of protein-DNA interactions and transcriptomes are increasingly done by deep DNA sequencing methods (ChIP-seq and RNA-seq). The power and richness of these counting-based measurements comes at the cost of routinely handling tens to hundreds of millions of reads. Whereas early adopters necessarily developed their own custom computer code to analyze the first ChIP-seq and RNA-seq datasets, a new generation of more sophisticated algorithms and software tools are emerging to assist in the analysis phase of these projects. Here we describe the multilayered analyses of ChIP-seq and RNA-seq datasets, discuss the software packages currently available to perform tasks at each layer and describe some upcoming challenges and features for future analysis tools. We also discuss how software choices and uses are affected by specific aspects of the underlying biology and data structure, including genome size, positional clustering of transcription factor binding sites, transcript discovery and expression quantification.}, - language = {en}, - number = {11s}, - urldate = {2015-09-16}, - journal = {Nature Methods}, - author = {Pepke, Shirley and Wold, Barbara and Mortazavi, Ali}, - month = nov, - year = {2009}, - pages = {S22--S32}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/H49XEIW2/Pepke et al. - 2009 - Computation for ChIP-seq and RNA-seq studies.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/TEWKNJU4/nmeth.1371.html:text/html} -} - -@article{nair_probabilistic_2014-1, +@article{nair_probabilistic_2014, title = {Probabilistic partitioning methods to find significant patterns in {ChIP}-{Seq} data}, volume = {30}, issn = {1367-4803, 1460-2059}, url = {http://bioinformatics.oxfordjournals.org/content/30/17/2406}, doi = {10.1093/bioinformatics/btu318}, abstract = {Motivation: We have witnessed an enormous increase in ChIP-Seq data for histone modifications in the past few years. Discovering significant patterns in these data is an important problem for understanding biological mechanisms. Results: We propose probabilistic partitioning methods to discover significant patterns in ChIP-Seq data. Our methods take into account signal magnitude, shape, strand orientation and shifts. We compare our methods with some current methods and demonstrate significant improvements, especially with sparse data. Besides pattern discovery and classification, probabilistic partitioning can serve other purposes in ChIP-Seq data analysis. Specifically, we exemplify its merits in the context of peak finding and partitioning of nucleosome positioning patterns in human promoters. Availability and implementation: The software and code are available in the supplementary material. Contact: Philipp.Bucher@isb-sib.ch Supplementary information: Supplementary data are available at Bioinformatics online.}, language = {en}, number = {17}, urldate = {2015-07-30}, journal = {Bioinformatics}, author = {Nair, Nishanth Ulhas and Kumar, Sunil and Moret, Bernard M. E. and Bucher, Philipp}, month = sep, year = {2014}, pmid = {24812341}, pages = {2406--2413}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/FEN4FCC6/Nair et al. - 2014 - Probabilistic partitioning methods to find signifi.pdf:application/pdf;nair2014_suppl.pdf:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/FEN4FCC6/nair2014_suppl.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/8KVRCEVG/2406.html:text/html} } @article{clifford_comparison_2011, title = {Comparison of {Clustering} {Methods} for {Investigation} of {Genome}-{Wide} {Methylation} {Array} {Data}}, volume = {2}, issn = {1664-8021}, url = {http://www.ncbi.nlm.nih.gov/pmc/articles/PMC3268382/}, doi = {10.3389/fgene.2011.00088}, abstract = {The use of genome-wide methylation arrays has proved very informative to investigate both clinical and biological questions in human epigenomics. The use of clustering methods either for exploration of these data or to compare to an a priori grouping, e.g., normal versus disease allows assessment of groupings of data without user bias. However no consensus on the methods to use for clustering of methylation array approaches has been reached. To determine the most appropriate clustering method for analysis of illumina array methylation data, a collection of data sets was simulated and used to compare clustering methods. Both hierarchical clustering and non-hierarchical clustering methods (k-means, k-medoids, and fuzzy clustering algorithms) were compared using a range of distance and linkage methods. As no single method consistently outperformed others across different simulations, we propose a method to capture the best clustering outcome based on an additional measure, the silhouette width. This approach produced a consistently higher cluster accuracy compared to using any one method in isolation.}, urldate = {2015-07-31}, journal = {Frontiers in Genetics}, author = {Clifford, Harry and Wessely, Frank and Pendurthi, Satish and Emes, Richard D.}, month = dec, year = {2011}, pmid = {22303382}, pmcid = {PMC3268382}, file = {PubMed Central Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/AECCZPQ2/Clifford et al. - 2011 - Comparison of Clustering Methods for Investigation.pdf:application/pdf} } -@article{waszak_population_nodate, - title = {Population {Variation} and {Genetic} {Control} of {Modular} {Chromatin} {Architecture} in {Humans}}, - volume = {0}, - issn = {0092-8674}, - url = {http://www.cell.com/article/S0092867415009770/abstract}, - doi = {10.1016/j.cell.2015.08.001}, - abstract = {Chromatin state variation at gene regulatory elements is abundant across individuals, yet we understand little about the genetic basis of this variability. Here, we profiled several histone modifications, the transcription factor (TF) PU.1, RNA polymerase II, and gene expression in lymphoblastoid cell lines from 47 whole-genome sequenced individuals. We observed that distinct cis-regulatory elements exhibit coordinated chromatin variation across individuals in the form of variable chromatin modules (VCMs) at sub-Mb scale. VCMs were associated with thousands of genes and preferentially cluster within chromosomal contact domains. We mapped strong proximal and weak, yet more ubiquitous, distal-acting chromatin quantitative trait loci (cQTL) that frequently explain this variation. cQTLs were associated with molecular activity at clusters of cis-regulatory elements and mapped preferentially within TF-bound regions. We propose that local, sequence-independent chromatin variation emerges as a result of genetic perturbations in cooperative interactions between cis-regulatory elements that are located within the same genomic domain.}, - language = {English}, - number = {0}, - urldate = {2015-08-25}, - journal = {Cell}, - author = {Waszak, Sebastian M. and Delaneau, Olivier and Gschwind, Andreas R. and Kilpinen, Helena and Raghav, Sunil K. and Witwicki, Robert M. and Orioli, Andrea and Wiederkehr, Michael and Panousis, Nikolaos I. and Yurovsky, Alisa and Romano-Palumbo, Luciana and Planchon, Alexandra and Bielser, Deborah and Padioleau, Ismael and Udin, Gilles and Thurnheer, Sarah and Hacker, David and Hernandez, Nouria and Reymond, Alexandre and Deplancke, Bart and Dermitzakis, Emmanouil T.}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/2EDU5P7E/Waszak et al. - Population Variation and Genetic Control of Modula.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/B7HR4XMR/S0092-8674(15)00977-0.html:text/html} -} - @article{melton_recurrent_2015, title = {Recurrent somatic mutations in regulatory regions of human cancer genomes}, volume = {47}, copyright = {© 2015 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {1061-4036}, url = {http://www.nature.com/ng/journal/v47/n7/full/ng.3332.html}, doi = {10.1038/ng.3332}, abstract = {Aberrant regulation of gene expression in cancer can promote survival and proliferation of cancer cells. Here we integrate whole-genome sequencing data from The Cancer Genome Atlas (TCGA) for 436 patients from 8 cancer subtypes with ENCODE and other regulatory annotations to identify point mutations in regulatory regions. We find evidence for positive selection of mutations in transcription factor binding sites, consistent with these sites regulating important cancer cell functions. Using a new method that adjusts for sample- and genomic locus–specific mutation rates, we identify recurrently mutated sites across individuals with cancer. Mutated regulatory sites include known sites in the TERT promoter and many new sites, including a subset in proximity to cancer-related genes. In reporter assays, two new sites display decreased enhancer activity upon mutation. These data demonstrate that many regulatory regions contain mutations under selective pressure and suggest a greater role for regulatory mutations in cancer than previously appreciated.}, language = {en}, number = {7}, urldate = {2015-08-25}, journal = {Nature Genetics}, author = {Melton, Collin and Reuter, Jason A. and Spacek, Damek V. and Snyder, Michael}, month = jul, year = {2015}, pages = {710--716}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6Z4KJ5SK/Melton et al. - 2015 - Recurrent somatic mutations in regulatory regions .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/3SIKTKPH/ng.3332.html:text/html} } @article{kundaje_ubiquitous_2012, title = {Ubiquitous heterogeneity and asymmetry of the chromatin environment at regulatory elements}, volume = {22}, issn = {1088-9051, 1549-5469}, url = {http://genome.cshlp.org/content/22/9/1735}, doi = {10.1101/gr.136366.111}, abstract = {Gene regulation at functional elements (e.g., enhancers, promoters, insulators) is governed by an interplay of nucleosome remodeling, histone modifications, and transcription factor binding. To enhance our understanding of gene regulation, the ENCODE Consortium has generated a wealth of ChIP-seq data on DNA-binding proteins and histone modifications. We additionally generated nucleosome positioning data on two cell lines, K562 and GM12878, by MNase digestion and high-depth sequencing. Here we relate 14 chromatin signals (12 histone marks, DNase, and nucleosome positioning) to the binding sites of 119 DNA-binding proteins across a large number of cell lines. We developed a new method for unsupervised pattern discovery, the Clustered AGgregation Tool (CAGT), which accounts for the inherent heterogeneity in signal magnitude, shape, and implicit strand orientation of chromatin marks. We applied CAGT on a total of 5084 data set pairs to obtain an exhaustive catalog of high-resolution patterns of histone modifications and nucleosome positioning signals around bound transcription factors. Our analyses reveal extensive heterogeneity in how histone modifications are deposited, and how nucleosomes are positioned around binding sites. With the exception of the CTCF/cohesin complex, asymmetry of nucleosome positioning is predominant. Asymmetry of histone modifications is also widespread, for all types of chromatin marks examined, including promoter, enhancer, elongation, and repressive marks. The fine-resolution signal shapes discovered by CAGT unveiled novel correlation patterns between chromatin marks, nucleosome positioning, and sequence content. Meta-analyses of the signal profiles revealed a common vocabulary of chromatin signals shared across multiple cell lines and binding proteins.}, language = {en}, number = {9}, urldate = {2015-09-07}, journal = {Genome Research}, author = {Kundaje, Anshul and Kyriazopoulou-Panagiotopoulou, Sofia and Libbrecht, Max and Smith, Cheryl L. and Raha, Debasish and Winters, Elliott E. and Johnson, Steven M. and Snyder, Michael and Batzoglou, Serafim and Sidow, Arend}, month = sep, year = {2012}, pmid = {22955985}, pages = {1735--1747}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6JNAUUTN/Kundaje et al. - 2012 - Ubiquitous heterogeneity and asymmetry of the chro.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RRNDKW8M/1735.html:text/html} } -@article{gaffney_controls_2012-1, +@article{gaffney_controls_2012, title = {Controls of {Nucleosome} {Positioning} in the {Human} {Genome}}, volume = {8}, url = {http://dx.doi.org/10.1371/journal.pgen.1003036}, doi = {10.1371/journal.pgen.1003036}, abstract = {Author SummaryWithin the nucleus of the cell, the genome of eukaryotic organisms is tightly packaged into chromatin. Chromatin is composed of a repeating series of bead-like nucleosomes, each of which is encircled 1.7 times by a string of DNA. The organization of nucleosomes on the genome is fundamentally important because they can prevent other proteins from accessing the DNA. Previous studies of human nucleosomes concluded that most nucleosomes have fuzzy positioning and tend to occupy different locations in different cells. This interpretation, however, may be a consequence of the low resolution of existing data. Here we revisit the question of nucleosome positioning by generating the most precise map of nucleosome positions that has ever been created for a human cell line. We find that 8.7\% of nucleosomes have very consistent positioning, and most nucleosomes are more consistently positioned than expected by chance. Additionally, we estimate that almost half of the genome contains regularly spaced arrays of nucleosomes. Much of this positioning is due to the intrinsic preference of nucleosomes for some DNA sequences over others; but in some regions of the genome, the sequence preferences of nucleosomes are overridden by proteins that out-compete them for binding or displace them using energy from ATP.}, number = {11}, urldate = {2015-09-07}, journal = {PLoS Genet}, author = {Gaffney, Daniel J. and McVicker, Graham and Pai, Athma A. and Fondufe-Mittendorf, Yvonne N. and Lewellen, Noah and Michelini, Katelyn and Widom, Jonathan and Gilad, Yoav and Pritchard, Jonathan K.}, month = nov, year = {2012}, pages = {e1003036}, file = {PLoS Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/TICE4R38/Gaffney et al. - 2012 - Controls of Nucleosome Positioning in the Human Ge.pdf:application/pdf} } @article{consortium_integrated_2012, title = {An integrated encyclopedia of {DNA} elements in the human genome}, volume = {489}, copyright = {© 2012 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {0028-0836}, url = {http://www.nature.com/nature/journal/v489/n7414/full/nature11247.html}, doi = {10.1038/nature11247}, abstract = {The human genome encodes the blueprint of life, but the function of the vast majority of its nearly three billion bases is unknown. The Encyclopedia of DNA Elements (ENCODE) project has systematically mapped regions of transcription, transcription factor association, chromatin structure and histone modification. These data enabled us to assign biochemical functions for 80\% of the genome, in particular outside of the well-studied protein-coding regions. Many discovered candidate regulatory elements are physically associated with one another and with expressed genes, providing new insights into the mechanisms of gene regulation. The newly identified elements also show a statistical correspondence to sequence variants linked to human disease, and can thereby guide interpretation of this variation. Overall, the project provides new insights into the organization and regulation of our genes and genome, and is an expansive resource of functional annotations for biomedical research.}, language = {en}, number = {7414}, urldate = {2015-09-28}, journal = {Nature}, author = {Consortium, The ENCODE Project}, month = sep, year = {2012}, keywords = {genetics, genomics, molecular biology}, pages = {57--74}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XTHEAZAC/Consortium - 2012 - An integrated encyclopedia of DNA elements in the .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/BQ8BWPQ4/nature11247.html:text/html;supplemental.pdf:/home/romaingroux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XTHEAZAC/supplemental.pdf:application/pdf} } @article{zhou_charting_2011, title = {Charting histone modifications and the functional organization of mammalian genomes}, volume = {12}, copyright = {© 2010 Nature Publishing Group}, issn = {1471-0056}, url = {http://www.nature.com/nrg/journal/v12/n1/full/nrg2905.html}, doi = {10.1038/nrg2905}, abstract = {A succession of technological advances over the past decade have enabled researchers to chart maps of histone modifications and related chromatin structures with increasing accuracy, comprehensiveness and throughput. The resulting data sets highlight the interplay between chromatin and genome function, dynamic variations in chromatin structure across cellular conditions, and emerging roles for large-scale domains and higher-ordered chromatin organization. Here we review a selection of recent studies that have probed histone modifications and successive layers of chromatin structure in mammalian genomes, the patterns that have been identified and future directions for research.}, language = {en}, number = {1}, urldate = {2015-11-04}, journal = {Nature Reviews Genetics}, author = {Zhou, Vicky W. and Goren, Alon and Bernstein, Bradley E.}, month = jan, year = {2011}, pages = {7--18}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XTXCIXEJ/Zhou et al. - 2011 - Charting histone modifications and the functional .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/G9JNJPI3/nrg2905.html:text/html} } @article{langst_chromatin_2015, title = {Chromatin {Remodelers}: {From} {Function} to {Dysfunction}}, volume = {6}, copyright = {http://creativecommons.org/licenses/by/3.0/}, shorttitle = {Chromatin {Remodelers}}, url = {http://www.mdpi.com/2073-4425/6/2/299}, doi = {10.3390/genes6020299}, abstract = {Chromatin remodelers are key players in the regulation of chromatin accessibility and nucleosome positioning on the eukaryotic DNA, thereby essential for all DNA dependent biological processes. Thus, it is not surprising that upon of deregulation of those molecular machines healthy cells can turn into cancerous cells. Even though the remodeling enzymes are very abundant and a multitude of different enzymes and chromatin remodeling complexes exist in the cell, the particular remodeling complex with its specific nucleosome positioning features must be at the right place at the right time in order to ensure the proper regulation of the DNA dependent processes. To achieve this, chromatin remodeling complexes harbor protein domains that specifically read chromatin targeting signals, such as histone modifications, DNA sequence/structure, non-coding RNAs, histone variants or DNA bound interacting proteins. Recent studies reveal the interaction between non-coding RNAs and chromatin remodeling complexes showing importance of RNA in remodeling enzyme targeting, scaffolding and regulation. In this review, we summarize current understanding of chromatin remodeling enzyme targeting to chromatin and their role in cancer development.}, language = {en}, number = {2}, urldate = {2015-09-28}, journal = {Genes}, author = {Längst, Gernot and Manelyte, Laura}, month = jun, year = {2015}, keywords = {chromatin remodeler, search mechanism, arrest model, non-coding RNA, cancer}, pages = {299--324}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/P7N7NXIN/Längst et Manelyte - 2015 - Chromatin Remodelers From Function to Dysfunction.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/KR92U7ET/htm.html:text/html} } @article{bailey_znf143_2015, title = {{ZNF}143 provides sequence specificity to secure chromatin interactions at gene promoters}, volume = {2}, copyright = {© 2015 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, url = {http://www.nature.com/ncomms/2015/150203/ncomms7186/full/ncomms7186.html}, doi = {10.1038/ncomms7186}, abstract = {Chromatin interactions connect distal regulatory elements to target gene promoters guiding stimulus- and lineage-specific transcription. Few factors securing chromatin interactions have so far been identified. Here, by integrating chromatin interaction maps with the large collection of transcription factor-binding profiles provided by the ENCODE project, we demonstrate that the zinc-finger protein ​ZNF143 preferentially occupies anchors of chromatin interactions connecting promoters with distal regulatory elements. It binds directly to promoters and associates with lineage-specific chromatin interactions and gene expression. Silencing ​ZNF143 or modulating its DNA-binding affinity using single-nucleotide polymorphisms (SNPs) as a surrogate of site-directed mutagenesis reveals the sequence dependency of chromatin interactions at gene promoters. We also find that chromatin interactions alone do not regulate gene expression. Together, our results identify ​ZNF143 as a novel chromatin-looping factor that contributes to the architectural foundation of the genome by providing sequence specificity at promoters connected with distal regulatory elements.}, language = {en}, urldate = {2015-11-17}, journal = {Nature Communications}, author = {Bailey, Swneke D. and Zhang, Xiaoyang and Desai, Kinjal and Aid, Malika and Corradin, Olivia and Cowper-Sal·lari, Richard and Akhtar-Zaidi, Batool and Scacheri, Peter C. and Haibe-Kains, Benjamin and Lupien, Mathieu}, month = feb, year = {2015}, keywords = {Biological sciences, genetics, molecular biology}, pages = {6186}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/T3KAUSWX/Bailey et al. - 2015 - ZNF143 provides sequence specificity to secure chr.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Z2XI58RG/ncomms7186.html:text/html} } @article{henikoff_histone_2015, title = {Histone {Variants} and {Epigenetics}}, volume = {7}, issn = {, 1943-0264}, url = {http://cshperspectives.cshlp.org/content/7/1/a019364}, doi = {10.1101/cshperspect.a019364}, abstract = {Histones package and compact DNA by assembling into nucleosome core particles. Most histones are synthesized at S phase for rapid deposition behind replication forks. In addition, the replacement of histones deposited during S phase by variants that can be deposited independently of replication provide the most fundamental level of chromatin differentiation. Alternative mechanisms for depositing different variants can potentially establish and maintain epigenetic states. Variants have also evolved crucial roles in chromosome segregation, transcriptional regulation, DNA repair, and other processes. Investigations into the evolution, structure, and metabolism of histone variants provide a foundation for understanding the participation of chromatin in important cellular processes and in epigenetic memory.}, language = {en}, number = {1}, urldate = {2015-09-28}, journal = {Cold Spring Harbor Perspectives in Biology}, author = {Henikoff, Steven and Smith, M. Mitchell}, month = jan, year = {2015}, pmid = {25561719}, pages = {a019364}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/E6UPDJKI/Henikoff et Smith - 2015 - Histone Variants and Epigenetics.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/E67U5U59/a019364.html:text/html} } @article{barth_fast_2010, title = {Fast signals and slow marks: the dynamics of histone modifications}, volume = {35}, issn = {0968-0004}, shorttitle = {Fast signals and slow marks}, url = {http://www.sciencedirect.com/science/article/pii/S0968000410000940}, doi = {10.1016/j.tibs.2010.05.006}, abstract = {Most multi-cellular organisms adopt a specific gene expression pattern during cellular differentiation. Once established, this pattern is frequently maintained over several cell divisions despite the fact that the initiating signal is no longer present. Differential packaging into chromatin is one such mechanism that allows fixation of transcriptional activity. Recent genome-wide studies demonstrate that actively transcribed regions are characterized by a specific modification pattern of histones, the main protein component of chromatin. These findings support the hypothesis that a histone code uses histone post-translational modifications to stably inscribe particular chromatin structures into the genome. Experiments on the dynamics of histone modifications reveal a striking kinetic difference between methylation, phosphorylation and acetylation, suggesting different roles of these modifications in epigenetically fixing specific gene expression patterns.}, number = {11}, urldate = {2015-09-28}, journal = {Trends in Biochemical Sciences}, author = {Barth, Teresa K. and Imhof, Axel}, month = nov, year = {2010}, pages = {618--626}, file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UPFQHFWS/Barth et Imhof - 2010 - Fast signals and slow marks the dynamics of histo.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ACW228QE/S0968000410000940.html:text/html} } @article{venkatesh_histone_2015, title = {Histone exchange, chromatin structure and the regulation of transcription}, volume = {16}, copyright = {© 2015 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {1471-0072}, url = {http://www.nature.com/nrm/journal/v16/n3/full/nrm3941.html}, doi = {10.1038/nrm3941}, abstract = {The packaging of DNA into strings of nucleosomes is one of the features that allows eukaryotic cells to tightly regulate gene expression. The ordered disassembly of nucleosomes permits RNA polymerase II (Pol II) to access the DNA, whereas nucleosomal reassembly impedes access, thus preventing transcription and mRNA synthesis. Chromatin modifications, chromatin remodellers, histone chaperones and histone variants regulate nucleosomal dynamics during transcription. Disregulation of nucleosome dynamics results in aberrant transcription initiation, producing non-coding RNAs. Ongoing research is elucidating the molecular mechanisms that regulate chromatin structure during transcription by preventing histone exchange, thereby limiting non-coding RNA expression.}, language = {en}, number = {3}, urldate = {2015-09-28}, journal = {Nature Reviews Molecular Cell Biology}, author = {Venkatesh, Swaminathan and Workman, Jerry L.}, month = mar, year = {2015}, pages = {178--189}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/DSVWNBZV/Venkatesh et Workman - 2015 - Histone exchange, chromatin structure and the regu.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/W2JBHNFP/nrm3941.html:text/html} } -@article{barth_fast_2010-1, - title = {Fast signals and slow marks: the dynamics of histone modifications}, - volume = {35}, - issn = {0968-0004}, - shorttitle = {Fast signals and slow marks}, - url = {http://www.sciencedirect.com/science/article/pii/S0968000410000940}, - doi = {10.1016/j.tibs.2010.05.006}, - abstract = {Most multi-cellular organisms adopt a specific gene expression pattern during cellular differentiation. Once established, this pattern is frequently maintained over several cell divisions despite the fact that the initiating signal is no longer present. Differential packaging into chromatin is one such mechanism that allows fixation of transcriptional activity. Recent genome-wide studies demonstrate that actively transcribed regions are characterized by a specific modification pattern of histones, the main protein component of chromatin. These findings support the hypothesis that a histone code uses histone post-translational modifications to stably inscribe particular chromatin structures into the genome. Experiments on the dynamics of histone modifications reveal a striking kinetic difference between methylation, phosphorylation and acetylation, suggesting different roles of these modifications in epigenetically fixing specific gene expression patterns.}, - number = {11}, - urldate = {2015-09-29}, - journal = {Trends in Biochemical Sciences}, - author = {Barth, Teresa K. and Imhof, Axel}, - month = nov, - year = {2010}, - pages = {618--626}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/U97TKNPN/Barth et Imhof - 2010 - Fast signals and slow marks the dynamics of histo.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/EN6WBTWZ/S0968000410000940.html:text/html} -} - @article{tsompana_chromatin_2014, title = {Chromatin accessibility: a window into the genome}, volume = {7}, issn = {1756-8935}, shorttitle = {Chromatin accessibility}, url = {http://www.ncbi.nlm.nih.gov/pmc/articles/PMC4253006/}, doi = {10.1186/1756-8935-7-33}, abstract = {Transcriptional activation throughout the eukaryotic lineage has been tightly linked with disruption of nucleosome organization at promoters, enhancers, silencers, insulators and locus control regions due to transcription factor binding. Regulatory DNA thus coincides with open or accessible genomic sites of remodeled chromatin. Current chromatin accessibility assays are used to separate the genome by enzymatic or chemical means and isolate either the accessible or protected locations. The isolated DNA is then quantified using a next-generation sequencing platform. Wide application of these assays has recently focused on the identification of the instrumental epigenetic changes responsible for differential gene expression, cell proliferation, functional diversification and disease development. Here we discuss the limitations and advantages of current genome-wide chromatin accessibility assays with especial attention on experimental precautions and sequence data analysis. We conclude with our perspective on future improvements necessary for moving the field of chromatin profiling forward.}, urldate = {2015-10-01}, journal = {Epigenetics \& Chromatin}, author = {Tsompana, Maria and Buck, Michael J}, month = nov, year = {2014}, pmid = {25473421}, pmcid = {PMC4253006}, file = {PubMed Central Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/X5EEV2QU/Tsompana et Buck - 2014 - Chromatin accessibility a window into the genome.pdf:application/pdf} } @article{iwafuchi-doi_pioneer_2014, title = {Pioneer transcription factors in cell reprogramming}, volume = {28}, issn = {0890-9369, 1549-5477}, url = {http://genesdev.cshlp.org/content/28/24/2679}, doi = {10.1101/gad.253443.114}, abstract = {A subset of eukaryotic transcription factors possesses the remarkable ability to reprogram one type of cell into another. The transcription factors that reprogram cell fate are invariably those that are crucial for the initial cell programming in embryonic development. To elicit cell programming or reprogramming, transcription factors must be able to engage genes that are developmentally silenced and inappropriate for expression in the original cell. Developmentally silenced genes are typically embedded in “closed” chromatin that is covered by nucleosomes and not hypersensitive to nuclease probes such as DNase I. Biochemical and genomic studies have shown that transcription factors with the highest reprogramming activity often have the special ability to engage their target sites on nucleosomal DNA, thus behaving as “pioneer factors” to initiate events in closed chromatin. Other reprogramming factors appear dependent on pioneer factors for engaging nucleosomes and closed chromatin. However, certain genomic domains in which nucleosomes are occluded by higher-order chromatin structures, such as in heterochromatin, are resistant to pioneer factor binding. Understanding the means by which pioneer factors can engage closed chromatin and how heterochromatin can prevent such binding promises to advance our ability to reprogram cell fates at will and is the topic of this review.}, language = {en}, number = {24}, urldate = {2015-10-01}, journal = {Genes \& Development}, author = {Iwafuchi-Doi, Makiko and Zaret, Kenneth S.}, month = dec, year = {2014}, pmid = {25512556}, keywords = {Chromatin, pioneer transcription factor, transdifferentiation, Reprogramming, development, nucleosome}, pages = {2679--2692}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/CEITEC7S/Iwafuchi-Doi et Zaret - 2014 - Pioneer transcription factors in cell reprogrammin.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/KB29H8TM/2679.html:text/html} } @article{cairns_logic_2009, title = {The logic of chromatin architecture and remodelling at promoters}, volume = {461}, copyright = {© 2009 Nature Publishing Group}, issn = {0028-0836}, url = {http://www.nature.com/nature/journal/v461/n7261/full/nature08450.html}, doi = {10.1038/nature08450}, abstract = {The regulation of gene transcription involves a dynamic balance between packaging regulatory sequences into chromatin and allowing transcriptional regulators access to these sequences. Access is restricted by the nucleosomes, but these can be repositioned or ejected by enzymes known as nucleosome remodellers. In addition, the DNA sequence can impart stiffness or curvature to the DNA, thereby affecting the position of nucleosomes on the DNA, influencing particular promoter 'architectures'. Recent genome-wide studies in yeast suggest that constitutive and regulated genes have architectures that differ in terms of nucleosome position, turnover, remodelling requirements and transcriptional noise.}, language = {en}, number = {7261}, urldate = {2015-10-02}, journal = {Nature}, author = {Cairns, Bradley R.}, month = sep, year = {2009}, pages = {193--198}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XWRUTA2D/Cairns - 2009 - The logic of chromatin architecture and remodellin.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/CPRFW37U/nature08450.html:text/html} } @article{the_uk10k_consortium_uk10k_2015, title = {The {UK}10K project identifies rare variants in health and disease}, volume = {526}, copyright = {© 2015 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {0028-0836}, url = {http://www.nature.com/nature/journal/v526/n7571/full/nature14962.html}, doi = {10.1038/nature14962}, abstract = {The contribution of rare and low-frequency variants to human traits is largely unexplored. Here we describe insights from sequencing whole genomes (low read depth, 7×) or exomes (high read depth, 80×) of nearly 10,000 individuals from population-based and disease collections. In extensively phenotyped cohorts we characterize over 24 million novel sequence variants, generate a highly accurate imputation reference panel and identify novel alleles associated with levels of triglycerides (APOB), adiponectin (ADIPOQ) and low-density lipoprotein cholesterol (LDLR and RGAG1) from single-marker and rare variant aggregation tests. We describe population structure and functional annotation of rare and low-frequency variants, use the data to estimate the benefits of sequencing for association studies, and summarize lessons from disease-specific collections. Finally, we make available an extensive resource, including individual-level genetic and phenotypic data and web-based tools to facilitate the exploration of association results.}, language = {en}, number = {7571}, urldate = {2015-10-09}, journal = {Nature}, author = {{The UK10K Consortium}}, month = oct, year = {2015}, keywords = {Next-generation sequencing, Genome-wide association studies}, pages = {82--90}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/CUKIZJGS/The UK10K Consortium - 2015 - The UK10K project identifies rare variants in heal.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HZEXSHCX/nature14962.html:text/html} } -@article{zwart_carrier-assisted_2013, - title = {A carrier-assisted {ChIP}-seq method for estrogen receptor-chromatin interactions from breast cancer core needle biopsy samples}, - volume = {14}, - copyright = {2013 Zwart et al.; licensee BioMed Central Ltd.}, - issn = {1471-2164}, - url = {http://www.biomedcentral.com/1471-2164/14/232/abstract}, - doi = {10.1186/1471-2164-14-232}, - abstract = {The Estrogen Receptor alpha (ERα) is the key transcriptional regulator in luminal breast cancer and is therefore the main target for adjuvant treatment of this subtype. Luminal gene signatures are dictated by the transcriptional capacities of ERα, which are a direct consequence of the receptors binding preference at specific sites on the chromatin. The identification of ERα binding signatures on a genome-wide level has greatly enhanced our understanding of Estrogen Receptor biology in cell lines and tumours, but the technique has its limitations with respect to its applicability in limited amounts of tumour tissue.}, - language = {en}, - number = {1}, - urldate = {2015-10-16}, - journal = {BMC Genomics}, - author = {Zwart, Wilbert and Koornstra, Rutger and Wesseling, Jelle and Rutgers, Emiel and Linn, Sabine and Carroll, Jason S.}, - month = apr, - year = {2013}, - pmid = {23565824}, - pages = {232}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/BV5UA68M/Zwart et al. - 2013 - A carrier-assisted ChIP-seq method for estrogen re.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/KP86QEPG/232.html:text/html} -} - @article{locke_coordinated_2015, title = {Coordinated epigenetic remodelling of transcriptional networks occurs during early breast carcinogenesis}, volume = {7}, copyright = {2015 Locke et al.; licensee BioMed Central.}, issn = {1868-7083}, url = {http://www.clinicalepigeneticsjournal.com/content/7/1/52/abstract}, doi = {10.1186/s13148-015-0086-0}, abstract = {Dysregulation of the epigenome is a common event in malignancy; however, deciphering the earliest cancer-associated epigenetic events remains a challenge. Cancer epigenome studies to date have primarily utilised cancer cell lines or clinical samples, where it is difficult to identify the initial epigenetic lesions from those that occur over time. Here, we analysed the epigenome of human mammary epithelial cells (HMEC) and a matched variant cell population (vHMEC) that have spontaneously escaped senescence and undergone partial carcinogenic transformation. Using this model of basal-like breast carcinogenesis, we provide striking new insights into the very first epigenetic changes that occur during the initial stages of malignancy.}, language = {en}, number = {1}, urldate = {2015-10-19}, journal = {Clinical Epigenetics}, author = {Locke, Warwick J. and Zotenko, Elena and Stirzaker, Clare and Robinson, Mark D. and Hinshelwood, Rebecca A. and Stone, Andrew and Reddel, Roger R. and Huschtscha, Lily I. and Clark, Susan J.}, month = may, year = {2015}, pmid = {25960784}, keywords = {DNA Methylation, Methylome, Basal breast cancer, Epigenome sequencing, Biomarker, epigenetics}, pages = {52}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7R7V74EJ/Locke et al. - 2015 - Coordinated epigenetic remodelling of transcriptio.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/92XAVETV/52.html:text/html} } @article{su_somatic_2015, title = {Somatic {Cell} {Fusions} {Reveal} {Extensive} {Heterogeneity} in {Basal}-like {Breast} {Cancer}}, volume = {11}, issn = {2211-1247}, url = {http://www.sciencedirect.com/science/article/pii/S2211124715005239}, doi = {10.1016/j.celrep.2015.05.011}, abstract = {Summary Basal-like and luminal breast tumors have distinct clinical behavior and molecular profiles, yet the underlying mechanisms are poorly defined. To interrogate processes that determine these distinct phenotypes and their inheritance pattern, we generated somatic cell fusions and performed integrated genetic and epigenetic (DNA methylation and chromatin) profiling. We found that the basal-like trait is generally dominant and is largely defined by epigenetic repression of luminal transcription factors. Definition of super-enhancers highlighted a core program common in luminal cells but a high degree of heterogeneity in basal-like breast cancers that correlates with clinical outcome. We also found that protein extracts of basal-like cells are sufficient to induce a luminal-to-basal phenotypic switch, implying a trigger of basal-like autoregulatory circuits. We determined that KDM6A might be required for luminal-basal fusions, and we identified EN1, TBX18, and TCF4 as candidate transcriptional regulators of the luminal-to-basal switch. Our findings highlight the remarkable epigenetic plasticity of breast cancer cells.}, number = {10}, urldate = {2015-11-02}, journal = {Cell Reports}, author = {Su, Ying and Subedee, Ashim and Bloushtain-Qimron, Noga and Savova, Virginia and Krzystanek, Marcin and Li, Lewyn and Marusyk, Andriy and Tabassum, Doris P. and Zak, Alexander and Flacker, Mary Jo and Li, Mei and Lin, Jessica J. and Sukumar, Saraswati and Suzuki, Hiromu and Long, Henry and Szallasi, Zoltan and Gimelbrant, Alexander and Maruyama, Reo and Polyak, Kornelia}, month = jun, year = {2015}, pages = {1549--1563}, file = {ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4MNPHIBW/S2211124715005239.html:text/html} } @article{gascard_epigenetic_2015, title = {Epigenetic and transcriptional determinants of the human breast}, volume = {6}, copyright = {© 2015 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, url = {http://www.nature.com/ncomms/2015/150218/ncomms7351/full/ncomms7351.html}, doi = {10.1038/ncomms7351}, abstract = {While significant effort has been dedicated to the characterization of epigenetic changes associated with prenatal differentiation, relatively little is known about the epigenetic changes that accompany post-natal differentiation where fully functional differentiated cell types with limited lifespans arise. Here we sought to address this gap by generating epigenomic and transcriptional profiles from primary human breast cell types isolated from disease-free human subjects. From these data we define a comprehensive human breast transcriptional network, including a set of myoepithelial- and luminal epithelial-specific intronic retention events. Intersection of epigenetic states with RNA expression from distinct breast epithelium lineages demonstrates that mCpG provides a stable record of exonic and intronic usage, whereas H3K36me3 is dynamic. We find a striking asymmetry in epigenomic reprogramming between luminal and myoepithelial cell types, with the genomes of luminal cells harbouring more than twice the number of hypomethylated enhancer elements compared with myoepithelial cells.}, language = {en}, urldate = {2015-11-18}, journal = {Nature Communications}, author = {Gascard, Philippe and Bilenky, Misha and Sigaroudinia, Mahvash and Zhao, Jianxin and Li, Luolan and Carles, Annaick and Delaney, Allen and Tam, Angela and Kamoh, Baljit and Cho, Stephanie and Griffith, Malachi and Chu, Andy and Robertson, Gordon and Cheung, Dorothy and Li, Irene and Heravi-Moussavi, Alireza and Moksa, Michelle and Mingay, Matthew and Hussainkhel, Angela and Davis, Brad and Nagarajan, Raman P. and Hong, Chibo and Echipare, Lorigail and O’Geen, Henriette and Hangauer, Matthew J. and Cheng, Jeffrey B. and Neel, Dana and Hu, Donglei and McManus, Michael T. and Moore, Richard and Mungall, Andrew and Ma, Yussanne and Plettner, Patrick and Ziv, Elad and Wang, Ting and Farnham, Peggy J. and Jones, Steven J. M. and Marra, Marco A. and Tlsty, Thea D. and Costello, Joseph F. and Hirst, Martin}, month = feb, year = {2015}, keywords = {Biological sciences, developmental biology, molecular biology}, pages = {6351}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9KJ75WN5/Gascard et al. - 2015 - Epigenetic and transcriptional determinants of the.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/766Q6FZB/ncomms7351.html:text/html} } @article{soufi_pioneer_2015, title = {Pioneer {Transcription} {Factors} {Target} {Partial} {DNA} {Motifs} on {Nucleosomes} to {Initiate} {Reprogramming}}, volume = {161}, issn = {0092-8674}, url = {http://www.cell.com/article/S0092867415003049/abstract}, doi = {10.1016/j.cell.2015.03.017}, abstract = {Pioneer transcription factors (TFs) access silent chromatin and initiate cell-fate changes, using diverse types of DNA binding domains (DBDs). FoxA, the paradigm pioneer TF, has a winged helix DBD that resembles linker histone and thereby binds its target sites on nucleosomes and in compacted chromatin. Herein, we compare the nucleosome and chromatin targeting activities of Oct4 (POU DBD), Sox2 (HMG box DBD), Klf4 (zinc finger DBD), and c-Myc (bHLH DBD), which together reprogram somatic cells to pluripotency. Purified Oct4, Sox2, and Klf4 proteins can bind nucleosomes in vitro, and in vivo they preferentially target silent sites enriched for nucleosomes. Pioneer activity relates simply to the ability of a given DBD to target partial motifs displayed on the nucleosome surface. Such partial motif recognition can occur by coordinate binding between factors. Our findings provide insight into how pioneer factors can target naive chromatin sites.}, language = {English}, number = {3}, urldate = {2015-12-02}, journal = {Cell}, author = {Soufi, Abdenour and Garcia, Meilin Fernandez and Jaroszewicz, Artur and Osman, Nebiyu and Pellegrini, Matteo and Zaret, Kenneth S.}, month = apr, year = {2015}, pmid = {25892221}, pages = {555--568}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6KNK7QSD/Soufi et al. - 2015 - Pioneer Transcription Factors Target Partial DNA M.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/5GT7KEX7/S0092-8674(15)00304-9.html:text/html} } @article{weber_nucleosomes_2014, title = {Nucleosomes {Are} {Context}-{Specific}, {H}2A.{Z}-{Modulated} {Barriers} to {RNA} {Polymerase}}, volume = {53}, issn = {1097-2765}, url = {http://www.cell.com/article/S1097276514001592/abstract}, doi = {10.1016/j.molcel.2014.02.014}, abstract = {Nucleosomes are barriers to transcription in vitro; however, their effects on RNA polymerase in vivo are unknown. Here we describe a simple and general strategy to comprehensively map the positions of elongating and arrested RNA polymerase II (RNAPII) at nucleotide resolution. We find that the entry site of the first (+1) nucleosome is a barrier to RNAPII for essentially all genes, including those undergoing regulated pausing farther upstream. In contrast to the +1 nucleosome, gene body nucleosomes are low barriers and cause RNAPII stalling both at the entry site and near the dyad axis. The extent of the +1 nucleosome barrier correlates with nucleosome occupancy but anticorrelates with enrichment of histone variant H2A.Z. Importantly, depletion of H2A.Z from a nucleosome position results in a higher barrier to RNAPII. Our results suggest that nucleosomes present significant, context-specific barriers to RNAPII in vivo that can be tuned by the incorporation of H2A.Z.}, language = {English}, number = {5}, urldate = {2016-01-07}, journal = {Molecular Cell}, author = {Weber, Christopher M. and Ramachandran, Srinivas and Henikoff, Steven}, month = jun, year = {2014}, pmid = {24606920}, pages = {819--830}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/3MMPKGM5/Weber et al. - 2014 - Nucleosomes Are Context-Specific, H2A.Z-Modulated .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/2VESJ49J/S1097-2765(14)00159-2.html:text/html} } @article{li_combining_2015, - series = {({Epi}){Genomics} approaches and their applications}, - title = {Combining {MeDIP}-seq and {MRE}-seq to investigate genome-wide {CpG} methylation}, - volume = {72}, - issn = {1046-2023}, - url = {http://www.sciencedirect.com/science/article/pii/S1046202314003594}, - doi = {10.1016/j.ymeth.2014.10.032}, - abstract = {DNA CpG methylation is a widespread epigenetic mark in high eukaryotes including mammals. DNA methylation plays key roles in diverse biological processes such as X chromosome inactivation, transposable element repression, genomic imprinting, and control of gene expression. Recent advancements in sequencing-based DNA methylation profiling methods provide an unprecedented opportunity to measure DNA methylation in a genome-wide fashion, making it possible to comprehensively investigate the role of DNA methylation. Several methods have been developed, such as Whole Genome Bisulfite Sequencing (WGBS), Reduced Representation Bisulfite Sequencing (RRBS), and enrichment-based methods including Methylation Dependent ImmunoPrecipitation followed by sequencing (MeDIP-seq), methyl-CpG binding domain (MBD) protein-enriched genome sequencing (MBD-seq), methyltransferase-directed Transfer of Activated Groups followed by sequencing (mTAG), and Methylation-sensitive Restriction Enzyme digestion followed by sequencing (MRE-seq). These methods differ by their genomic CpG coverage, resolution, quantitative accuracy, cost, and software for analyzing the data. Among these, WGBS is considered the gold standard. However, it is still a cost-prohibitive technology for a typical laboratory due to the required sequencing depth. We found that by integrating two enrichment-based methods that are complementary in nature (i.e., MeDIP-seq and MRE-seq), we can significantly increase the efficiency of whole DNA methylome profiling. By using two recently developed computational algorithms (i.e., M\&M and methylCRF), the combination of MeDIP-seq and MRE-seq produces genome-wide CpG methylation measurement at high coverage and high resolution, and robust predictions of differentially methylated regions. Thus, the combination of the two enrichment-based methods provides a cost-effective alternative to WGBS. In this article we describe both the experimental protocols for performing MeDIP-seq and MRE-seq, and the computational protocols for running M\&M and methylCRF.}, - urldate = {2015-11-20}, - journal = {Methods}, - author = {Li, Daofeng and Zhang, Bo and Xing, Xiaoyun and Wang, Ting}, - month = jan, - year = {2015}, - keywords = {DNA Methylation, MeDIP-seq, MRE-seq, M\&M, methylCRF}, - pages = {29--40}, - file = {1-s2.0-S1046202314003594-main.pdf:/home/romaingroux/Bureau/1-s2.0-S1046202314003594-main.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/IWTCECVF/S1046202314003594.html:text/html} -} - -@article{li_combining_2015-1, series = {({Epi}){Genomics} approaches and their applications}, title = {Combining {MeDIP}-seq and {MRE}-seq to investigate genome-wide {CpG} methylation}, volume = {72}, issn = {1046-2023}, url = {http://www.sciencedirect.com/science/article/pii/S1046202314003594}, doi = {10.1016/j.ymeth.2014.10.032}, abstract = {DNA CpG methylation is a widespread epigenetic mark in high eukaryotes including mammals. DNA methylation plays key roles in diverse biological processes such as X chromosome inactivation, transposable element repression, genomic imprinting, and control of gene expression. Recent advancements in sequencing-based DNA methylation profiling methods provide an unprecedented opportunity to measure DNA methylation in a genome-wide fashion, making it possible to comprehensively investigate the role of DNA methylation. Several methods have been developed, such as Whole Genome Bisulfite Sequencing (WGBS), Reduced Representation Bisulfite Sequencing (RRBS), and enrichment-based methods including Methylation Dependent ImmunoPrecipitation followed by sequencing (MeDIP-seq), methyl-CpG binding domain (MBD) protein-enriched genome sequencing (MBD-seq), methyltransferase-directed Transfer of Activated Groups followed by sequencing (mTAG), and Methylation-sensitive Restriction Enzyme digestion followed by sequencing (MRE-seq). These methods differ by their genomic CpG coverage, resolution, quantitative accuracy, cost, and software for analyzing the data. Among these, WGBS is considered the gold standard. However, it is still a cost-prohibitive technology for a typical laboratory due to the required sequencing depth. We found that by integrating two enrichment-based methods that are complementary in nature (i.e., MeDIP-seq and MRE-seq), we can significantly increase the efficiency of whole DNA methylome profiling. By using two recently developed computational algorithms (i.e., M\&M and methylCRF), the combination of MeDIP-seq and MRE-seq produces genome-wide CpG methylation measurement at high coverage and high resolution, and robust predictions of differentially methylated regions. Thus, the combination of the two enrichment-based methods provides a cost-effective alternative to WGBS. In this article we describe both the experimental protocols for performing MeDIP-seq and MRE-seq, and the computational protocols for running M\&M and methylCRF.}, urldate = {2015-11-20}, journal = {Methods}, author = {Li, Daofeng and Zhang, Bo and Xing, Xiaoyun and Wang, Ting}, month = jan, year = {2015}, keywords = {DNA Methylation, MeDIP-seq, MRE-seq, M\&M, methylCRF}, pages = {29--40}, file = {1-s2.0-S1046202314003594-main.pdf:/home/romaingroux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HNFTVWZG/1-s2.0-S1046202314003594-main.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HNFTVWZG/S1046202314003594.html:text/html} } @article{jolma_dna-dependent_2015, title = {{DNA}-dependent formation of transcription factor pairs alters their binding specificity}, volume = {527}, copyright = {© 2015 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {0028-0836}, url = {http://www.nature.com/nature/journal/v527/n7578/full/nature15518.html}, doi = {10.1038/nature15518}, abstract = {Gene expression is regulated by transcription factors (TFs), proteins that recognize short DNA sequence motifs. Such sequences are very common in the human genome, and an important determinant of the specificity of gene expression is the cooperative binding of multiple TFs to closely located motifs. However, interactions between DNA-bound TFs have not been systematically characterized. To identify TF pairs that bind cooperatively to DNA, and to characterize their spacing and orientation preferences, we have performed consecutive affinity-purification systematic evolution of ligands by exponential enrichment (CAP-SELEX) analysis of 9,400 TF–TF–DNA interactions. This analysis revealed 315 TF–TF interactions recognizing 618 heterodimeric motifs, most of which have not been previously described. The observed cooperativity occurred promiscuously between TFs from diverse structural families. Structural analysis of the TF pairs, including a novel crystal structure of MEIS1 and DLX3 bound to their identified recognition site, revealed that the interactions between the TFs were predominantly mediated by DNA. Most TF pair sites identified involved a large overlap between individual TF recognition motifs, and resulted in recognition of composite sites that were markedly different from the individual TF’s motifs. Together, our results indicate that the DNA molecule commonly plays an active role in cooperative interactions that define the gene regulatory lexicon.}, language = {en}, number = {7578}, urldate = {2015-12-02}, journal = {Nature}, author = {Jolma, Arttu and Yin, Yimeng and Nitta, Kazuhiro R. and Dave, Kashyap and Popov, Alexander and Taipale, Minna and Enge, Martin and Kivioja, Teemu and Morgunova, Ekaterina and Taipale, Jussi}, month = nov, year = {2015}, keywords = {DNA, Gene regulation, X-ray crystallography, Transcriptional regulatory elements}, pages = {384--388}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/MIJZ6935/Jolma et al. - 2015 - DNA-dependent formation of transcription factor pa.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/DPX4EIAA/nature15518.html:text/html} } @article{zentner_high-resolution_2014, title = {High-resolution digital profiling of the epigenome}, volume = {15}, copyright = {© 2014 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {1471-0056}, url = {http://www.nature.com/nrg/journal/v15/n12/full/nrg3798.html}, doi = {10.1038/nrg3798}, abstract = {The widespread adoption of short-read DNA sequencing as a digital epigenomic readout platform has motivated the development of genome-wide tools that achieve base-pair resolution. New methods for footprinting and affinity purification of nucleosomes, RNA polymerases, chromatin remodellers and transcription factors have increased the resolution of epigenomic profiling by two orders of magnitude, leading to new insights into how the chromatin landscape affects gene regulation. These digital epigenomic tools have also been applied to directly profile both turnover kinetics and transcription in situ. In this Review, we describe how these new genome-wide tools allow interrogation of diverse aspects of the epigenome.}, language = {en}, number = {12}, urldate = {2015-12-16}, journal = {Nature Reviews Genetics}, author = {Zentner, Gabriel E. and Henikoff, Steven}, month = dec, year = {2014}, keywords = {Next-generation sequencing, Chromatin analysis, epigenetics, Epigenomics}, pages = {814--827}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/H4M8AG8H/Zentner et Henikoff - 2014 - High-resolution digital profiling of the epigenome.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/8FX7956R/nrg3798.html:text/html} } -@article{bonhoure_quantifying_2014, - title = {Quantifying {ChIP}-seq data: a spiking method providing an internal reference for sample-to-sample normalization}, - volume = {24}, - issn = {1088-9051, 1549-5469}, - shorttitle = {Quantifying {ChIP}-seq data}, - url = {http://genome.cshlp.org/content/24/7/1157}, - doi = {10.1101/gr.168260.113}, - abstract = {Chromatin immunoprecipitation followed by deep sequencing (ChIP-seq) experiments are widely used to determine, within entire genomes, the occupancy sites of any protein of interest, including, for example, transcription factors, RNA polymerases, or histones with or without various modifications. In addition to allowing the determination of occupancy sites within one cell type and under one condition, this method allows, in principle, the establishment and comparison of occupancy maps in various cell types, tissues, and conditions. Such comparisons require, however, that samples be normalized. Widely used normalization methods that include a quantile normalization step perform well when factor occupancy varies at a subset of sites, but may miss uniform genome-wide increases or decreases in site occupancy. We describe a spike adjustment procedure (SAP) that, unlike commonly used normalization methods intervening at the analysis stage, entails an experimental step prior to immunoprecipitation. A constant, low amount from a single batch of chromatin of a foreign genome is added to the experimental chromatin. This “spike” chromatin then serves as an internal control to which the experimental signals can be adjusted. We show that the method improves similarity between replicates and reveals biological differences including global and largely uniform changes.}, - language = {en}, - number = {7}, - urldate = {2015-12-17}, - journal = {Genome Research}, - author = {Bonhoure, Nicolas and Bounova, Gergana and Bernasconi, David and Praz, Viviane and Lammers, Fabienne and Canella, Donatella and Willis, Ian M. and Herr, Winship and Hernandez, Nouria and Delorenzi, Mauro and Consortium, The CycliX and Hernandez, Nouria and Delorenzi, Mauro and Deplancke, Bart and Desvergne, Béatrice and Guex, Nicolas and Herr, Winship and Naef, Felix and Rougemont, Jacques and Schibler, Ueli and Andersin, Teemu and Cousin, Pascal and Gilardi, Federica and Gos, Pascal and Lammers, Fabienne and Raghav, Sunil and Villeneuve, Dominic and Fabbretti, Roberto and Vlegel, Volker and Xenarios, Ioannis and Migliavacca, Eugenia and Praz, Viviane and David, Fabrice and Jarosz, Yohan and Kuznetsov, Dmitry and Liechti, Robin and Martin, Olivier and Delafontaine, Julien and Cajan, Julia and Gustafson, Kyle and Krier, Irina and Leleu, Marion and Molina, Nacho and Naldi, Aurélien and Rib, Leonor and Symul, Laura and Bounova, Gergana}, - month = jul, - year = {2014}, - pmid = {24709819}, - pages = {1157--1168}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4ACJ54HP/Bonhoure et al. - 2014 - Quantifying ChIP-seq data a spiking method provid.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UNDJZM98/1157.html:text/html} -} - @article{soon_high-throughput_2014, title = {High-throughput sequencing for biology and medicine}, volume = {9}, issn = {1744-4292}, url = {http://msb.embopress.org/cgi/doi/10.1038/msb.2012.61}, doi = {10.1038/msb.2012.61}, language = {en}, number = {1}, urldate = {2016-01-14}, journal = {Molecular Systems Biology}, author = {Soon, W. W. and Hariharan, M. and Snyder, M. P.}, month = apr, year = {2014}, pages = {640--640}, file = {Soon13.pdf:/home/romaingroux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Soon13.pdf:application/pdf} } @article{whitesides_whitesides_2004, title = {Whitesides' {Group}: {Writing} a {Paper}}, volume = {16}, issn = {1521-4095}, shorttitle = {Whitesides' {Group}}, url = {http://onlinelibrary.wiley.com/doi/10.1002/adma.200400767/abstract}, doi = {10.1002/adma.200400767}, language = {en}, number = {15}, urldate = {2016-01-14}, journal = {Advanced Materials}, author = {Whitesides, G. M.}, month = aug, year = {2004}, pages = {1375--1377}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/CC6CNIUE/Whitesides - 2004 - Whitesides' Group Writing a Paper.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/52MA9ZBD/abstract.html:text/html} } @article{vale_accelerating_2015, title = {Accelerating scientific publication in biology}, volume = {112}, issn = {0027-8424, 1091-6490}, url = {http://www.pnas.org/content/112/44/13439}, doi = {10.1073/pnas.1511912112}, abstract = {Scientific publications enable results and ideas to be transmitted throughout the scientific community. The number and type of journal publications also have become the primary criteria used in evaluating career advancement. Our analysis suggests that publication practices have changed considerably in the life sciences over the past 30 years. More experimental data are now required for publication, and the average time required for graduate students to publish their first paper has increased and is approaching the desirable duration of PhD training. Because publication is generally a requirement for career progression, schemes to reduce the time of graduate student and postdoctoral training may be difficult to implement without also considering new mechanisms for accelerating communication of their work. The increasing time to publication also delays potential catalytic effects that ensue when many scientists have access to new information. The time has come for life scientists, funding agencies, and publishers to discuss how to communicate new findings in a way that best serves the interests of the public and the scientific community.}, language = {en}, number = {44}, urldate = {2016-01-15}, journal = {Proceedings of the National Academy of Sciences}, author = {Vale, Ronald D.}, month = nov, year = {2015}, pmid = {26508643}, keywords = {scientific publication, arXiv, PhD training, career advancement, journals}, pages = {13439--13446}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/G9NU54KG/Vale - 2015 - Accelerating scientific publication in biology.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UARRVZJ4/13439.html:text/html} } @article{chen_chromatin_2014, title = {Chromatin modifiers and remodellers: regulators of cellular differentiation}, volume = {15}, copyright = {© 2013 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {1471-0056}, shorttitle = {Chromatin modifiers and remodellers}, url = {http://www.nature.com/nrg/journal/v15/n2/full/nrg3607.html}, doi = {10.1038/nrg3607}, abstract = {Cellular differentiation is, by definition, epigenetic. Genome-wide profiling of pluripotent cells and differentiated cells suggests global chromatin remodelling during differentiation, which results in a progressive transition from a fairly open chromatin configuration to a more compact state. Genetic studies in mouse models show major roles for a variety of histone modifiers and chromatin remodellers in key developmental transitions, such as the segregation of embryonic and extra-embryonic lineages in blastocyst stage embryos, the formation of the three germ layers during gastrulation and the differentiation of adult stem cells. Furthermore, rather than merely stabilizing the gene expression changes that are driven by developmental transcription factors, there is emerging evidence that chromatin regulators have multifaceted roles in cell fate decisions.}, language = {en}, number = {2}, urldate = {2016-01-18}, journal = {Nature Reviews Genetics}, author = {Chen, Taiping and Dent, Sharon Y. R.}, month = feb, year = {2014}, keywords = {Chromatin remodelling, Differentiation, Histone post-translational modifications, Pluripotency}, pages = {93--106}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/776XAIRC/Chen et Dent - 2014 - Chromatin modifiers and remodellers regulators of.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XPB7IVZ2/nrg3607.html:text/html} } @article{voss_dynamic_2014, title = {Dynamic regulation of transcriptional states by chromatin and transcription factors}, volume = {15}, copyright = {© 2013 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {1471-0056}, url = {http://www.nature.com/nrg/journal/v15/n2/full/nrg3623.html}, doi = {10.1038/nrg3623}, abstract = {The interaction of regulatory proteins with the complex nucleoprotein structures that are found in mammalian cells involves chromatin reorganization at multiple levels. Mechanisms that support these transitions are complex on many timescales, which range from milliseconds to minutes or hours. In this Review, we discuss emerging concepts regarding the function of regulatory elements in living cells. We also explore the involvement of these dynamic and stochastic processes in the evolution of fluctuating transcriptional activity states that are now commonly reported in eukaryotic systems.}, language = {en}, number = {2}, urldate = {2016-01-18}, journal = {Nature Reviews Genetics}, author = {Voss, Ty C. and Hager, Gordon L.}, month = feb, year = {2014}, keywords = {Gene regulation, Chromatin remodelling, Nuclear receptors}, pages = {69--81}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HHXI44C5/Voss et Hager - 2014 - Dynamic regulation of transcriptional states by ch.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/2MW9DB9V/nrg3623.html:text/html} } @article{yusuf_transcription_2012, title = {The {Transcription} {Factor} {Encyclopedia}}, volume = {13}, copyright = {2012 Yusuf et al.; licensee BioMed Central Ltd.}, issn = {1465-6906}, url = {http://genomebiology.com/2012/13/3/R24/abstract}, doi = {10.1186/gb-2012-13-3-r24}, abstract = {Here we present the Transcription Factor Encyclopedia (TFe), a new web-based compendium of mini review articles on transcription factors (TFs) that is founded on the principles of open access and collaboration. Our consortium of over 100 researchers has collectively contributed over 130 mini review articles on pertinent human, mouse and rat TFs. Notable features of the TFe website include a high-quality PDF generator and web API for programmatic data retrieval. TFe aims to rapidly educate scientists about the TFs they encounter through the delivery of succinct summaries written and vetted by experts in the field. TFe is available at http://www.cisreg.ca/tfe.}, language = {en}, number = {3}, urldate = {2016-01-19}, journal = {Genome Biology}, author = {Yusuf, Dimas and Butland, Stefanie L. and Swanson, Magdalena I. and Bolotin, Eugene and Ticoll, Amy and Cheung, Warren A. and Zhang, Xiao Y. Cindy and Dickman, Christopher TD and Fulton, Debra L. and Lim, Jonathan S. and Schnabl, Jake M. and Ramos, Oscar HP and Vasseur-Cognet, Mireille and Leeuw, Charles N. de and Simpson, Elizabeth M. and Ryffel, Gerhart U. and Lam, Eric W.-F. and Kist, Ralf and Wilson, Miranda SC and Marco-Ferreres, Raquel and Brosens, Jan J. and Beccari, Leonardo L. and Bovolenta, Paola and Benayoun, Bérénice A. and Monteiro, Lara J. and Schwenen, Helma DC and Grontved, Lars and Wederell, Elizabeth and Mandrup, Susanne and Veitia, Reiner A. and Chakravarthy, Harini and Hoodless, Pamela A. and Mancarelli, M. Michela and Torbett, Bruce E. and Banham, Alison H. and Reddy, Sekhar P. and Cullum, Rebecca L. and Liedtke, Michaela and Tschan, Mario P. and Vaz, Michelle and Rizzino, Angie and Zannini, Mariastella and Frietze, Seth and Farnham, Peggy J. and Eijkelenboom, Astrid and Brown, Philip J. and Laperrière, David and Leprince, Dominique and Cristofaro, Tiziana de and Prince, Kelly L. and Putker, Marrit and Peso, Luis del and Camenisch, Gieri and Wenger, Roland H. and Mikula, Michal and Rozendaal, Marieke and Mader, Sylvie and Ostrowski, Jerzy and Rhodes, Simon J. and Rechem, Capucine Van and Boulay, Gaylor and Olechnowicz, Sam WZ and Breslin, Mary B. and Lan, Michael S. and Nanan, Kyster K. and Wegner, Michael and Hou, Juan and Mullen, Rachel D. and Colvin, Stephanie C. and Noy, Peter J. and Webb, Carol F. and Witek, Matthew E. and Ferrell, Scott and Daniel, Juliet M. and Park, Jason and Waldman, Scott A. and Peet, Daniel J. and Taggart, Michael and Jayaraman, Padma-Sheela and Karrich, Julien J. and Blom, Bianca and Vesuna, Farhad and O'Geen, Henriette and Sun, Yunfu and Gronostajski, Richard M. and Woodcroft, Mark W. and Hough, Margaret R. and Chen, Edwin and Europe-Finner, G. Nicholas and Karolczak-Bayatti, Magdalena and Bailey, Jarrod and Hankinson, Oliver and Raman, Venu and LeBrun, David P. and Biswal, Shyam and Harvey, Christopher J. and DeBruyne, Jason P. and Hogenesch, John B. and Hevner, Robert F. and Héligon, Christophe and Luo, Xin M. and Blank, Marissa C. and Millen, Kathleen J. and Sharlin, David S. and Forrest, Douglas and Dahlman-Wright, Karin and Zhao, Chunyan and Mishima, Yuriko and Sinha, Satrajit and Chakrabarti, Rumela and Portales-Casamar, Elodie and Sladek, Frances M. and Bradley, Philip H. and Wasserman, Wyeth W.}, month = mar, year = {2012}, pmid = {22458515}, pages = {R24}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4ZWWPCW9/Yusuf et al. - 2012 - The Transcription Factor Encyclopedia.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/T826TI5M/R24.html:text/html} } @article{arvey_sequence_2012, title = {Sequence and chromatin determinants of cell-type–specific transcription factor binding}, volume = {22}, issn = {1088-9051, 1549-5469}, url = {http://genome.cshlp.org/content/22/9/1723}, doi = {10.1101/gr.127712.111}, abstract = {Gene regulatory programs in distinct cell types are maintained in large part through the cell-type–specific binding of transcription factors (TFs). The determinants of TF binding include direct DNA sequence preferences, DNA sequence preferences of cofactors, and the local cell-dependent chromatin context. To explore the contribution of DNA sequence signal, histone modifications, and DNase accessibility to cell-type–specific binding, we analyzed 286 ChIP-seq experiments performed by the ENCODE Consortium. This analysis included experiments for 67 transcriptional regulators, 15 of which were profiled in both the GM12878 (lymphoblastoid) and K562 (erythroleukemic) human hematopoietic cell lines. To model TF-bound regions, we trained support vector machines (SVMs) that use flexible k-mer patterns to capture DNA sequence signals more accurately than traditional motif approaches. In addition, we trained SVM spatial chromatin signatures to model local histone modifications and DNase accessibility, obtaining significantly more accurate TF occupancy predictions than simpler approaches. Consistent with previous studies, we find that DNase accessibility can explain cell-line–specific binding for many factors. However, we also find that of the 10 factors with prominent cell-type–specific binding patterns, four display distinct cell-type–specific DNA sequence preferences according to our models. Moreover, for two factors we identify cell-specific binding sites that are accessible in both cell types but bound only in one. For these sites, cell-type–specific sequence models, rather than DNase accessibility, are better able to explain differential binding. Our results suggest that using a single motif for each TF and filtering for chromatin accessible loci is not always sufficient to accurately account for cell-type–specific binding profiles.}, language = {en}, number = {9}, urldate = {2016-01-19}, journal = {Genome Research}, author = {Arvey, Aaron and Agius, Phaedra and Noble, William Stafford and Leslie, Christina}, month = sep, year = {2012}, pmid = {22955984}, pages = {1723--1734}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/EIBI77AP/Arvey et al. - 2012 - Sequence and chromatin determinants of cell-type–s.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/J34PZE7C/1723.html:text/html} } @article{wingender_tfclass:_2013, title = {{TFClass}: an expandable hierarchical classification of human transcription factors}, volume = {41}, issn = {0305-1048, 1362-4962}, shorttitle = {{TFClass}}, url = {http://nar.oxfordjournals.org/content/41/D1/D165}, doi = {10.1093/nar/gks1123}, abstract = {TFClass (http://tfclass.bioinf.med.uni-goettingen.de/) provides a comprehensive classification of human transcription factors based on their DNA-binding domains. Transcription factors constitute a large functional family of proteins directly regulating the activity of genes. Most of them are sequence-specific DNA-binding proteins, thus reading out the information encoded in cis-regulatory DNA elements of promoters, enhancers and other regulatory regions of a genome. TFClass is a database that classifies human transcription factors by a six-level classification schema, four of which are abstractions according to different criteria, while the fifth level represents TF genes and the sixth individual gene products. Altogether, nine superclasses have been identified, comprising 40 classes and 111 families. Counted by genes, 1558 human TFs have been classified so far or {\textgreater}2900 different TFs when including their isoforms generated by alternative splicing or protein processing events. With this classification, we hope to provide a basis for deciphering protein–DNA recognition codes; moreover, it can be used for constructing expanded transcriptional networks by inferring additional TF-target gene relations.}, language = {en}, number = {D1}, urldate = {2016-01-19}, journal = {Nucleic Acids Research}, author = {Wingender, Edgar and Schoeps, Torsten and Dönitz, Jürgen}, month = jan, year = {2013}, pmid = {23180794}, pages = {D165--D170}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Q3PRSC5J/Wingender et al. - 2013 - TFClass an expandable hierarchical classification.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GS9XIDFU/D165.html:text/html} } @article{spitz_transcription_2012, title = {Transcription factors: from enhancer binding to developmental control}, volume = {13}, copyright = {© 2012 Nature Publishing Group}, issn = {1471-0056}, shorttitle = {Transcription factors}, url = {http://www.nature.com/nrg/journal/v13/n9/full/nrg3207.html}, doi = {10.1038/nrg3207}, abstract = {Developmental progression is driven by specific spatiotemporal domains of gene expression, which give rise to stereotypically patterned embryos even in the presence of environmental and genetic variation. Views of how transcription factors regulate gene expression are changing owing to recent genome-wide studies of transcription factor binding and RNA expression. Such studies reveal patterns that, at first glance, seem to contrast with the robustness of the developmental processes they encode. Here, we review our current knowledge of transcription factor function from genomic and genetic studies and discuss how different strategies, including extensive cooperative regulation (both direct and indirect), progressive priming of regulatory elements, and the integration of activities from multiple enhancers, confer specificity and robustness to transcriptional regulation during development.}, language = {en}, number = {9}, urldate = {2016-01-19}, journal = {Nature Reviews Genetics}, author = {Spitz, François and Furlong, Eileen E. M.}, month = sep, year = {2012}, pages = {613--626}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/88HIRA68/Spitz et Furlong - 2012 - Transcription factors from enhancer binding to de.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/F4CR3GTQ/nrg3207.html:text/html} } -@article{kelly_h2a.z_2010, - title = {H2A.{Z} {Maintenance} during {Mitosis} {Reveals} {Nucleosome} {Shifting} on {Mitotically} {Silenced} {Genes}}, - volume = {39}, - issn = {1097-2765}, - url = {http://www.sciencedirect.com/science/article/pii/S1097276510006362}, - doi = {10.1016/j.molcel.2010.08.026}, - abstract = {Summary -Profound chromatin changes occur during mitosis to allow for gene silencing and chromosome segregation followed by reactivation of memorized transcription states in daughter cells. Using genome-wide sequencing, we found H2A.Z-containing +1 nucleosomes of active genes shift upstream to occupy TSSs during mitosis, significantly reducing nucleosome-depleted regions. Single-molecule analysis confirmed nucleosome shifting and demonstrated that mitotic shifting is specific to active genes that are silenced during mitosis and, thus, is not seen on promoters, which are silenced by methylation or mitotically expressed genes. Using the GRP78 promoter as a model, we found H3K4 trimethylation is also maintained while other indicators of active chromatin are lost and expression is decreased. These key changes provide a potential mechanism for rapid silencing and reactivation of genes during the cell cycle.}, - number = {6}, - urldate = {2016-01-19}, - journal = {Molecular Cell}, - author = {Kelly, Theresa K. and Miranda, Tina Branscombe and Liang, Gangning and Berman, Benjamin P. and Lin, Joy C. and Tanay, Amos and Jones, Peter A.}, - month = sep, - year = {2010}, - pages = {901--911}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/W99N9G89/Kelly et al. - 2010 - H2A.Z Maintenance during Mitosis Reveals Nucleosom.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/US9QVA9H/S1097276510006362.html:text/html} -} - @article{geertz_massively_2012, title = {Massively parallel measurements of molecular interaction kinetics on a microfluidic platform}, volume = {109}, issn = {0027-8424, 1091-6490}, url = {http://www.pnas.org/content/109/41/16540}, doi = {10.1073/pnas.1206011109}, abstract = {Quantitative biology requires quantitative data. No high-throughput technologies exist capable of obtaining several hundred independent kinetic binding measurements in a single experiment. We present an integrated microfluidic device (k-MITOMI) for the simultaneous kinetic characterization of 768 biomolecular interactions. We applied k-MITOMI to the kinetic analysis of transcription factor (TF)—DNA interactions, measuring the detailed kinetic landscapes of the mouse TF Zif268, and the yeast TFs Tye7p, Yox1p, and Tbf1p. We demonstrated the integrated nature of k-MITOMI by expressing, purifying, and characterizing 27 additional yeast transcription factors in parallel on a single device. Overall, we obtained 2,388 association and dissociation curves of 223 unique molecular interactions with equilibrium dissociation constants ranging from 2 × 10-6 M to 2 × 10-9 M, and dissociation rate constants of approximately 6 s-1 to 8.5 × 10-3 s-1. Association rate constants were uniform across 3 TF families, ranging from 3.7 × 106 M-1 s-1 to 9.6 × 107 M-1 s-1, and are well below the diffusion limit. We expect that k-MITOMI will contribute to our quantitative understanding of biological systems and accelerate the development and characterization of engineered systems.}, language = {en}, number = {41}, urldate = {2016-01-21}, journal = {Proceedings of the National Academy of Sciences}, author = {Geertz, Marcel and Shore, David and Maerkl, Sebastian J.}, month = oct, year = {2012}, pmid = {23012409}, keywords = {biochemistry, systems biology, biophysics}, pages = {16540--16545}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4MAQWT2T/Geertz et al. - 2012 - Massively parallel measurements of molecular inter.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/8PQQMFX4/16540.html:text/html} } @article{maerkl_systems_2007, title = {A {Systems} {Approach} to {Measuring} the {Binding} {Energy} {Landscapes} of {Transcription} {Factors}}, volume = {315}, issn = {0036-8075, 1095-9203}, url = {http://classic.sciencemag.org/content/315/5809/233}, doi = {10.1126/science.1131007}, abstract = {A major goal of systems biology is to predict the function of biological networks. Although network topologies have been successfully determined in many cases, the quantitative parameters governing these networks generally have not. Measuring affinities of molecular interactions in high-throughput format remains problematic, especially for transient and low-affinity interactions. We describe a high-throughput microfluidic platform that measures such properties on the basis of mechanical trapping of molecular interactions. With this platform we characterized DNA binding energy landscapes for four eukaryotic transcription factors; these landscapes were used to test basic assumptions about transcription factor binding and to predict their in vivo function.}, language = {en}, number = {5809}, urldate = {2016-01-21}, journal = {Science}, author = {Maerkl, Sebastian J. and Quake, Stephen R.}, month = jan, year = {2007}, pmid = {17218526}, pages = {233--237}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RZ935GZR/Maerkl et Quake - 2007 - A Systems Approach to Measuring the Binding Energy.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XNNSJWSC/233.html:text/html} } @article{nelson_microfluidic_2013, title = {Microfluidic affinity and {ChIP}-seq analyses converge on a conserved {FOXP}2-binding motif in chimp and human, which enables the detection of evolutionarily novel targets}, volume = {41}, issn = {0305-1048, 1362-4962}, url = {http://nar.oxfordjournals.org/content/41/12/5991}, doi = {10.1093/nar/gkt259}, abstract = {The transcription factor forkhead box P2 (FOXP2) is believed to be important in the evolution of human speech. A mutation in its DNA-binding domain causes severe speech impairment. Humans have acquired two coding changes relative to the conserved mammalian sequence. Despite intense interest in FOXP2, it has remained an open question whether the human protein’s DNA-binding specificity and chromatin localization are conserved. Previous in vitro and ChIP-chip studies have provided conflicting consensus sequences for the FOXP2-binding site. Using MITOMI 2.0 microfluidic affinity assays, we describe the binding site of FOXP2 and its affinity profile in base-specific detail for all substitutions of the strongest binding site. We find that human and chimp FOXP2 have similar binding sites that are distinct from previously suggested consensus binding sites. Additionally, through analysis of FOXP2 ChIP-seq data from cultured neurons, we find strong overrepresentation of a motif that matches our in vitro results and identifies a set of genes with FOXP2 binding sites. The FOXP2-binding sites tend to be conserved, yet we identified 38 instances of evolutionarily novel sites in humans. Combined, these data present a comprehensive portrait of FOXP2’s-binding properties and imply that although its sequence specificity has been conserved, some of its genomic binding sites are newly evolved.}, language = {en}, number = {12}, urldate = {2016-01-21}, journal = {Nucleic Acids Research}, author = {Nelson, Christopher S. and Fuller, Chris K. and Fordyce, Polly M. and Greninger, Alexander L. and Li, Hao and DeRisi, Joseph L.}, month = jul, year = {2013}, pmid = {23625967}, pages = {5991--6004}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/WF8QCD8N/Nelson et al. - 2013 - Microfluidic affinity and ChIP-seq analyses conver.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7KS9WRW9/5991.html:text/html} } @article{siepel_evolutionarily_2005, title = {Evolutionarily conserved elements in vertebrate, insect, worm, and yeast genomes}, volume = {15}, issn = {1088-9051, 1549-5469}, url = {http://genome.cshlp.org/content/15/8/1034}, doi = {10.1101/gr.3715005}, abstract = {We have conducted a comprehensive search for conserved elements in vertebrate genomes, using genome-wide multiple alignments of five vertebrate species (human, mouse, rat, chicken, and Fugu rubripes). Parallel searches have been performed with multiple alignments of four insect species (three species of Drosophila and Anopheles gambiae), two species of Caenorhabditis, and seven species of Saccharomyces. Conserved elements were identified with a computer program called phastCons, which is based on a two-state phylogenetic hidden Markov model (phylo-HMM). PhastCons works by fitting a phylo-HMM to the data by maximum likelihood, subject to constraints designed to calibrate the model across species groups, and then predicting conserved elements based on this model. The predicted elements cover roughly 3\%–8\% of the human genome (depending on the details of the calibration procedure) and substantially higher fractions of the more compact Drosophila melanogaster (37\%–53\%), Caenorhabditis elegans (18\%–37\%), and Saccharaomyces cerevisiae (47\%–68\%) genomes. From yeasts to vertebrates, in order of increasing genome size and general biological complexity, increasing fractions of conserved bases are found to lie outside of the exons of known protein-coding genes. In all groups, the most highly conserved elements (HCEs), by log-odds score, are hundreds or thousands of bases long. These elements share certain properties with ultraconserved elements, but they tend to be longer and less perfectly conserved, and they overlap genes of somewhat different functional categories. In vertebrates, HCEs are associated with the 3′ UTRs of regulatory genes, stable gene deserts, and megabase-sized regions rich in moderately conserved noncoding sequences. Noncoding HCEs also show strong statistical evidence of an enrichment for RNA secondary structure.}, language = {en}, number = {8}, urldate = {2016-01-25}, journal = {Genome Research}, author = {Siepel, Adam and Bejerano, Gill and Pedersen, Jakob S. and Hinrichs, Angie S. and Hou, Minmei and Rosenbloom, Kate and Clawson, Hiram and Spieth, John and Hillier, LaDeana W. and Richards, Stephen and Weinstock, George M. and Wilson, Richard K. and Gibbs, Richard A. and Kent, W. James and Miller, Webb and Haussler, David}, month = aug, year = {2005}, pmid = {16024819}, pages = {1034--1050}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/BJEIIK34/Siepel et al. - 2005 - Evolutionarily conserved elements in vertebrate, i.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/E6DW4AJD/1034.html:text/html} } -@article{kaplan_dna-encoded_2009, - title = {The {DNA}-encoded nucleosome organization of a eukaryotic genome}, - volume = {458}, - copyright = {© 2008 Nature Publishing Group}, - issn = {0028-0836}, - url = {http://www.nature.com/nature/journal/v458/n7236/full/nature07667.html}, - doi = {10.1038/nature07667}, - abstract = {Nucleosome organization is critical for gene regulation. In living cells this organization is determined by multiple factors, including the action of chromatin remodellers, competition with site-specific DNA-binding proteins, and the DNA sequence preferences of the nucleosomes themselves. However, it has been difficult to estimate the relative importance of each of these mechanisms in vivo, because in vivo nucleosome maps reflect the combined action of all influencing factors. Here we determine the importance of nucleosome DNA sequence preferences experimentally by measuring the genome-wide occupancy of nucleosomes assembled on purified yeast genomic DNA. The resulting map, in which nucleosome occupancy is governed only by the intrinsic sequence preferences of nucleosomes, is similar to in vivo nucleosome maps generated in three different growth conditions. In vitro, nucleosome depletion is evident at many transcription factor binding sites and around gene start and end sites, indicating that nucleosome depletion at these sites in vivo is partly encoded in the genome. We confirm these results with a micrococcal nuclease-independent experiment that measures the relative affinity of nucleosomes for {\textasciitilde}40,000 double-stranded 150-base-pair oligonucleotides. Using our in vitro data, we devise a computational model of nucleosome sequence preferences that is significantly correlated with in vivo nucleosome occupancy in Caenorhabditis elegans. Our results indicate that the intrinsic DNA sequence preferences of nucleosomes have a central role in determining the organization of nucleosomes in vivo.}, - language = {en}, - number = {7236}, - urldate = {2016-01-27}, - journal = {Nature}, - author = {Kaplan, Noam and Moore, Irene K. and Fondufe-Mittendorf, Yvonne and Gossett, Andrea J. and Tillo, Desiree and Field, Yair and LeProust, Emily M. and Hughes, Timothy R. and Lieb, Jason D. and Widom, Jonathan and Segal, Eran}, - month = mar, - year = {2009}, - pages = {362--366}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GNQVEI22/Kaplan et al. - 2009 - The DNA-encoded nucleosome organization of a eukar.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6RWTW6VP/nature07667.html:text/html} -} - @article{henikoff_epigenome_2011, title = {Epigenome characterization at single base-pair resolution}, volume = {108}, issn = {0027-8424, 1091-6490}, url = {http://www.pnas.org/content/108/45/18318}, doi = {10.1073/pnas.1110731108}, abstract = {We have combined standard micrococcal nuclease (MNase) digestion of nuclei with a modified protocol for constructing paired-end DNA sequencing libraries to map both nucleosomes and subnucleosome-sized particles at single base-pair resolution throughout the budding yeast genome. We found that partially unwrapped nucleosomes and subnucleosome-sized particles can occupy the same position within a cell population, suggesting dynamic behavior. By varying the time of MNase digestion, we have been able to observe changes that reflect differential sensitivity of particles, including the eviction of nucleosomes. To characterize DNA-binding features of transcription factors, we plotted the length of each fragment versus its position in the genome, which defined the minimal protected region of each factor. This process led to the precise mapping of protected and exposed regions at and around binding sites, and also determination of the degree to which they are flanked by phased nucleosomes and subnucleosome-sized particles. Our protocol and mapping method provide a general strategy for epigenome characterization, including nucleosome phasing and dynamics, ATP-dependent nucleosome remodelers, and transcription factors, from a single-sequenced sample.}, language = {en}, number = {45}, urldate = {2016-01-27}, journal = {Proceedings of the National Academy of Sciences}, author = {Henikoff, Jorja G. and Belsky, Jason A. and Krassovsky, Kristina and MacAlpine, David M. and Henikoff, Steven}, month = nov, year = {2011}, pmid = {22025700}, keywords = {Saccharomyces cerevisiae, V-plot, transcription factor binding sites}, pages = {18318--18323}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/MU77SWCN/Henikoff et al. - 2011 - Epigenome characterization at single base-pair res.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/FZPMDDMR/18318.html:text/html} } @article{dingwall_high_1981, title = {High sequence specificity of micrococcal nuclease}, volume = {9}, issn = {0305-1048, 1362-4962}, url = {http://nar.oxfordjournals.org/content/9/12/2659}, doi = {10.1093/nar/9.12.2659}, abstract = {The substrate specificity of micrococcal nuclease (EC 3.1.4.7) has been studied. The enzyme recognises features of nucleotide composition, nucleotide sequence and tertiary structure of DNA. Kinetic analysis indicates that the rate of cleavage is 30 times greater at the 5′ side of A or T than at G or C. Digestion of end-labelled linear DNA molecules of known sequence revealed that only a limited number of sites are cut, generating a highly specific pattern of fragments. The frequency of cleavage at each site has been determined and it may reflect the poor base overlap in the 5′ T-A 3′ stack as well as the length of contiguous A and T residues. The same sequence preferences are found when DNA is assembled into nucleosomes. Deoxyribonuclease 1 (EC 3.1.4.5.) recognises many of the same sequence features. Micrococcal nuclease also mimics nuclease S1 selectively cleaving an inverted repeat in supercoiled pBR322. The value of micrococcal nuclease as a “non-specific” enzymatic probe for studying nucleosome phasing is questioned.}, language = {en}, number = {12}, urldate = {2016-01-27}, journal = {Nucleic Acids Research}, author = {Dingwall, Colin and Lomonossoff, George P. and Laskey, Ronald A.}, month = jun, year = {1981}, pmid = {6269057}, pages = {2659--2674}, file = {Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ZP7H67F3/2659.html:text/html} } @article{jiang_nucleosome_2009, title = {Nucleosome positioning and gene regulation: advances through genomics}, volume = {10}, copyright = {© 2009 Nature Publishing Group}, issn = {1471-0056}, shorttitle = {Nucleosome positioning and gene regulation}, url = {http://www.nature.com/nrg/journal/v10/n3/full/nrg2522.html}, doi = {10.1038/nrg2522}, abstract = {Knowing the precise locations of nucleosomes in a genome is key to understanding how genes are regulated. Recent 'next generation' ChIP–chip and ChIP–Seq technologies have accelerated our understanding of the basic principles of chromatin organization. Here we discuss what high-resolution genome-wide maps of nucleosome positions have taught us about how nucleosome positioning demarcates promoter regions and transcriptional start sites, and how the composition and structure of promoter nucleosomes facilitate or inhibit transcription. A detailed picture is starting to emerge of how diverse factors, including underlying DNA sequences and chromatin remodelling complexes, influence nucleosome positioning.}, language = {en}, number = {3}, urldate = {2016-01-28}, journal = {Nature Reviews Genetics}, author = {Jiang, Cizhong and Pugh, B. Franklin}, month = mar, year = {2009}, pages = {161--172}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/G8FIE4U4/Jiang et Pugh - 2009 - Nucleosome positioning and gene regulation advanc.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/FGDCABJF/nrg2522.html:text/html} } @article{horz_sequence_1981, title = {Sequence specific cleavage of {DNA} by micrococcal nuclease}, volume = {9}, issn = {0305-1048, 1362-4962}, url = {http://nar.oxfordjournals.org/content/9/12/2643}, doi = {10.1093/nar/9.12.2643}, abstract = {Micrococcal nuclease is shown to cleave DNA under conditions of partial digestion in a specific manner. Sequences of the type 5′CATA and 5′CTA are attacked preferentially, followed by exonucleoTytic degradation at the newly generated DNA termini. GC-rich flanking sequences further increase the probability of initial attack. Unexpectedly, long stretches containing only A and T are spared by the nuclease. These results, which were obtained with mouse satellite DNA and two fragments from the plasmid pBR322, do not support the previous contention that it is the regions of high AT-content which are initially cleaved by micrococcal nuclease. This specificity of micrococcal nuclease complicates its use in experiments intended to monitor the nucleoprotein structure of a DNA sequence in chromatin.}, language = {en}, number = {12}, urldate = {2016-01-27}, journal = {Nucleic Acids Research}, author = {Hörz, Wolfram and Altenburger, Werner}, month = jun, year = {1981}, pmid = {7279658}, pages = {2643--2658}, file = {Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/MBQQBQZW/2643.html:text/html} } @article{kaplan_contribution_2010, title = {Contribution of histone sequence preferences to nucleosome organization: proposed definitions and methodology}, volume = {11}, copyright = {2010 BioMed Central Ltd}, issn = {1465-6906}, shorttitle = {Contribution of histone sequence preferences to nucleosome organization}, url = {http://genomebiology.com/2010/11/11/140/abstract}, doi = {10.1186/gb-2010-11-11-140}, abstract = {We propose definitions and procedures for comparing nucleosome maps and discuss current agreement and disagreement on the effect of histone sequence preferences on nucleosome organization in vivo.}, language = {en}, number = {11}, urldate = {2016-01-27}, journal = {Genome Biology}, author = {Kaplan, Noam and Hughes, Timothy R. and Lieb, Jason D. and Widom, Jonathan and Segal, Eran}, month = nov, year = {2010}, pmid = {21118582}, pages = {140}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/8QTUCP9V/Kaplan et al. - 2010 - Contribution of histone sequence preferences to nu.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/37AT8SVN/140.html:text/html} } @article{sung_dnase_2014, title = {{DNase} {Footprint} {Signatures} {Are} {Dictated} by {Factor} {Dynamics} and {DNA} {Sequence}}, volume = {56}, issn = {1097-2765}, url = {http://www.cell.com/article/S1097276514006716/abstract}, doi = {10.1016/j.molcel.2014.08.016}, abstract = {Genomic footprinting has emerged as an unbiased discovery method for transcription factor (TF) occupancy at cognate DNA in vivo. A basic premise of footprinting is that sequence-specific TF-DNA interactions are associated with localized resistance to nucleases, leaving observable signatures of cleavage within accessible chromatin. This phenomenon is interpreted to imply protection of the critical nucleotides by the stably bound protein factor. However, this model conflicts with previous reports of many TFs exchanging with specific binding sites in living cells on a timescale of seconds. We show that TFs with short DNA residence times have no footprints at bound motif elements. Moreover, the nuclease cleavage profile within a footprint originates from the DNA sequence in the factor-binding site, rather than from the protein occupying specific nucleotides. These findings suggest a revised understanding of TF footprinting and reveal limitations in comprehensive reconstruction of the TF regulatory network using this approach.}, language = {English}, number = {2}, urldate = {2016-01-27}, journal = {Molecular Cell}, author = {Sung, Myong-Hee and Guertin, Michael J. and Baek, Songjoon and Hager, Gordon L.}, month = oct, year = {2014}, pmid = {25242143}, pages = {275--285}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XHCZQETM/Sung et al. - 2014 - DNase Footprint Signatures Are Dictated by Factor .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/W2QU5DXX/S1097-2765(14)00671-6.html:text/html} } @article{chen_improved_2014, title = {Improved nucleosome-positioning algorithm {iNPS} for accurate nucleosome positioning from sequencing data}, volume = {5}, copyright = {© 2014 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, url = {http://www.nature.com/ncomms/2014/140918/ncomms5909/full/ncomms5909.html}, doi = {10.1038/ncomms5909}, abstract = {Accurate determination of genome-wide nucleosome positioning can provide important insights into global gene regulation. Here, we describe the development of an improved nucleosome-positioning algorithm—iNPS—which achieves significantly better performance than the widely used NPS package. By determining nucleosome boundaries more precisely and merging or separating shoulder peaks based on local ​MNase-seq signals, iNPS can unambiguously detect 60\% more nucleosomes. The detected nucleosomes display better nucleosome ‘widths’ and neighbouring centre–centre distance distributions, giving rise to sharper patterns and better phasing of average nucleosome profiles and higher consistency between independent data subsets. In addition to its unique advantage in classifying nucleosomes by shape to reveal their different biological properties, iNPS also achieves higher significance and lower false positive rates than previously published methods. The application of iNPS to T-cell activation data demonstrates a greater ability to facilitate detection of nucleosome repositioning, uncovering additional biological features underlying the activation process.}, language = {en}, urldate = {2016-01-27}, journal = {Nature Communications}, author = {Chen, Weizhong and Liu, Yi and Zhu, Shanshan and Green, Christopher D. and Wei, Gang and Han, Jing-Dong Jackie}, month = sep, year = {2014}, keywords = {Biological sciences, bioinformatics}, pages = {4909}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ICZIKCZR/Chen et al. - 2014 - Improved nucleosome-positioning algorithm iNPS for.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/AAARM58C/ncomms5909.html:text/html} } -@article{soufi_pioneer_2015-1, - title = {Pioneer {Transcription} {Factors} {Target} {Partial} {DNA} {Motifs} on {Nucleosomes} to {Initiate} {Reprogramming}}, - volume = {161}, - issn = {0092-8674}, - url = {http://www.cell.com/article/S0092867415003049/abstract}, - doi = {10.1016/j.cell.2015.03.017}, - abstract = {Pioneer transcription factors (TFs) access silent chromatin and initiate cell-fate changes, using diverse types of DNA binding domains (DBDs). FoxA, the paradigm pioneer TF, has a winged helix DBD that resembles linker histone and thereby binds its target sites on nucleosomes and in compacted chromatin. Herein, we compare the nucleosome and chromatin targeting activities of Oct4 (POU DBD), Sox2 (HMG box DBD), Klf4 (zinc finger DBD), and c-Myc (bHLH DBD), which together reprogram somatic cells to pluripotency. Purified Oct4, Sox2, and Klf4 proteins can bind nucleosomes in vitro, and in vivo they preferentially target silent sites enriched for nucleosomes. Pioneer activity relates simply to the ability of a given DBD to target partial motifs displayed on the nucleosome surface. Such partial motif recognition can occur by coordinate binding between factors. Our findings provide insight into how pioneer factors can target naive chromatin sites.}, - language = {English}, - number = {3}, - urldate = {2016-01-27}, - journal = {Cell}, - author = {Soufi, Abdenour and Garcia, Meilin Fernandez and Jaroszewicz, Artur and Osman, Nebiyu and Pellegrini, Matteo and Zaret, Kenneth S.}, - month = apr, - year = {2015}, - pmid = {25892221}, - pages = {555--568}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/K55QZZPQ/Soufi et al. - 2015 - Pioneer Transcription Factors Target Partial DNA M.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/IKRCCW23/S0092-8674(15)00304-9.html:text/html} -} - @article{weirauch_determination_2014, title = {Determination and {Inference} of {Eukaryotic} {Transcription} {Factor} {Sequence} {Specificity}}, volume = {158}, issn = {0092-8674}, url = {http://www.sciencedirect.com/science/article/pii/S0092867414010368}, doi = {10.1016/j.cell.2014.08.009}, abstract = {Summary Transcription factor (TF) DNA sequence preferences direct their regulatory activity, but are currently known for only ∼1\% of eukaryotic TFs. Broadly sampling DNA-binding domain (DBD) types from multiple eukaryotic clades, we determined DNA sequence preferences for \>1,000 TFs encompassing 54 different DBD classes from 131 diverse eukaryotes. We find that closely related DBDs almost always have very similar DNA sequence preferences, enabling inference of motifs for ∼34\% of the ∼170,000 known or predicted eukaryotic TFs. Sequences matching both measured and inferred motifs are enriched in chromatin immunoprecipitation sequencing (ChIP-seq) peaks and upstream of transcription start sites in diverse eukaryotic lineages. SNPs defining expression quantitative trait loci in Arabidopsis promoters are also enriched for predicted TF binding sites. Importantly, our motif “library” can be used to identify specific TFs whose binding may be altered by human disease risk alleles. These data present a powerful resource for mapping transcriptional networks across eukaryotes.}, number = {6}, urldate = {2016-01-27}, journal = {Cell}, author = {Weirauch, Matthew T. and Yang, Ally and Albu, Mihai and Cote, Atina G. and Montenegro-Montero, Alejandro and Drewe, Philipp and Najafabadi, Hamed S. and Lambert, Samuel A. and Mann, Ishminder and Cook, Kate and Zheng, Hong and Goity, Alejandra and van Bakel, Harm and Lozano, Jean-Claude and Galli, Mary and Lewsey, Mathew G. and Huang, Eryong and Mukherjee, Tuhin and Chen, Xiaoting and Reece-Hoyes, John S. and Govindarajan, Sridhar and Shaulsky, Gad and Walhout, Albertha J. M. and Bouget, François-Yves and Ratsch, Gunnar and Larrondo, Luis F. and Ecker, Joseph R. and Hughes, Timothy R.}, month = sep, year = {2014}, pages = {1431--1443}, file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/5XR4BSK6/Weirauch et al. - 2014 - Determination and Inference of Eukaryotic Transcri.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/B6FAA9XX/S0092867414010368.html:text/html} } @article{nechanitzky_transcription_2013, title = {Transcription factor {EBF}1 is essential for the maintenance of {B} cell identity and prevention of alternative fates in committed cells}, volume = {14}, copyright = {© 2013 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {1529-2908}, url = {http://www.nature.com/ni/journal/v14/n8/full/ni.2641.html}, doi = {10.1038/ni.2641}, abstract = {The transcription factors EBF1 and Pax5 have been linked to activation of the B cell lineage program and irreversible loss of alternative lineage potential (commitment), respectively. Here we conditionally deleted Ebf1 in committed pro-B cells after transfer into alymphoid mice. We found that those cells converted into innate lymphoid cells (ILCs) and T cells with variable-diversity-joining (VDJ) rearrangements of loci encoding both B cell and T cell antigen receptors. As intermediates in lineage conversion, Ebf1-deficient CD19+ cells expressing Pax5 and transcriptional regulators of the ILC and T cell fates were detectable. In particular, genes encoding the transcription factors Id2 and TCF-1 were bound and repressed by EBF1. Thus, both EBF1 and Pax5 are required for B lineage commitment by repressing distinct and common determinants of alternative cell fates.}, language = {en}, number = {8}, urldate = {2016-01-27}, journal = {Nature Immunology}, author = {Nechanitzky, Robert and Akbas, Duygu and Scherer, Stefanie and Györy, Ildiko and Hoyler, Thomas and Ramamoorthy, Senthilkumar and Diefenbach, Andreas and Grosschedl, Rudolf}, month = aug, year = {2013}, keywords = {Lymphocytes}, pages = {867--875}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/PPDTTR8G/Nechanitzky et al. - 2013 - Transcription factor EBF1 is essential for the mai.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4IZAZJ4U/ni.2641.html:text/html} } @article{sherwood_discovery_2014, title = {Discovery of directional and nondirectional pioneer transcription factors by modeling {DNase} profile magnitude and shape}, volume = {32}, copyright = {© 2013 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {1087-0156}, url = {http://www.nature.com/nbt/journal/v32/n2/full/nbt.2798.html}, doi = {10.1038/nbt.2798}, abstract = {We describe protein interaction quantitation (PIQ), a computational method for modeling the magnitude and shape of genome-wide DNase I hypersensitivity profiles to identify transcription factor (TF) binding sites. Through the use of machine-learning techniques, PIQ identified binding sites for {\textgreater}700 TFs from one DNase I hypersensitivity analysis followed by sequencing (DNase-seq) experiment with accuracy comparable to that of chromatin immunoprecipitation followed by sequencing (ChIP-seq). We applied PIQ to analyze DNase-seq data from mouse embryonic stem cells differentiating into prepancreatic and intestinal endoderm. We identified 120 and experimentally validated eight 'pioneer' TF families that dynamically open chromatin. Four pioneer TF families only opened chromatin in one direction from their motifs. Furthermore, we identified 'settler' TFs whose genomic binding is principally governed by proximity to open chromatin. Our results support a model of hierarchical TF binding in which directional and nondirectional pioneer activity shapes the chromatin landscape for population by settler TFs.}, language = {en}, number = {2}, urldate = {2016-02-03}, journal = {Nature Biotechnology}, author = {Sherwood, Richard I. and Hashimoto, Tatsunori and O'Donnell, Charles W. and Lewis, Sophia and Barkal, Amira A. and van Hoff, John Peter and Karun, Vivek and Jaakkola, Tommi and Gifford, David K.}, month = feb, year = {2014}, keywords = {Embryonic stem cells, Genome informatics, Machine learning, Regulatory networks}, pages = {171--178}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/85GIH6AN/Sherwood et al. - 2014 - Discovery of directional and nondirectional pionee.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/B9U6VK4P/nbt.2798.html:text/html} } -@article{kaplan_dna-encoded_2009-1, +@article{kaplan_dna-encoded_2009, title = {The {DNA}-encoded nucleosome organization of a eukaryotic genome}, volume = {458}, copyright = {© 2008 Nature Publishing Group}, issn = {0028-0836}, url = {http://www.nature.com/nature/journal/v458/n7236/full/nature07667.html}, doi = {10.1038/nature07667}, abstract = {Nucleosome organization is critical for gene regulation. In living cells this organization is determined by multiple factors, including the action of chromatin remodellers, competition with site-specific DNA-binding proteins, and the DNA sequence preferences of the nucleosomes themselves. However, it has been difficult to estimate the relative importance of each of these mechanisms in vivo, because in vivo nucleosome maps reflect the combined action of all influencing factors. Here we determine the importance of nucleosome DNA sequence preferences experimentally by measuring the genome-wide occupancy of nucleosomes assembled on purified yeast genomic DNA. The resulting map, in which nucleosome occupancy is governed only by the intrinsic sequence preferences of nucleosomes, is similar to in vivo nucleosome maps generated in three different growth conditions. In vitro, nucleosome depletion is evident at many transcription factor binding sites and around gene start and end sites, indicating that nucleosome depletion at these sites in vivo is partly encoded in the genome. We confirm these results with a micrococcal nuclease-independent experiment that measures the relative affinity of nucleosomes for {\textasciitilde}40,000 double-stranded 150-base-pair oligonucleotides. Using our in vitro data, we devise a computational model of nucleosome sequence preferences that is significantly correlated with in vivo nucleosome occupancy in Caenorhabditis elegans. Our results indicate that the intrinsic DNA sequence preferences of nucleosomes have a central role in determining the organization of nucleosomes in vivo.}, language = {en}, number = {7236}, urldate = {2016-02-23}, journal = {Nature}, author = {Kaplan, Noam and Moore, Irene K. and Fondufe-Mittendorf, Yvonne and Gossett, Andrea J. and Tillo, Desiree and Field, Yair and LeProust, Emily M. and Hughes, Timothy R. and Lieb, Jason D. and Widom, Jonathan and Segal, Eran}, month = mar, year = {2009}, pages = {362--366}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4KX9KHHJ/Kaplan et al. - 2009 - The DNA-encoded nucleosome organization of a eukar.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XI3XE3IK/nature07667.html:text/html} } @article{jolma_dna-binding_2013, title = {{DNA}-{Binding} {Specificities} of {Human} {Transcription} {Factors}}, volume = {152}, issn = {0092-8674}, url = {http://www.sciencedirect.com/science/article/pii/S0092867412014961}, doi = {10.1016/j.cell.2012.12.009}, abstract = {Summary Although the proteins that read the gene regulatory code, transcription factors (TFs), have been largely identified, it is not well known which sequences TFs can recognize. We have analyzed the sequence-specific binding of human TFs using high-throughput SELEX and ChIP sequencing. A total of 830 binding profiles were obtained, describing 239 distinctly different binding specificities. The models represent the majority of human TFs, approximately doubling the coverage compared to existing systematic studies. Our results reveal additional specificity determinants for a large number of factors for which a partial specificity was known, including a commonly observed A- or T-rich stretch that flanks the core motifs. Global analysis of the data revealed that homodimer orientation and spacing preferences, and base-stacking interactions, have a larger role in TF-DNA binding than previously appreciated. We further describe a binding model incorporating these features that is required to understand binding of TFs to DNA.}, number = {1–2}, urldate = {2016-02-29}, journal = {Cell}, author = {Jolma, Arttu and Yan, Jian and Whitington, Thomas and Toivonen, Jarkko and Nitta, Kazuhiro R. and Rastas, Pasi and Morgunova, Ekaterina and Enge, Martin and Taipale, Mikko and Wei, Gonghong and Palin, Kimmo and Vaquerizas, Juan M. and Vincentelli, Renaud and Luscombe, Nicholas M. and Hughes, Timothy R. and Lemaire, Patrick and Ukkonen, Esko and Kivioja, Teemu and Taipale, Jussi}, month = jan, year = {2013}, pages = {327--339}, file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7EIKAUV2/Jolma et al. - 2013 - DNA-Binding Specificities of Human Transcription F.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ECTCAT9X/S0092867412014961.html:text/html} } @article{duttke_human_2015, title = {Human {Promoters} {Are} {Intrinsically} {Directional}}, volume = {57}, issn = {1097-2765}, url = {http://www.sciencedirect.com/science/article/pii/S1097276514010077}, doi = {10.1016/j.molcel.2014.12.029}, abstract = {Summary Divergent transcription, in which reverse-oriented transcripts occur upstream of eukaryotic promoters in regions devoid of annotated genes, has been suggested to be a general property of active promoters. Here we show that the human basal RNA polymerase II transcriptional machinery and core promoter are inherently unidirectional and that reverse-oriented transcripts originate from their own cognate reverse-directed core promoters. In vitro transcription analysis and mapping of nascent transcripts in HeLa cells revealed that sequences at reverse start sites are similar to those of their forward counterparts. The use of DNase I accessibility to define proximal promoter borders revealed that about half of promoters are unidirectional and that unidirectional promoters are depleted at their upstream edges of reverse core promoter sequences and their associated chromatin features. Divergent transcription is thus not an inherent property of the transcription process but rather the consequence of the presence of both forward- and reverse-directed core promoters.}, number = {4}, urldate = {2016-03-01}, journal = {Molecular Cell}, author = {Duttke, Sascha H. C. and Lacadie, Scott A. and Ibrahim, Mahmoud M. and Glass, Christopher K. and Corcoran, David L. and Benner, Christopher and Heinz, Sven and Kadonaga, James T. and Ohler, Uwe}, month = feb, year = {2015}, pages = {674--684}, file = {ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4FF6Q3EJ/S1097276514010077\$.html:text/html} } @article{badis_library_2008, title = {A {Library} of {Yeast} {Transcription} {Factor} {Motifs} {Reveals} a {Widespread} {Function} for {Rsc}3 in {Targeting} {Nucleosome} {Exclusion} at {Promoters}}, volume = {32}, issn = {1097-2765}, url = {http://www.sciencedirect.com/science/article/pii/S1097276508008423}, doi = {10.1016/j.molcel.2008.11.020}, abstract = {Summary The sequence specificity of DNA-binding proteins is the primary mechanism by which the cell recognizes genomic features. Here, we describe systematic determination of yeast transcription factor DNA-binding specificities. We obtained binding specificities for 112 DNA-binding proteins representing 19 distinct structural classes. One-third of the binding specificities have not been previously reported. Several binding sequences have striking genomic distributions relative to transcription start sites, supporting their biological relevance and suggesting a role in promoter architecture. Among these are Rsc3 binding sequences, containing the core CGCG, which are found preferentially ∼100 bp upstream of transcription start sites. Mutation of RSC3 results in a dramatic increase in nucleosome occupancy in hundreds of proximal promoters containing a Rsc3 binding element, but has little impact on promoters lacking Rsc3 binding sequences, indicating that Rsc3 plays a broad role in targeting nucleosome exclusion at yeast promoters.}, number = {6}, urldate = {2016-08-09}, journal = {Molecular Cell}, author = {Badis, Gwenael and Chan, Esther T. and van Bakel, Harm and Pena-Castillo, Lourdes and Tillo, Desiree and Tsui, Kyle and Carlson, Clayton D. and Gossett, Andrea J. and Hasinoff, Michael J. and Warren, Christopher L. and Gebbia, Marinella and Talukder, Shaheynoor and Yang, Ally and Mnaimneh, Sanie and Terterov, Dimitri and Coburn, David and Li Yeo, Ai and Yeo, Zhen Xuan and Clarke, Neil D. and Lieb, Jason D. and Ansari, Aseem Z. and Nislow, Corey and Hughes, Timothy R.}, month = dec, year = {2008}, keywords = {DNA, PROTEINS}, pages = {878--887}, file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/3827EM9J/Badis et al. - 2008 - A Library of Yeast Transcription Factor Motifs Rev.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/8UHEJ37M/S1097276508008423.html:text/html} } @incollection{jolma_methods_2011, series = {Subcellular {Biochemistry}}, title = {Methods for {Analysis} of {Transcription} {Factor} {DNA}-{Binding} {Specificity} {In} {Vitro}}, copyright = {©2011 Springer Science+Business Media B.V.}, isbn = {978-90-481-9068-3 978-90-481-9069-0}, url = {http://link.springer.com/chapter/10.1007/978-90-481-9069-0_7}, abstract = {Transcription of genes during development and in response to environmental stimuli is determined by genomic DNA sequence. The DNA sequences regulating transcription are read by sequence-specific transcription factors (TFs) that recognize relatively short sequences, generally between four and twenty base pairs in length. Transcriptional regulation generally requires binding of multiple TFs in close proximity to each other. Mechanistic understanding of transcription in an organism thus requires detailed knowledge of binding affinities of all its TFs to all possible DNA sequences, and the co–operative interactions between the TFs. However, very little is known about such co-operative binding interactions, and even the simple TF-DNA binding information exists only for a very small proportion of all TFs – for example, mammals have approximately 1,300–2,000 TFs [1, 2], yet the largest public databases for TF binding specificity, Jaspar and Uniprobe [3, 4] currently list only approximately 500 moderate to high resolution profiles for human or mouse. This lack of knowledge is in part due to the fact that analysis of TF DNA binding has been laborious and expensive. In this chapter, we review methods that can be used to determine binding specificity of TFs to DNA, mainly focusing on recently developed assays that allow high-resolution analysis of TF binding specificity in relatively high throughput.}, language = {en}, number = {52}, urldate = {2016-03-09}, booktitle = {A {Handbook} of {Transcription} {Factors}}, publisher = {Springer Netherlands}, author = {Jolma, Arttu and Taipale, Jussi}, editor = {Hughes, Timothy R.}, year = {2011}, doi = {10.1007/978-90-481-9069-0_7}, keywords = {SELEX, Biomedicine general, Biochemistry, general, Nucleic Acid Chemistry, Cell Biology, Protein–DNA interactions, Co-operative binding, Affinity, Protein binding microarrays}, pages = {155--173}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/N3SWG4KM/Jolma et Taipale - 2011 - Methods for Analysis of Transcription Factor DNA-B.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/K2P3P7G7/10.html:text/html} } @article{stormo_specificity_1998, title = {Specificity, free energy and information content in protein–{DNA} interactions}, volume = {23}, issn = {0968-0004}, url = {http://www.sciencedirect.com/science/article/pii/S0968000498011876}, doi = {10.1016/S0968-0004(98)01187-6}, abstract = {Site-specific DNA–protein interactions can be studied using experimental and computational methods. Experimental approaches typically analyze a protein–DNA interaction by measuring the free energy of binding under a variety of conditions. Computational methods focus on alignments of known binding sites for a protein, and, from these alignments, make estimates of the binding energy. Understanding the relationship between these two perspectives, and finding ways to improve both, is a major challenge of modern molecular biology.}, number = {3}, urldate = {2016-03-11}, journal = {Trends in Biochemical Sciences}, author = {Stormo, Gary D. and Fields, Dana S.}, month = mar, year = {1998}, keywords = {protein-DNA interaction, free energy of binding, equilibrium binding constant}, pages = {109--113}, file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HF85TI4K/Stormo et Fields - 1998 - Specificity, free energy and information content i.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/E84QCIUM/S0968000498011876.html:text/html} } @article{zhang_canonical_2014, title = {Canonical nucleosome organization at promoters forms during genome activation}, volume = {24}, issn = {1088-9051, 1549-5469}, url = {http://genome.cshlp.org/content/24/2/260}, doi = {10.1101/gr.157750.113}, abstract = {The organization of nucleosomes influences transcriptional activity by controlling accessibility of DNA binding proteins to the genome. Genome-wide nucleosome binding profiles have identified a canonical nucleosome organization at gene promoters, where arrays of well-positioned nucleosomes emanate from nucleosome-depleted regions. The mechanisms of formation and the function of canonical promoter nucleosome organization remain unclear. Here we analyze the genome-wide location of nucleosomes during zebrafish embryogenesis and show that well-positioned nucleosome arrays appear on thousands of promoters during the activation of the zygotic genome. The formation of canonical promoter nucleosome organization is independent of DNA sequence preference, transcriptional elongation, and robust RNA polymerase II (Pol II) binding. Instead, canonical promoter nucleosome organization correlates with the presence of histone H3 lysine 4 trimethylation (H3K4me3) and affects future transcriptional activation. These findings reveal that genome activation is central to the organization of nucleosome arrays during early embryogenesis.}, language = {en}, number = {2}, urldate = {2016-03-16}, journal = {Genome Research}, author = {Zhang, Yong and Vastenhouw, Nadine L. and Feng, Jianxing and Fu, Kai and Wang, Chenfei and Ge, Ying and Pauli, Andrea and Hummelen, Paul van and Schier, Alexander F. and Liu, X. Shirley}, month = feb, year = {2014}, pmid = {24285721}, pages = {260--266}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/WM4I4Q4W/Zhang et al. - 2014 - Canonical nucleosome organization at promoters for.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/BPB52I5C/260.html:text/html} } @article{siebert_bayesian_2016, title = {Bayesian {Markov} models consistently outperform {PWMs} at predicting motifs in nucleotide sequences}, issn = {0305-1048, 1362-4962}, url = {http://nar.oxfordjournals.org/content/early/2016/06/09/nar.gkw521}, doi = {10.1093/nar/gkw521}, abstract = {Position weight matrices (PWMs) are the standard model for DNA and RNA regulatory motifs. In PWMs nucleotide probabilities are independent of nucleotides at other positions. Models that account for dependencies need many parameters and are prone to overfitting. We have developed a Bayesian approach for motif discovery using Markov models in which conditional probabilities of order k − 1 act as priors for those of order k. This Bayesian Markov model (BaMM) training automatically adapts model complexity to the amount of available data. We also derive an EM algorithm for de-novo discovery of enriched motifs. For transcription factor binding, BaMMs achieve significantly (P = 1/16) higher cross-validated partial AUC than PWMs in 97\% of 446 ChIP-seq ENCODE datasets and improve performance by 36\% on average. BaMMs also learn complex multipartite motifs, improving predictions of transcription start sites, polyadenylation sites, bacterial pause sites, and RNA binding sites by 26–101\%. BaMMs never performed worse than PWMs. These robust improvements argue in favour of generally replacing PWMs by BaMMs.}, language = {en}, urldate = {2016-06-15}, journal = {Nucleic Acids Research}, author = {Siebert, Matthias and Söding, Johannes}, month = jun, year = {2016}, pmid = {27288444}, pages = {gkw521}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/WXRQ4RFI/Siebert et Söding - 2016 - Bayesian Markov models consistently outperform PWM.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/QRW8B45T/nar.gkw521.html:text/html;Supplemental.pdf:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/79AXCN8I/Supplemental.pdf:application/pdf} } @article{gupta_quantifying_2007, title = {Quantifying similarity between motifs}, volume = {8}, issn = {1474-760X}, url = {http://dx.doi.org/10.1186/gb-2007-8-2-r24}, doi = {10.1186/gb-2007-8-2-r24}, abstract = {A common question within the context of de novo motif discovery is whether a newly discovered, putative motif resembles any previously discovered motif in an existing database. To answer this question, we define a statistical measure of motif-motif similarity, and we describe an algorithm, called Tomtom, for searching a database of motifs with a given query motif. Experimental simulations demonstrate the accuracy of Tomtom's E values and its effectiveness in finding similar motifs.}, urldate = {2016-05-17}, journal = {Genome Biology}, author = {Gupta, Shobhit and Stamatoyannopoulos, John A. and Bailey, Timothy L. and Noble, William Stafford}, year = {2007}, pages = {R24}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/8BIHRUEV/Gupta et al. - 2007 - Quantifying similarity between motifs.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/SFIWP7TF/gb-2007-8-2-r24.html:text/html} } @article{alipanahi_predicting_2015, title = {Predicting the sequence specificities of {DNA}- and {RNA}-binding proteins by deep learning}, volume = {33}, copyright = {© 2015 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {1087-0156}, url = {http://www.nature.com/nbt/journal/v33/n8/full/nbt.3300.html}, doi = {10.1038/nbt.3300}, abstract = {Knowing the sequence specificities of DNA- and RNA-binding proteins is essential for developing models of the regulatory processes in biological systems and for identifying causal disease variants. Here we show that sequence specificities can be ascertained from experimental data with 'deep learning' techniques, which offer a scalable, flexible and unified computational approach for pattern discovery. Using a diverse array of experimental data and evaluation metrics, we find that deep learning outperforms other state-of-the-art methods, even when training on in vitro data and testing on in vivo data. We call this approach DeepBind and have built a stand-alone software tool that is fully automatic and handles millions of sequences per experiment. Specificities determined by DeepBind are readily visualized as a weighted ensemble of position weight matrices or as a 'mutation map' that indicates how variations affect binding within a specific sequence.}, language = {en}, number = {8}, urldate = {2016-06-15}, journal = {Nature Biotechnology}, author = {Alipanahi, Babak and Delong, Andrew and Weirauch, Matthew T. and Frey, Brendan J.}, month = aug, year = {2015}, keywords = {Genome informatics, Computational biology and bioinformatics, Gene regulatory networks}, pages = {831--838}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GWV3VGUD/Alipanahi et al. - 2015 - Predicting the sequence specificities of DNA- and .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GDJRXKTR/nbt.3300.html:text/html} } @article{kumar_predicting_2016, title = {Predicting transcription factor site occupancy using {DNA} sequence intrinsic and cell-type specific chromatin features}, volume = {17}, issn = {1471-2105}, url = {http://dx.doi.org/10.1186/s12859-015-0846-z}, doi = {10.1186/s12859-015-0846-z}, abstract = {Understanding the mechanisms by which transcription factors (TF) are recruited to their physiological target sites is crucial for understanding gene regulation. DNA sequence intrinsic features such as predicted binding affinity are often not very effective in predicting in vivo site occupancy and in any case could not explain cell-type specific binding events. Recent reports show that chromatin accessibility, nucleosome occupancy and specific histone post-translational modifications greatly influence TF site occupancy in vivo. In this work, we use machine-learning methods to build predictive models and assess the relative importance of different sequence-intrinsic and chromatin features in the TF-to-target-site recruitment process.}, number = {1}, urldate = {2016-06-15}, journal = {BMC Bioinformatics}, author = {Kumar, Sunil and Bucher, Philipp}, year = {2016}, pages = {41--50}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/M45S496M/Kumar et Bucher - 2016 - Predicting transcription factor site occupancy usi.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/M9Q6XTG4/s12859-015-0846-z.html:text/html} } @article{sharon_feature-based_2008, title = {A {Feature}-{Based} {Approach} to {Modeling} {Protein}–{DNA} {Interactions}}, volume = {4}, issn = {1553-7358}, url = {http://journals.plos.org/ploscompbiol/article?id=10.1371/journal.pcbi.1000154}, doi = {10.1371/journal.pcbi.1000154}, abstract = {Author Summary Transcription factor (TF) protein binding to its DNA target sequences is a fundamental physical interaction underlying gene regulation. Characterizing the binding specificities of TFs is essential for deducing which genes are regulated by which TFs. Recently, several high-throughput methods that measure sequences enriched for TF targets genomewide were developed. Since TFs recognize relatively short sequences, much effort has been directed at developing computational methods that identify enriched subsequences (motifs) from these sequences. However, little effort has been directed towards improving the representation of motifs. Practically, available motif finding software use the position specific scoring matrix (PSSM) model, which assumes independence between different motif positions. We present an alternative, richer model, called the feature motif model (FMM), that enables the representation of a variety of sequence features and captures dependencies that exist between binding site positions. We show how FMMs explain TF binding data better than PSSMs on both synthetic and real data. We also present a motif finder algorithm that learns FMM motifs from unaligned promoter sequences and show how de novo FMMs, learned from binding data of the human TFs c-Myc and CTCF, reveal intriguing insights about their binding specificities.}, number = {8}, urldate = {2016-06-16}, journal = {PLOS Comput Biol}, author = {Sharon, Eilon and Lubliner, Shai and Segal, Eran}, year = {2008}, keywords = {Transcription Factors, Sequence motif analysis, Sequence alignment, Algorithms, Markov models, Network motifs, Probability distribution, DNA-binding proteins}, pages = {e1000154}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/K9B28TX5/Sharon et al. - 2008 - A Feature-Based Approach to Modeling Protein–DNA I.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/H3U7TP6B/article.html:text/html} } @article{tsai_contribution_2015, title = {Contribution of {Sequence} {Motif}, {Chromatin} {State}, and {DNA} {Structure} {Features} to {Predictive} {Models} of {Transcription} {Factor} {Binding} in {Yeast}}, volume = {11}, issn = {1553-7358}, url = {http://journals.plos.org/ploscompbiol/article?id=10.1371/journal.pcbi.1004418}, doi = {10.1371/journal.pcbi.1004418}, abstract = {Author Summary Identification of transcription factor binding sites based on sequence motifs is typically accompanied by a high false positive rate. Increasing evidence suggests that there are many other factors besides DNA sequence that may affect the binding and interaction of TFs with DNA. Through the integration of sequence motif, chromatin state, and DNA structure properties, we show that TF binding can be better predicted. Moreover, considering chromatin state and DNA structure properties simultaneously yields a significant improvement. While the binding of some TFs can be readily predicted using either chromatin state information or DNA structure, other TFs need both. Thus, our findings provide insights on how different histone modifications and DNA structure properties may influence the binding of a particular TF and thus how TFs regulate gene expression. These features are referred to as sequence “intrinsic properties” because they can be predicted from sequences alone. These intrinsic properties can be used to build a TF binding prediction model that has a similar performance to considering all features. Moreover, the intrinsic property model allows TFBS predictions not only across TFs, but also across DNA-binding domain families that are present in most eukaryotes, suggesting that the model likely can be used across species.}, number = {8}, urldate = {2016-06-16}, journal = {PLOS Comput Biol}, author = {Tsai, Zing Tsung-Yeh and Shiu, Shin-Han and Tsai, Huai-Kuang}, year = {2015}, keywords = {Chromatin, Sequence motif analysis, Forecasting, DNA structure, Nucleosomes, Gene expression, Histones, DNA sequence analysis}, pages = {e1004418}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UZW539AW/Tsai et al. - 2015 - Contribution of Sequence Motif, Chromatin State, a.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RNZ4GZS8/article.html:text/html} } @article{sunnaker_approximate_2013, title = {Approximate {Bayesian} {Computation}}, volume = {9}, issn = {1553-7358}, url = {http://journals.plos.org/ploscompbiol/article?id=10.1371/journal.pcbi.1002803}, doi = {10.1371/journal.pcbi.1002803}, abstract = {Approximate Bayesian computation (ABC) constitutes a class of computational methods rooted in Bayesian statistics . In all model-based statistical inference , the likelihood function is of central importance, since it expresses the probability of the observed data under a particular statistical model, and thus quantifies the support data lend to particular values of parameters and to choices among different models. For simple models, an analytical formula for the likelihood function can typically be derived. However, for more complex models, an analytical formula might be elusive or the likelihood function might be computationally very costly to evaluate. ABC methods bypass the evaluation of the likelihood function. In this way, ABC methods widen the realm of models for which statistical inference can be considered. ABC methods are mathematically well-founded, but they inevitably make assumptions and approximations whose impact needs to be carefully assessed. Furthermore, the wider application domain of ABC exacerbates the challenges of parameter estimation and model selection . ABC has rapidly gained popularity over the last years and in particular for the analysis of complex problems arising in biological sciences (e.g., in population genetics , ecology , epidemiology , and systems biology ).}, number = {1}, urldate = {2016-06-24}, journal = {PLOS Comput Biol}, author = {Sunnåker, Mikael and Busetto, Alberto Giovanni and Numminen, Elina and Corander, Jukka and Foll, Matthieu and Dessimoz, Christophe}, month = jan, year = {2013}, keywords = {Algorithms, Computer software, Simulation and modeling, Statistical inference, Quality control, Statistical distributions, Statistical models, Population genetics}, pages = {e1002803}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ACGRZCFG/Sunnåker et al. - 2013 - Approximate Bayesian Computation.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/F3PCJQ2X/article.html:text/html} } @article{cheng_understanding_2012, title = {Understanding transcriptional regulation by integrative analysis of transcription factor binding data}, volume = {22}, issn = {1088-9051, 1549-5469}, url = {http://genome.cshlp.org/content/22/9/1658}, doi = {10.1101/gr.136838.111}, abstract = {Statistical models have been used to quantify the relationship between gene expression and transcription factor (TF) binding signals. Here we apply the models to the large-scale data generated by the ENCODE project to study transcriptional regulation by TFs. Our results reveal a notable difference in the prediction accuracy of expression levels of transcription start sites (TSSs) captured by different technologies and RNA extraction protocols. In general, the expression levels of TSSs with high CpG content are more predictable than those with low CpG content. For genes with alternative TSSs, the expression levels of downstream TSSs are more predictable than those of the upstream ones. Different TF categories and specific TFs vary substantially in their contributions to predicting expression. Between two cell lines, the differential expression of TSS can be precisely reflected by the difference of TF-binding signals in a quantitative manner, arguing against the conventional on-and-off model of TF binding. Finally, we explore the relationships between TF-binding signals and other chromatin features such as histone modifications and DNase hypersensitivity for determining expression. The models imply that these features regulate transcription in a highly coordinated manner.}, language = {en}, number = {9}, urldate = {2016-07-07}, journal = {Genome Research}, author = {Cheng, Chao and Alexander, Roger and Min, Renqiang and Leng, Jing and Yip, Kevin Y. and Rozowsky, Joel and Yan, Koon-Kiu and Dong, Xianjun and Djebali, Sarah and Ruan, Yijun and Davis, Carrie A. and Carninci, Piero and Lassman, Timo and Gingeras, Thomas R. and Guigó, Roderic and Birney, Ewan and Weng, Zhiping and Snyder, Michael and Gerstein, Mark}, month = sep, year = {2012}, pmid = {22955978}, pages = {1658--1667}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/8PDJPINK/Cheng et al. - 2012 - Understanding transcriptional regulation by integr.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/QUK6KTKM/1658.html:text/html;Supplemental_Figures_and_Tables.pdf:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6WQC2A9C/Supplemental_Figures_and_Tables.pdf:application/pdf} } @article{gordan_distinguishing_2009, title = {Distinguishing direct versus indirect transcription factor–{DNA} interactions}, volume = {19}, issn = {1088-9051, 1549-5469}, url = {http://genome.cshlp.org/content/19/11/2090}, doi = {10.1101/gr.094144.109}, abstract = {Transcriptional regulation is largely enacted by transcription factors (TFs) binding DNA. Large numbers of TF binding motifs have been revealed by ChIP-chip experiments followed by computational DNA motif discovery. However, the success of motif discovery algorithms has been limited when applied to sequences bound in vivo (such as those identified by ChIP-chip) because the observed TF–DNA interactions are not necessarily direct: Some TFs predominantly associate with DNA indirectly through protein partners, while others exhibit both direct and indirect binding. Here, we present the first method for distinguishing between direct and indirect TF–DNA interactions, integrating in vivo TF binding data, in vivo nucleosome occupancy data, and motifs from in vitro protein binding microarray experiments. When applied to yeast ChIP-chip data, our method reveals that only 48\% of the data sets can be readily explained by direct binding of the profiled TF, while 16\% can be explained by indirect DNA binding. In the remaining 36\%, none of the motifs used in our analysis was able to explain the ChIP-chip data, either because the data were too noisy or because the set of motifs was incomplete. As more in vitro TF DNA binding motifs become available, our method could be used to build a complete catalog of direct and indirect TF–DNA interactions. Our method is not restricted to yeast or to ChIP-chip data, but can be applied in any system for which both in vivo binding data and in vitro DNA binding motifs are available.}, language = {en}, number = {11}, urldate = {2016-07-11}, journal = {Genome Research}, author = {Gordân, Raluca and Hartemink, Alexander J. and Bulyk, Martha L.}, month = nov, year = {2009}, pmid = {19652015}, pages = {2090--2100}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/G35V4FIF/Gordân et al. - 2009 - Distinguishing direct versus indirect transcriptio.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Q4K9GBD5/2090.html:text/html} } @article{badis_diversity_2009, title = {Diversity and {Complexity} in {DNA} {Recognition} by {Transcription} {Factors}}, volume = {324}, copyright = {Copyright © 2009, American Association for the Advancement of Science}, issn = {0036-8075, 1095-9203}, url = {http://science.sciencemag.org/content/324/5935/1720}, doi = {10.1126/science.1162327}, abstract = {Transcriptional Regulation Gets More Complicated Sequence preferences of DNA binding proteins are a primary mechanism by which cells interpret the genome. A central goal in genome biology is to identify regulatory sequences in the genome; however, few proteins' DNA binding specificities have been characterized comprehensively. Badis et al. (p. 1720, published online 14 May) studied 104 known and predicted transcription factors (TFs), spanning 22 structural classes, in the mouse genome. While traditional models of TF binding sites are based on a single collection of highly similar DNA sequences, binding profiles were represented better by multiple motifs. Roughly half of the TFs recognized distinct primary and secondary motifs that are different from each other. At least some of these interaction modes appeared to be attributable to biophysically distinct protein conformations, adding to the complexity of transcriptional regulation. Sequence preferences of DNA binding proteins are a primary mechanism by which cells interpret the genome. Despite the central importance of these proteins in physiology, development, and evolution, comprehensive DNA binding specificities have been determined experimentally for only a few proteins. Here, we used microarrays containing all 10–base pair sequences to examine the binding specificities of 104 distinct mouse DNA binding proteins representing 22 structural classes. Our results reveal a complex landscape of binding, with virtually every protein analyzed possessing unique preferences. Roughly half of the proteins each recognized multiple distinctly different sequence motifs, challenging our molecular understanding of how proteins interact with their DNA binding sites. This complexity in DNA recognition may be important in gene regulation and in the evolution of transcriptional regulatory networks. A broad survey of transcription factors reveals that related proteins can have multiple and differing DNA binding specificities. A broad survey of transcription factors reveals that related proteins can have multiple and differing DNA binding specificities.}, language = {en}, number = {5935}, urldate = {2016-07-11}, journal = {Science}, author = {Badis, Gwenael and Berger, Michael F. and Philippakis, Anthony A. and Talukder, Shaheynoor and Gehrke, Andrew R. and Jaeger, Savina A. and Chan, Esther T. and Metzler, Genita and Vedenko, Anastasia and Chen, Xiaoyu and Kuznetsov, Hanna and Wang, Chi-Fong and Coburn, David and Newburger, Daniel E. and Morris, Quaid and Hughes, Timothy R. and Bulyk, Martha L.}, month = jun, year = {2009}, pmid = {19443739}, pages = {1720--1723}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HZKW3MWF/Badis et al. - 2009 - Diversity and Complexity in DNA Recognition by Tra.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/EEUGZASQ/1720.html:text/html} } @article{carlson_specificity_2010, title = {Specificity landscapes of {DNA} binding molecules elucidate biological function}, volume = {107}, issn = {0027-8424, 1091-6490}, url = {http://www.pnas.org/content/107/10/4544}, doi = {10.1073/pnas.0914023107}, abstract = {Evaluating the specificity spectra of DNA binding molecules is a nontrivial challenge that hinders the ability to decipher gene regulatory networks or engineer molecules that act on genomes. Here we compare the DNA sequence specificities for different classes of proteins and engineered DNA binding molecules across the entire sequence space. These high-content data are visualized and interpreted using an interactive “specificity landscape” which simultaneously displays the affinity and specificity of a million-plus DNA sequences. Contrary to expectation, specificity landscapes reveal that synthetic DNA ligands match, and often surpass, the specificities of eukaryotic DNA binding proteins. The landscapes also identify differential specificity constraints imposed by diverse structural folds of natural and synthetic DNA binders. Importantly, the sequence context of a binding site significantly influences binding energetics, and utilizing the full contextual information permits greater accuracy in annotating regulatory elements within a given genome. Assigning such context-dependent binding values to every DNA sequence across the genome yields predictive genome-wide binding landscapes (genomescapes). A genomescape of a synthetic DNA binding molecule provided insight into its differential regulatory activity in cultured cells. The approach we describe will accelerate the creation of precision-tailored DNA therapeutics and uncover principles that govern sequence-specificity of DNA binding molecules.}, language = {en}, number = {10}, urldate = {2016-07-11}, journal = {Proceedings of the National Academy of Sciences}, author = {Carlson, Clayton D. and Warren, Christopher L. and Hauschild, Karl E. and Ozers, Mary S. and Qadir, Naveeda and Bhimsaria, Devesh and Lee, Youngsook and Cerrina, Franco and Ansari, Aseem Z.}, month = mar, year = {2010}, pmid = {20176964}, keywords = {chemical genomics, Cognate Site Identification, DNA binders, genomescapes, Energy Landscapes}, pages = {4544--4549}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/3Z8DU24S/Carlson et al. - 2010 - Specificity landscapes of DNA binding molecules el.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XKEEFARQ/4544.html:text/html} } -@misc{noauthor_additivity_nodate, - title = {Additivity in protein–{DNA} interactions: how good an approximation is it?}, - url = {http://nar.oxfordjournals.org/content/30/20/4442.long}, - urldate = {2016-07-11}, - file = {Additivity in protein–DNA interactions\: how good an approximation is it?:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/2EUIAZDZ/4442.html:text/html} -} - @article{benos_additivity_2002, title = {Additivity in protein–{DNA} interactions: how good an approximation is it?}, volume = {30}, issn = {0305-1048, 1362-4962}, shorttitle = {Additivity in protein–{DNA} interactions}, url = {http://nar.oxfordjournals.org/content/30/20/4442}, doi = {10.1093/nar/gkf578}, abstract = {Man and Stormo and Bulyk et al. recently presented their results on the study of the DNA binding affinity of proteins. In both of these studies the main conclusion is that the additivity assumption, usually applied in methods to search for binding sites, is not true. In the first study, the analysis of binding affinity data from the Mnt repressor protein bound to all possible DNA (sub)targets at positions 16 and 17 of the binding site, showed that those positions are not independent. In the second study, the authors analysed DNA binding affinity data of the wild‐type mouse EGR1 protein and four variants differing on the middle finger. The binding affinity of these proteins was measured to all 64 possible trinucleotide (sub)targets of the middle finger using microarray technology. The analysis of the measurements also showed interdependence among the positions in the DNA target. In the present report, we review the data of both studies and we re‐ analyse them using various statistical methods, including a comparison with a multiple regression approach. We conclude that despite the fact that the additivity assumption does not fit the data perfectly, in most cases it provides a very good approximation of the true nature of the specific protein–DNA interactions. Therefore, additive models can be very useful for the discovery and prediction of binding sites in genomic DNA.}, language = {en}, number = {20}, urldate = {2016-07-11}, journal = {Nucleic Acids Research}, author = {Benos, Panayiotis V. and Bulyk, Martha L. and Stormo, Gary D.}, month = oct, year = {2002}, pmid = {12384591}, pages = {4442--4451}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9NNEN6A3/Benos et al. - 2002 - Additivity in protein–DNA interactions how good a.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/D8CV39DE/4442.html:text/html} } @article{bulyk_nucleotides_2002, title = {Nucleotides of transcription factor binding sites exert interdependent effects on the binding affinities of transcription factors}, volume = {30}, issn = {0305-1048, 1362-4962}, url = {http://nar.oxfordjournals.org/content/30/5/1255}, doi = {10.1093/nar/30.5.1255}, abstract = {We can determine the effects of many possible sequence variations in transcription factor binding sites using microarray binding experiments. Analysis of wild-type and mutant Zif268 (Egr1) zinc fingers bound to microarrays containing all possible central 3 bp triplet binding sites indicates that the nucleotides of transcription factor binding sites cannot be treated independently. This indicates that the current practice of characterizing transcription factor binding sites by mutating individual positions of binding sites one base pair at a time does not provide a true picture of the sequence specificity. Similarly, current bioinformatic practices using either just a consensus sequence, or even mononucleotide frequency weight matrices to provide more complete descriptions of transcription factor binding sites, are not accurate in depicting the true binding site specificities, since these methods rely upon the assumption that the nucleotides of binding sites exert independent effects on binding affinity. Our results stress the importance of complete reference tables of all possible binding sites for comparing protein binding preferences for various DNA sequences. We also show results suggesting that microarray binding data using particular subsets of all possible binding sites can be used to extrapolate the relative binding affinities of all possible full-length binding sites, given a known binding site for use as a starting sequence for site preference refinement.}, language = {en}, number = {5}, urldate = {2016-07-12}, journal = {Nucleic Acids Research}, author = {Bulyk, Martha L. and Johnson, Philip L. F. and Church, George M.}, month = mar, year = {2002}, pmid = {11861919}, pages = {1255--1261}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GW392C6E/Bulyk et al. - 2002 - Nucleotides of transcription factor binding sites .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/553SQDSR/1255.html:text/html} } -@article{zhao_improved_2012, - title = {Improved {Models} for {Transcription} {Factor} {Binding} {Site} {Identification} {Using} {Nonindependent} {Interactions}}, - volume = {191}, - copyright = {Copyright © 2012 by the Genetics Society of America}, - issn = {0016-6731, 1943-2631}, - url = {http://www.genetics.org/content/191/3/781}, - doi = {10.1534/genetics.112.138685}, - abstract = {Identifying transcription factor (TF) binding sites is essential for understanding regulatory networks. The specificity of most TFs is currently modeled using position weight matrices (PWMs) that assume the positions within a binding site contribute independently to binding affinity for any site. Extensive, high-throughput quantitative binding assays let us examine, for the first time, the independence assumption for many TFs. We find that the specificity of most TFs is well fit with the simple PWM model, but in some cases more complex models are required. We introduce a binding energy model (BEM) that can include energy parameters for nonindependent contributions to binding affinity. We show that in most cases where a PWM is not sufficient, a BEM that includes energy parameters for adjacent dinucleotide contributions models the specificity very well. Having more accurate models of specificity greatly improves the interpretation of in vivo TF localization data, such as from chromatin immunoprecipitation followed by sequencing (ChIP-seq) experiments.}, - language = {en}, - number = {3}, - urldate = {2016-07-12}, - journal = {Genetics}, - author = {Zhao, Yue and Ruan, Shuxiang and Pandey, Manishi and Stormo, Gary D.}, - month = jul, - year = {2012}, - pmid = {22505627}, - pages = {781--790}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9SWTFQCK/Zhao et al. - 2012 - Improved Models for Transcription Factor Binding S.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/PV6QGUI3/781.html:text/html} -} - -@misc{noauthor_computational_nodate, - title = {Computational technique for improvement of the position-weight matrices for the {DNA}/protein binding sites}, - url = {http://nar.oxfordjournals.org/content/33/7/2290.long}, - urldate = {2016-07-12}, - file = {Computational technique for improvement of the position-weight matrices for the DNA/protein binding sites:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/T3IW6KGX/2290.html:text/html} -} - @article{gershenzon_computational_2005, title = {Computational technique for improvement of the position-weight matrices for the {DNA}/protein binding sites}, volume = {33}, issn = {0305-1048, 1362-4962}, url = {http://nar.oxfordjournals.org/content/33/7/2290}, doi = {10.1093/nar/gki519}, abstract = {Position-weight matrices (PWMs) are broadly used to locate transcription factor binding sites in DNA sequences. The majority of existing PWMs provide a low level of both sensitivity and specificity. We present a new computational algorithm, a modification of the Staden–Bucher approach, that improves the PWM. We applied the proposed technique on the PWM of the GC-box, binding site for Sp1. The comparison of old and new PWMs shows that the latter increase both sensitivity and specificity. The statistical parameters of GC-box distribution in promoter regions and in the human genome, as well as in each chromosome, are presented. The majority of commonly used PWMs are the 4-row mononucleotide matrices, although 16-row dinucleotide matrices are known to be more informative. The algorithm efficiently determines the 16-row matrices and preliminary results show that such matrices provide better results than 4-row matrices.}, language = {en}, number = {7}, urldate = {2016-07-12}, journal = {Nucleic Acids Research}, author = {Gershenzon, Naum I. and Stormo, Gary D. and Ioshikhes, Ilya P.}, month = jan, year = {2005}, pmid = {15849315}, pages = {2290--2301}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/FJ85FE73/Gershenzon et al. - 2005 - Computational technique for improvement of the pos.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/3GJ3CQ3F/2290.html:text/html} } @article{djordjevic_biophysical_2003, title = {A {Biophysical} {Approach} to {Transcription} {Factor} {Binding} {Site} {Discovery}}, volume = {13}, issn = {1088-9051, 1549-5469}, url = {http://genome.cshlp.org/content/13/11/2381}, doi = {10.1101/gr.1271603}, abstract = {Identification of transcription factor binding sites within regulatory segments of genomic DNA is an important step toward understanding of the regulatory circuits that control expression of genes. Here, we describe a novel bioinformatics method that bases classification of potential binding sites explicitly on the estimate of sequence-specific binding energy of a given transcription factor. The method also estimates the chemical potential of the factor that defines the threshold of binding. In contrast with the widely used information-theoretic weight matrix method, the new approach correctly describes saturation in the transcription factor/DNA binding probability. This results in a significant improvement in the number of expected false positives, particularly in the ubiquitous case of low-specificity factors. In the strong binding limit, the algorithm is related to the “support vector machine” approach to pattern recognition. The new method is used to identify likely genomic binding sites for the E. coli transcription factors collected in the DPInteract database. In addition, for CRP (a global regulatory factor), the likely regulatory modality (i.e., repressor or activator) of predicted binding sites is determined.}, language = {en}, number = {11}, urldate = {2016-08-03}, journal = {Genome Research}, author = {Djordjevic, Marko and Sengupta, Anirvan M. and Shraiman, Boris I.}, month = nov, year = {2003}, pmid = {14597652}, pages = {2381--2390}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UT9VDSVF/Djordjevic et al. - 2003 - A Biophysical Approach to Transcription Factor Bin.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/J8XU8D44/2381.html:text/html} } @article{liu_whole-genome_2006, title = {Whole-genome comparison of {Leu}3 binding in vitro and in vivo reveals the importance of nucleosome occupancy in target site selection}, volume = {16}, issn = {1088-9051, 1549-5469}, url = {http://genome.cshlp.org/content/16/12/1517}, doi = {10.1101/gr.5655606}, abstract = {Sequence motifs that are potentially recognized by DNA-binding proteins occur far more often in genomic DNA than do observed in vivo protein–DNA interactions. To determine how chromatin influences the utilization of particular DNA-binding sites, we compared the in vivo genome-wide binding location of the yeast transcription factor Leu3 to the binding location observed on the same genomic DNA in the absence of any protein cofactors. We found that the DNA-sequence motif recognized by Leu3 in vitro and in vivo was functionally indistinguishable, but Leu3 bound different genomic locations under the two conditions. Accounting for nucleosome occupancy in addition to DNA-sequence motifs significantly improved the prediction of protein–DNA interactions in vivo, but not the prediction of sites bound by purified Leu3 in vitro. Use of histone modification data does not further improve binding predictions, presumably because their effect is already manifest in the global histone distribution. Measurements of nucleosome occupancy in strains that differ in Leu3 genotype show that low nucleosome occupancy at loci bound by Leu3 is not a consequence of Leu3 binding. These results permit quantitation of the epigenetic influence that chromatin exerts on DNA binding-site selection, and provide evidence for an instructive, functionally important role for nucleosome occupancy in determining patterns of regulatory factor targeting genome-wide.}, language = {en}, number = {12}, urldate = {2016-08-08}, journal = {Genome Research}, author = {Liu, Xiao and Lee, Cheol-Koo and Granek, Joshua A. and Clarke, Neil D. and Lieb, Jason D.}, month = dec, year = {2006}, pmid = {17053089}, pages = {1517--1528}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GA2KFRND/Liu et al. - 2006 - Whole-genome comparison of Leu3 binding in vitro a.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/P9UXRF68/1517.html:text/html} } @article{zhu_high-resolution_2009, title = {High-resolution {DNA}-binding specificity analysis of yeast transcription factors}, volume = {19}, issn = {1088-9051, 1549-5469}, url = {http://genome.cshlp.org/content/19/4/556}, doi = {10.1101/gr.090233.108}, abstract = {Transcription factors (TFs) regulate the expression of genes through sequence-specific interactions with DNA-binding sites. However, despite recent progress in identifying in vivo TF binding sites by microarray readout of chromatin immunoprecipitation (ChIP-chip), nearly half of all known yeast TFs are of unknown DNA-binding specificities, and many additional predicted TFs remain uncharacterized. To address these gaps in our knowledge of yeast TFs and their cis regulatory sequences, we have determined high-resolution binding profiles for 89 known and predicted yeast TFs, over more than 2.3 million gapped and ungapped 8-bp sequences (“k-mers”). We report 50 new or significantly different direct DNA-binding site motifs for yeast DNA-binding proteins and motifs for eight proteins for which only a consensus sequence was previously known; in total, this corresponds to over a 50\% increase in the number of yeast DNA-binding proteins with experimentally determined DNA-binding specificities. Among other novel regulators, we discovered proteins that bind the PAC (Polymerase A and C) motif (GATGAG) and regulate ribosomal RNA (rRNA) transcription and processing, core cellular processes that are constituent to ribosome biogenesis. In contrast to earlier data types, these comprehensive k-mer binding data permit us to consider the regulatory potential of genomic sequence at the individual word level. These k-mer data allowed us to reannotate in vivo TF binding targets as direct or indirect and to examine TFs' potential effects on gene expression in ∼1700 environmental and cellular conditions. These approaches could be adapted to identify TFs and cis regulatory elements in higher eukaryotes.}, language = {en}, number = {4}, urldate = {2016-08-08}, journal = {Genome Research}, author = {Zhu, Cong and Byers, Kelsey J. R. P. and McCord, Rachel Patton and Shi, Zhenwei and Berger, Michael F. and Newburger, Daniel E. and Saulrieta, Katrina and Smith, Zachary and Shah, Mita V. and Radhakrishnan, Mathangi and Philippakis, Anthony A. and Hu, Yanhui and Masi, Federico De and Pacek, Marcin and Rolfs, Andreas and Murthy, Tal and LaBaer, Joshua and Bulyk, Martha L.}, month = apr, year = {2009}, pmid = {19158363}, pages = {556--566}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/DFQVE56N/Zhu et al. - 2009 - High-resolution DNA-binding specificity analysis o.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/BIRIECRR/556.html:text/html} } @article{weirauch_evaluation_2013, title = {Evaluation of methods for modeling transcription factor sequence specificity}, volume = {31}, copyright = {© 2013 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {1087-0156}, url = {http://www.nature.com/nbt/journal/v31/n2/abs/nbt.2486.html}, doi = {10.1038/nbt.2486}, abstract = {Genomic analyses often involve scanning for potential transcription factor (TF) binding sites using models of the sequence specificity of DNA binding proteins. Many approaches have been developed to model and learn a protein's DNA-binding specificity, but these methods have not been systematically compared. Here we applied 26 such approaches to in vitro protein binding microarray data for 66 mouse TFs belonging to various families. For nine TFs, we also scored the resulting motif models on in vivo data, and found that the best in vitro–derived motifs performed similarly to motifs derived from the in vivo data. Our results indicate that simple models based on mononucleotide position weight matrices trained by the best methods perform similarly to more complex models for most TFs examined, but fall short in specific cases ({\textless}10\% of the TFs examined here). In addition, the best-performing motifs typically have relatively low information content, consistent with widespread degeneracy in eukaryotic TF sequence preferences. View full text}, language = {en}, number = {2}, urldate = {2016-08-08}, journal = {Nature Biotechnology}, author = {Weirauch, Matthew T. and Cote, Atina and Norel, Raquel and Annala, Matti and Zhao, Yue and Riley, Todd R. and Saez-Rodriguez, Julio and Cokelaer, Thomas and Vedenko, Anastasia and Talukder, Shaheynoor and {Dream5 Consortium} and Bussemaker, Harmen J. and Morris, Quaid D. and Bulyk, Martha L. and Stolovitzky, Gustavo and Hughes, Timothy R.}, month = feb, year = {2013}, keywords = {Transcription Factors, functional genomics, Computational biology and bioinformatics}, pages = {126--134}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/QINBEMQC/Weirauch et al. - 2013 - Evaluation of methods for modeling transcription f.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ANR3WQZ2/nbt.2486.html:text/html} } @article{zhao_quantitative_2011, title = {Quantitative analysis demonstrates most transcription factors require only simple models of specificity}, volume = {29}, copyright = {© 2011 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {1087-0156}, url = {http://www.nature.com/nbt/journal/v29/n6/full/nbt.1893.html}, doi = {10.1038/nbt.1893}, language = {en}, number = {6}, urldate = {2016-08-11}, journal = {Nature Biotechnology}, author = {Zhao, Yue and Stormo, Gary D.}, month = jun, year = {2011}, keywords = {Transcription Factors, functional genomics, Computational biology and bioinformatics}, pages = {480--483}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/3874FVNA/Zhao et Stormo - 2011 - Quantitative analysis demonstrates most transcript.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XBGB842T/nbt.1893.html:text/html} } @article{ha_cops:_2012, title = {{COPS}: {Detecting} {Co}-{Occurrence} and {Spatial} {Arrangement} of {Transcription} {Factor} {Binding} {Motifs} in {Genome}-{Wide} {Datasets}}, volume = {7}, issn = {1932-6203}, shorttitle = {{COPS}}, url = {http://journals.plos.org/plosone/article?id=10.1371/journal.pone.0052055}, doi = {10.1371/journal.pone.0052055}, abstract = {In multi-cellular organisms, spatiotemporal activity of cis -regulatory DNA elements depends on their occupancy by different transcription factors (TFs). In recent years, genome-wide ChIP-on-Chip, ChIP-Seq and DamID assays have been extensively used to unravel the combinatorial interaction of TFs with cis -regulatory modules (CRMs) in the genome. Even though genome-wide binding profiles are increasingly becoming available for different TFs, single TF binding profiles are in most cases not sufficient for dissecting complex regulatory networks. Thus, potent computational tools detecting statistically significant and biologically relevant TF-motif co-occurrences in genome-wide datasets are essential for analyzing context-dependent transcriptional regulation. We have developed COPS ( C o- O ccurrence P attern S earch), a new bioinformatics tool based on a combination of association rules and Markov chain models, which detects co-occurring TF binding sites (BSs) on genomic regions of interest. COPS scans DNA sequences for frequent motif patterns using a Frequent-Pattern tree based data mining approach, which allows efficient performance of the software with respect to both data structure and implementation speed, in particular when mining large datasets. Since transcriptional gene regulation very often relies on the formation of regulatory protein complexes mediated by closely adjoining TF binding sites on CRMs, COPS additionally detects preferred short distance between co-occurring TF motifs. The performance of our software with respect to biological significance was evaluated using three published datasets containing genomic regions that are independently bound by several TFs involved in a defined biological process. In sum, COPS is a fast, efficient and user-friendly tool mining statistically and biologically significant TFBS co-occurrences and therefore allows the identification of TFs that combinatorially regulate gene expression.}, number = {12}, urldate = {2016-08-15}, journal = {PLOS ONE}, author = {Ha, Nati and Polychronidou, Maria and Lohmann, Ingrid}, year = {2012}, keywords = {Gene regulation, Sequence motif analysis, Invertebrate genomics, Genome analysis, Mammalian genomics, Drosophila melanogaster, Genomic databases, Mesoderm}, pages = {e52055}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/T3FVC4RM/Ha et al. - 2012 - COPS Detecting Co-Occurrence and Spatial Arrangem.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/DCMZ65QU/article.html:text/html} } @article{touzet_efficient_2007, title = {Efficient and accurate {P}-value computation for {Position} {Weight} {Matrices}}, volume = {2}, issn = {1748-7188}, url = {http://dx.doi.org/10.1186/1748-7188-2-15}, doi = {10.1186/1748-7188-2-15}, abstract = {Position Weight Matrices (PWMs) are probabilistic representations of signals in sequences. They are widely used to model approximate patterns in DNA or in protein sequences. The usage of PWMs needs as a prerequisite to knowing the statistical significance of a word according to its score. This is done by defining the P-value of a score, which is the probability that the background model can achieve a score larger than or equal to the observed value. This gives rise to the following problem: Given a P-value, find the corresponding score threshold. Existing methods rely on dynamic programming or probability generating functions. For many examples of PWMs, they fail to give accurate results in a reasonable amount of time.}, urldate = {2016-08-16}, journal = {Algorithms for Molecular Biology}, author = {Touzet, Hélène and Varré, Jean-Stéphane}, year = {2007}, pages = {15}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/25QZE893/Touzet et Varré - 2007 - Efficient and accurate P-value computation for Pos.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ENEM24D3/1748-7188-2-15.html:text/html} } @article{loo_computational_2009, title = {Computational methods for the detection of cis-regulatory modules}, volume = {10}, issn = {1467-5463, 1477-4054}, url = {http://bib.oxfordjournals.org/content/10/5/509}, doi = {10.1093/bib/bbp025}, abstract = {Metazoan transcription regulation occurs through the concerted action of multiple transcription factors that bind co-operatively to cis-regulatory modules (CRMs). The annotation of these key regulators of transcription is lagging far behind the annotation of the transcriptome itself. Here, we give an overview of existing computational methods to detect these CRMs in metazoan genomes. We subdivide these methods into three classes: CRM scanners screen sequences for CRMs based on predefined models that often consist of multiple position weight matrices (PWMs). CRM builders construct models of similar CRMs controlling a set of co-regulated or co-expressed genes. CRM genome screeners screen sequences or complete genomes for CRMs as homotypic or heterotypic clusters of binding sites for any combination of transcription factors. We believe that CRM scanners are currently the most advanced methods, although their applicability is limited. Finally, we argue that CRM builders that make use of PWM libraries will benefit greatly from future advances and will prove to be most instrumental for the annotation of regulatory regions in metazoan genomes.}, language = {en}, number = {5}, urldate = {2016-08-16}, journal = {Briefings in Bioinformatics}, author = {Loo, Peter Van and Marynen, Peter}, month = sep, year = {2009}, pmid = {19498042}, keywords = {transcription regulation, cis-regulatory modules, genome annotation, regulatory regions, computational CRM detection}, pages = {509--524}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/U5ZEZPMH/Loo et Marynen - 2009 - Computational methods for the detection of cis-reg.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RXMCQQB8/509.html:text/html} } -@article{man_non-independence_2001, - title = {Non-independence of {Mnt} repressor-operator interaction determined by a new quantitative multiple fluorescence relative affinity ({QuMFRA}) assay}, - volume = {29}, - issn = {1362-4962}, - abstract = {Salmonella bacteriophage repressor Mnt belongs to the ribbon-helix-helix class of transcription factors. Previous SELEX results suggested that interactions of Mnt with positions 16 and 17 of the operator DNA are not independent. Using a newly developed high-throughput quantitative multiple fluorescence relative affinity (QuMFRA) assay, we directly quantified the relative equilibrium binding constants (K(ref)) of Mnt to operators carrying all the possible dinucleotide combinations at these two positions. Results show that Mnt prefers binding to C, instead of wild-type A, at position 16 when wild-type C at position 17 is changed to other bases. The measured K(ref) values of double mutants were also higher than the values predicted from single mutants, demonstrating the non-independence of these two positions. The ability to produce a large number of quantitative binding data simultaneously and the potential to scale up makes QuMFRA a valuable tool for the large-scale study of macromolecular interaction.}, - language = {eng}, - number = {12}, - journal = {Nucleic Acids Research}, - author = {Man, T. K. and Stormo, G. D.}, - month = jun, - year = {2001}, - pmid = {11410653}, - pmcid = {PMC55749}, - keywords = {DNA, Models, Molecular, fluorescence, thermodynamics, viral proteins, DNA-binding proteins, Bacteriophage P22, Base Sequence, Binding Sites, Fluorescent Dyes, Mutation, Operator Regions, Genetic, Protein Binding, Repressor Proteins, Salmonella, Substrate Specificity, Viral Regulatory and Accessory Proteins}, - pages = {2471--2478} -} - @article{yip_classification_2012, title = {Classification of human genomic regions based on experimentally determined binding sites of more than 100 transcription-related factors}, volume = {13}, issn = {1474-760X}, url = {http://dx.doi.org/10.1186/gb-2012-13-9-r48}, doi = {10.1186/gb-2012-13-9-r48}, abstract = {Transcription factors function by binding different classes of regulatory elements. The Encyclopedia of DNA Elements (ENCODE) project has recently produced binding data for more than 100 transcription factors from about 500 ChIP-seq experiments in multiple cell types. While this large amount of data creates a valuable resource, it is nonetheless overwhelmingly complex and simultaneously incomplete since it covers only a small fraction of all human transcription factors.}, urldate = {2016-08-17}, journal = {Genome Biology}, author = {Yip, Kevin Y. and Cheng, Chao and Bhardwaj, Nitin and Brown, James B. and Leng, Jing and Kundaje, Anshul and Rozowsky, Joel and Birney, Ewan and Bickel, Peter and Snyder, Michael and Gerstein, Mark}, year = {2012}, pages = {R48}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HCR3FP2I/Yip et al. - 2012 - Classification of human genomic regions based on e.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Z7ZTJIFA/gb-2012-13-9-r48.html:text/html} } @article{natarajan_predicting_2012, title = {Predicting cell-type–specific gene expression from regions of open chromatin}, volume = {22}, issn = {1088-9051, 1549-5469}, url = {http://genome.cshlp.org/content/22/9/1711}, doi = {10.1101/gr.135129.111}, abstract = {Complex patterns of cell-type–specific gene expression are thought to be achieved by combinatorial binding of transcription factors (TFs) to sequence elements in regulatory regions. Predicting cell-type–specific expression in mammals has been hindered by the oftentimes unknown location of distal regulatory regions. To alleviate this bottleneck, we used DNase-seq data from 19 diverse human cell types to identify proximal and distal regulatory elements at genome-wide scale. Matched expression data allowed us to separate genes into classes of cell-type–specific up-regulated, down-regulated, and constitutively expressed genes. CG dinucleotide content and DNA accessibility in the promoters of these three classes of genes displayed substantial differences, highlighting the importance of including these aspects in modeling gene expression. We associated DNase I hypersensitive sites (DHSs) with genes, and trained classifiers for different expression patterns. TF sequence motif matches in DHSs provided a strong performance improvement in predicting gene expression over the typical baseline approach of using proximal promoter sequences. In particular, we achieved competitive performance when discriminating up-regulated genes from different cell types or genes up- and down-regulated under the same conditions. We identified previously known and new candidate cell-type–specific regulators. The models generated testable predictions of activating or repressive functions of regulators. DNase I footprints for these regulators were indicative of their direct binding to DNA. In summary, we successfully used information of open chromatin obtained by a single assay, DNase-seq, to address the problem of predicting cell-type–specific gene expression in mammalian organisms directly from regulatory sequence.}, language = {en}, number = {9}, urldate = {2016-08-17}, journal = {Genome Research}, author = {Natarajan, Anirudh and Yardımcı, Galip Gürkan and Sheffield, Nathan C. and Crawford, Gregory E. and Ohler, Uwe}, month = sep, year = {2012}, pmid = {22955983}, pages = {1711--1722}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/KQRSH46X/Natarajan et al. - 2012 - Predicting cell-type–specific gene expression from.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/IVRNI5D9/1711.html:text/html} } -@article{thurman_accessible_2012-1, - title = {The accessible chromatin landscape of the human genome}, - volume = {489}, - copyright = {© 2012 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, - issn = {0028-0836}, - url = {http://www.nature.com/nature/journal/v489/n7414/full/nature11232.html}, - doi = {10.1038/nature11232}, - abstract = {DNase I hypersensitive sites (DHSs) are markers of regulatory DNA and have underpinned the discovery of all classes of cis-regulatory elements including enhancers, promoters, insulators, silencers and locus control regions. Here we present the first extensive map of human DHSs identified through genome-wide profiling in 125 diverse cell and tissue types. We identify {\textasciitilde}2.9 million DHSs that encompass virtually all known experimentally validated cis-regulatory sequences and expose a vast trove of novel elements, most with highly cell-selective regulation. Annotating these elements using ENCODE data reveals novel relationships between chromatin accessibility, transcription, DNA methylation and regulatory factor occupancy patterns. We connect {\textasciitilde}580,000 distal DHSs with their target promoters, revealing systematic pairing of different classes of distal DHSs and specific promoter types. Patterning of chromatin accessibility at many regulatory regions is organized with dozens to hundreds of co-activated elements, and the transcellular DNase I sensitivity pattern at a given region can predict cell-type-specific functional behaviours. The DHS landscape shows signatures of recent functional evolutionary constraint. However, the DHS compartment in pluripotent and immortalized cells exhibits higher mutation rates than that in highly differentiated cells, exposing an unexpected link between chromatin accessibility, proliferative potential and patterns of human variation.}, - language = {en}, - number = {7414}, - urldate = {2016-08-17}, - journal = {Nature}, - author = {Thurman, Robert E. and Rynes, Eric and Humbert, Richard and Vierstra, Jeff and Maurano, Matthew T. and Haugen, Eric and Sheffield, Nathan C. and Stergachis, Andrew B. and Wang, Hao and Vernot, Benjamin and Garg, Kavita and John, Sam and Sandstrom, Richard and Bates, Daniel and Boatman, Lisa and Canfield, Theresa K. and Diegel, Morgan and Dunn, Douglas and Ebersol, Abigail K. and Frum, Tristan and Giste, Erika and Johnson, Audra K. and Johnson, Ericka M. and Kutyavin, Tanya and Lajoie, Bryan and Lee, Bum-Kyu and Lee, Kristen and London, Darin and Lotakis, Dimitra and Neph, Shane and Neri, Fidencio and Nguyen, Eric D. and Qu, Hongzhu and Reynolds, Alex P. and Roach, Vaughn and Safi, Alexias and Sanchez, Minerva E. and Sanyal, Amartya and Shafer, Anthony and Simon, Jeremy M. and Song, Lingyun and Vong, Shinny and Weaver, Molly and Yan, Yongqi and Zhang, Zhancheng and Zhang, Zhuzhu and Lenhard, Boris and Tewari, Muneesh and Dorschner, Michael O. and Hansen, R. Scott and Navas, Patrick A. and Stamatoyannopoulos, George and Iyer, Vishwanath R. and Lieb, Jason D. and Sunyaev, Shamil R. and Akey, Joshua M. and Sabo, Peter J. and Kaul, Rajinder and Furey, Terrence S. and Dekker, Job and Crawford, Gregory E. and Stamatoyannopoulos, John A.}, - month = sep, - year = {2012}, - keywords = {evolution, genetics, genomics, molecular biology}, - pages = {75--82}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/A8NSPKM6/Thurman et al. - 2012 - The accessible chromatin landscape of the human ge.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ZTVB3AN5/nature11232.html:text/html} -} - @article{neph_expansive_2012, title = {An expansive human regulatory lexicon encoded in transcription factor footprints}, volume = {489}, copyright = {© 2012 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {0028-0836}, url = {http://www.nature.com/nature/journal/v489/n7414/full/nature11212.html}, doi = {10.1038/nature11212}, abstract = {Regulatory factor binding to genomic DNA protects the underlying sequence from cleavage by DNase I, leaving nucleotide-resolution footprints. Using genomic DNase I footprinting across 41 diverse cell and tissue types, we detected 45 million transcription factor occupancy events within regulatory regions, representing differential binding to 8.4 million distinct short sequence elements. Here we show that this small genomic sequence compartment, roughly twice the size of the exome, encodes an expansive repertoire of conserved recognition sequences for DNA-binding proteins that nearly doubles the size of the human cis–regulatory lexicon. We find that genetic variants affecting allelic chromatin states are concentrated in footprints, and that these elements are preferentially sheltered from DNA methylation. High-resolution DNase I cleavage patterns mirror nucleotide-level evolutionary conservation and track the crystallographic topography of protein–DNA interfaces, indicating that transcription factor structure has been evolutionarily imprinted on the human genome sequence. We identify a stereotyped 50-base-pair footprint that precisely defines the site of transcript origination within thousands of human promoters. Finally, we describe a large collection of novel regulatory factor recognition motifs that are highly conserved in both sequence and function, and exhibit cell-selective occupancy patterns that closely parallel major regulators of development, differentiation and pluripotency.}, language = {en}, number = {7414}, urldate = {2016-08-17}, journal = {Nature}, author = {Neph, Shane and Vierstra, Jeff and Stergachis, Andrew B. and Reynolds, Alex P. and Haugen, Eric and Vernot, Benjamin and Thurman, Robert E. and John, Sam and Sandstrom, Richard and Johnson, Audra K. and Maurano, Matthew T. and Humbert, Richard and Rynes, Eric and Wang, Hao and Vong, Shinny and Lee, Kristen and Bates, Daniel and Diegel, Morgan and Roach, Vaughn and Dunn, Douglas and Neri, Jun and Schafer, Anthony and Hansen, R. Scott and Kutyavin, Tanya and Giste, Erika and Weaver, Molly and Canfield, Theresa and Sabo, Peter and Zhang, Miaohua and Balasundaram, Gayathri and Byron, Rachel and MacCoss, Michael J. and Akey, Joshua M. and Bender, M. A. and Groudine, Mark and Kaul, Rajinder and Stamatoyannopoulos, John A.}, month = sep, year = {2012}, keywords = {evolution, genetics, genomics, molecular biology}, pages = {83--90}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/M3T8WI2W/Neph et al. - 2012 - An expansive human regulatory lexicon encoded in t.pdf:application/pdf;Neph et al.-2012 - supplemental.pdf:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/M3T8WI2W/Neph et al.-2012 - supplemental.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/MCX576A7/nature11212.html:text/html} } @article{gerstein_architecture_2012, title = {Architecture of the human regulatory network derived from {ENCODE} data}, volume = {489}, copyright = {© 2012 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {0028-0836}, url = {http://www.nature.com/nature/journal/v489/n7414/full/nature11245.html}, doi = {10.1038/nature11245}, abstract = {Transcription factors bind in a combinatorial fashion to specify the on-and-off states of genes; the ensemble of these binding events forms a regulatory network, constituting the wiring diagram for a cell. To examine the principles of the human transcriptional regulatory network, we determined the genomic binding information of 119 transcription-related factors in over 450 distinct experiments. We found the combinatorial, co-association of transcription factors to be highly context specific: distinct combinations of factors bind at specific genomic locations. In particular, there are significant differences in the binding proximal and distal to genes. We organized all the transcription factor binding into a hierarchy and integrated it with other genomic information (for example, microRNA regulation), forming a dense meta-network. Factors at different levels have different properties; for instance, top-level transcription factors more strongly influence expression and middle-level ones co-regulate targets to mitigate information-flow bottlenecks. Moreover, these co-regulations give rise to many enriched network motifs (for example, noise-buffering feed-forward loops). Finally, more connected network components are under stronger selection and exhibit a greater degree of allele-specific activity (that is, differential binding to the two parental alleles). The regulatory information obtained in this study will be crucial for interpreting personal genome sequences and understanding basic principles of human biology and disease.}, language = {en}, number = {7414}, urldate = {2016-08-17}, journal = {Nature}, author = {Gerstein, Mark B. and Kundaje, Anshul and Hariharan, Manoj and Landt, Stephen G. and Yan, Koon-Kiu and Cheng, Chao and Mu, Xinmeng Jasmine and Khurana, Ekta and Rozowsky, Joel and Alexander, Roger and Min, Renqiang and Alves, Pedro and Abyzov, Alexej and Addleman, Nick and Bhardwaj, Nitin and Boyle, Alan P. and Cayting, Philip and Charos, Alexandra and Chen, David Z. and Cheng, Yong and Clarke, Declan and Eastman, Catharine and Euskirchen, Ghia and Frietze, Seth and Fu, Yao and Gertz, Jason and Grubert, Fabian and Harmanci, Arif and Jain, Preti and Kasowski, Maya and Lacroute, Phil and Leng, Jing and Lian, Jin and Monahan, Hannah and O’Geen, Henriette and Ouyang, Zhengqing and Partridge, E. Christopher and Patacsil, Dorrelyn and Pauli, Florencia and Raha, Debasish and Ramirez, Lucia and Reddy, Timothy E. and Reed, Brian and Shi, Minyi and Slifer, Teri and Wang, Jing and Wu, Linfeng and Yang, Xinqiong and Yip, Kevin Y. and Zilberman-Schapira, Gili and Batzoglou, Serafim and Sidow, Arend and Farnham, Peggy J. and Myers, Richard M. and Weissman, Sherman M. and Snyder, Michael}, month = sep, year = {2012}, keywords = {genetics, genomics}, pages = {91--100}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/47UG7U49/Gerstein et al. - 2012 - Architecture of the human regulatory network deriv.pdf:application/pdf;Gerstein et al. - 2012 - supplemental.pdf:/home/romaingroux/.zotero/zotero/mgp9vo2c.default/zotero/storage/47UG7U49/Gerstein et al. - 2012 - supplemental.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9SNJKB5X/nature11245.html:text/html} } @article{whitfield_functional_2012, title = {Functional analysis of transcription factor binding sites in human promoters}, volume = {13}, issn = {1474-760X}, url = {http://dx.doi.org/10.1186/gb-2012-13-9-r50}, doi = {10.1186/gb-2012-13-9-r50}, abstract = {The binding of transcription factors to specific locations in the genome is integral to the orchestration of transcriptional regulation in cells. To characterize transcription factor binding site function on a large scale, we predicted and mutagenized 455 binding sites in human promoters. We carried out functional tests on these sites in four different immortalized human cell lines using transient transfections with a luciferase reporter assay, primarily for the transcription factors CTCF, GABP, GATA2, E2F, STAT, and YY1.}, urldate = {2016-08-17}, journal = {Genome Biology}, author = {Whitfield, Troy W. and Wang, Jie and Collins, Patrick J. and Partridge, E. Christopher and Aldred, Shelley Force and Trinklein, Nathan D. and Myers, Richard M. and Weng, Zhiping}, year = {2012}, pages = {R50}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/IPRTU6H6/Whitfield et al. - 2012 - Functional analysis of transcription factor bindin.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/AGSRGNM2/gb-2012-13-9-r50.html:text/html} } @article{heinz_simple_2010, title = {Simple {Combinations} of {Lineage}-{Determining} {Transcription} {Factors} {Prime} cis-{Regulatory} {Elements} {Required} for {Macrophage} and {B} {Cell} {Identities}}, volume = {38}, issn = {1097-2765}, url = {http://www.sciencedirect.com/science/article/pii/S1097276510003667}, doi = {10.1016/j.molcel.2010.05.004}, abstract = {Summary Genome-scale studies have revealed extensive, cell type-specific colocalization of transcription factors, but the mechanisms underlying this phenomenon remain poorly understood. Here, we demonstrate in macrophages and B cells that collaborative interactions of the common factor PU.1 with small sets of macrophage- or B cell lineage-determining transcription factors establish cell-specific binding sites that are associated with the majority of promoter-distal H3K4me1-marked genomic regions. PU.1 binding initiates nucleosome remodeling, followed by H3K4 monomethylation at large numbers of genomic regions associated with both broadly and specifically expressed genes. These locations serve as beacons for additional factors, exemplified by liver X receptors, which drive both cell-specific gene expression and signal-dependent responses. Together with analyses of transcription factor binding and H3K4me1 patterns in other cell types, these studies suggest that simple combinations of lineage-determining transcription factors can specify the genomic sites ultimately responsible for both cell identity and cell type-specific responses to diverse signaling inputs.}, number = {4}, urldate = {2016-08-23}, journal = {Molecular Cell}, author = {Heinz, Sven and Benner, Christopher and Spann, Nathanael and Bertolino, Eric and Lin, Yin C. and Laslo, Peter and Cheng, Jason X. and Murre, Cornelis and Singh, Harinder and Glass, Christopher K.}, month = may, year = {2010}, keywords = {DNA, MOLIMMUNO}, pages = {576--589}, file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/CPTT6622/Heinz et al. - 2010 - Simple Combinations of Lineage-Determining Transcr.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RHRR6DM6/S1097276510003667.html:text/html} } @article{perner_inference_2014, title = {Inference of interactions between chromatin modifiers and histone modifications: from {ChIP}-{Seq} data to chromatin-signaling}, volume = {42}, issn = {0305-1048, 1362-4962}, shorttitle = {Inference of interactions between chromatin modifiers and histone modifications}, url = {http://nar.oxfordjournals.org/content/42/22/13689}, doi = {10.1093/nar/gku1234}, abstract = {Chromatin modifiers and histone modifications are components of a chromatin-signaling network involved in transcription and its regulation. The interactions between chromatin modifiers and histone modifications are often unknown, are based on the analysis of few genes or are studied in vitro. Here, we apply computational methods to recover interactions between chromatin modifiers and histone modifications from genome-wide ChIP-Seq data. These interactions provide a high-confidence backbone of the chromatin-signaling network. Many recovered interactions have literature support; others provide hypotheses about yet unknown interactions. We experimentally verified two of these predicted interactions, leading to a link between H4K20me1 and members of the Polycomb Repressive Complexes 1 and 2. Our results suggest that our computationally derived interactions are likely to lead to novel biological insights required to establish the connectivity of the chromatin-signaling network involved in transcription and its regulation.}, language = {en}, number = {22}, urldate = {2016-09-27}, journal = {Nucleic Acids Research}, author = {Perner, Juliane and Lasserre, Julia and Kinkley, Sarah and Vingron, Martin and Chung, Ho-Ryun}, month = dec, year = {2014}, pmid = {25414326}, pages = {13689--13695}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/X5PX2TZR/Perner et al. - 2014 - Inference of interactions between chromatin modifi.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/EFRWRTEU/13689.html:text/html} } @article{mukherjee_rapid_2004, title = {Rapid analysis of the {DNA}-binding specificities of transcription factors with {DNA} microarrays}, volume = {36}, copyright = {© 2004 Nature Publishing Group}, issn = {1061-4036}, url = {http://www.nature.com/ng/journal/v36/n12/full/ng1473.html}, doi = {10.1038/ng1473}, abstract = {We developed a new DNA microarray-based technology, called protein binding microarrays (PBMs), that allows rapid, high-throughput characterization of the in vitro DNA binding–site sequence specificities of transcription factors in a single day. Using PBMs, we identified the DNA binding–site sequence specificities of the yeast transcription factors Abf1, Rap1 and Mig1. Comparison of these proteins' in vitro binding sites with their in vivo binding sites indicates that PBM-derived sequence specificities can accurately reflect in vivo DNA sequence specificities. In addition to previously identified targets, Abf1, Rap1 and Mig1 bound to 107, 90 and 75 putative new target intergenic regions, respectively, many of which were upstream of previously uncharacterized open reading frames. Comparative sequence analysis indicated that many of these newly identified sites are highly conserved across five sequenced sensu stricto yeast species and, therefore, are probably functional in vivo binding sites that may be used in a condition-specific manner. Similar PBM experiments should be useful in identifying new cis regulatory elements and transcriptional regulatory networks in various genomes.}, language = {en}, number = {12}, urldate = {2016-08-23}, journal = {Nature Genetics}, author = {Mukherjee, Sonali and Berger, Michael F. and Jona, Ghil and Wang, Xun S. and Muzzey, Dale and Snyder, Michael and Young, Richard A. and Bulyk, Martha L.}, month = dec, year = {2004}, pages = {1331--1339}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/W3HW5SCU/Mukherjee et al. - 2004 - Rapid analysis of the DNA-binding specificities of.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/66IUM3A8/ng1473.html:text/html} } @article{berger_compact_2006, title = {Compact, universal {DNA} microarrays to comprehensively determine transcription-factor binding site specificities}, volume = {24}, copyright = {© 2006 Nature Publishing Group}, issn = {1087-0156}, url = {http://www.nature.com/nbt/journal/v24/n11/full/nbt1246.html}, doi = {10.1038/nbt1246}, abstract = {Transcription factors (TFs) interact with specific DNA regulatory sequences to control gene expression throughout myriad cellular processes. However, the DNA binding specificities of only a small fraction of TFs are sufficiently characterized to predict the sequences that they can and cannot bind. We present a maximally compact, synthetic DNA sequence design for protein binding microarray (PBM) experiments that represents all possible DNA sequence variants of a given length k (that is, all 'k-mers') on a single, universal microarray. We constructed such all k-mer microarrays covering all 10–base pair (bp) binding sites by converting high-density single-stranded oligonucleotide arrays to double-stranded (ds) DNA arrays. Using these microarrays we comprehensively determined the binding specificities over a full range of affinities for five TFs of different structural classes from yeast, worm, mouse and human. The unbiased coverage of all k-mers permits high-throughput interrogation of binding site preferences, including nucleotide interdependencies, at unprecedented resolution.}, language = {en}, number = {11}, urldate = {2016-08-23}, journal = {Nature Biotechnology}, author = {Berger, Michael F. and Philippakis, Anthony A. and Qureshi, Aaron M. and He, Fangxue S. and Estep, Preston W. and Bulyk, Martha L.}, month = nov, year = {2006}, pages = {1429--1435}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/F5R2C9GV/Berger et al. - 2006 - Compact, universal DNA microarrays to comprehensiv.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/NV6A7NWG/nbt1246.html:text/html} } @article{kouzarides_chromatin_2007, title = {Chromatin {Modifications} and {Their} {Function}}, volume = {128}, issn = {0092-8674}, url = {http://www.sciencedirect.com/science/article/pii/S0092867407001845}, doi = {10.1016/j.cell.2007.02.005}, abstract = {The surface of nucleosomes is studded with a multiplicity of modifications. At least eight different classes have been characterized to date and many different sites have been identified for each class. Operationally, modifications function either by disrupting chromatin contacts or by affecting the recruitment of nonhistone proteins to chromatin. Their presence on histones can dictate the higher-order chromatin structure in which DNA is packaged and can orchestrate the ordered recruitment of enzyme complexes to manipulate DNA. In this way, histone modifications have the potential to influence many fundamental biological processes, some of which may be epigenetically inherited.}, number = {4}, urldate = {2016-08-25}, journal = {Cell}, author = {Kouzarides, Tony}, month = feb, year = {2007}, pages = {693--705}, file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/5W94T3M9/Kouzarides - 2007 - Chromatin Modifications and Their Function.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/SS4ZR8W3/S0092867407001845.html:text/html} } @article{fischle_regulation_2005, title = {Regulation of {HP}1–chromatin binding by histone {H}3 methylation and phosphorylation}, volume = {438}, copyright = {© 2005 Nature Publishing Group}, issn = {0028-0836}, url = {http://www.nature.com/nature/journal/v438/n7071/full/nature04219.html}, doi = {10.1038/nature04219}, abstract = {Tri-methylation of histone H3 lysine 9 is important for recruiting heterochromatin protein 1 (HP1) to discrete regions of the genome, thereby regulating gene expression, chromatin packaging and heterochromatin formation. Here we show that HP1, -, and - are released from chromatin during the M phase of the cell cycle, even though tri-methylation levels of histone H3 lysine 9 remain unchanged. However, the additional, transient modification of histone H3 by phosphorylation of serine 10 next to the more stable methyl-lysine 9 mark is sufficient to eject HP1 proteins from their binding sites. Inhibition or depletion of the mitotic kinase Aurora B, which phosphorylates serine 10 on histone H3, causes retention of HP1 proteins on mitotic chromosomes, suggesting that H3 serine 10 phosphorylation is necessary for the dissociation of HP1 from chromatin in M phase. These findings establish a regulatory mechanism of protein–protein interactions, through a combinatorial readout of two adjacent post-translational modifications: a stable methylation and a dynamic phosphorylation mark.}, language = {en}, number = {7071}, urldate = {2016-08-25}, journal = {Nature}, author = {Fischle, Wolfgang and Tseng, Boo Shan and Dormann, Holger L. and Ueberheide, Beatrix M. and Garcia, Benjamin A. and Shabanowitz, Jeffrey and Hunt, Donald F. and Funabiki, Hironori and Allis, C. David}, month = dec, year = {2005}, pages = {1116--1122}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/5CFJUGEB/Fischle et al. - 2005 - Regulation of HP1–chromatin binding by histone H3 .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/B5G4MKGB/nature04219.html:text/html} } @article{stormo_use_1982, title = {Use of the ‘{Perceptron}’ algorithm to distinguish translational initiation sites in {E}. coli}, volume = {10}, issn = {0305-1048, 1362-4962}, url = {http://nar.oxfordjournals.org/content/10/9/2997}, doi = {10.1093/nar/10.9.2997}, abstract = {We have used a “Perceptron” algorithm to find a weighting function which distinguishes E. coli translational initiation sites from all other sites in a library of over 78,000 nucleotides of mRNA sequence. The “Perceptron” examined sequences as linear representations. The “Perceptron” is more successful at finding gene beginnings than our previous searches using “rules” (see previous paper). We note that the weighting function can find translational initiation sites within sequences that were not included in the training set.}, language = {en}, number = {9}, urldate = {2016-08-25}, journal = {Nucleic Acids Research}, author = {Stormo, Gary D. and Schneider, Thomas D. and Gold, Larry and Ehrenfeucht, Andrzej}, month = may, year = {1982}, pmid = {7048259}, pages = {2997--3011}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/IU3EEKKP/Stormo et al. - 1982 - Use of the ‘Perceptron’ algorithm to distinguish t.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/2V79XU79/2997.html:text/html} } @article{takahashi_induction_2006, title = {Induction of {Pluripotent} {Stem} {Cells} from {Mouse} {Embryonic} and {Adult} {Fibroblast} {Cultures} by {Defined} {Factors}}, volume = {126}, issn = {0092-8674, 1097-4172}, url = {/cell/abstract/S0092-8674(06)00976-7}, doi = {10.1016/j.cell.2006.07.024}, abstract = {Differentiated cells can be reprogrammed to an embryonic-like state by transfer of nuclear contents into oocytes or by fusion with embryonic stem (ES) cells. Little is known about factors that induce this reprogramming. Here, we demonstrate induction of pluripotent stem cells from mouse embryonic or adult fibroblasts by introducing four factors, Oct3/4, Sox2, c-Myc, and Klf4, under ES cell culture conditions. Unexpectedly, Nanog was dispensable. These cells, which we designated iPS (induced pluripotent stem) cells, exhibit the morphology and growth properties of ES cells and express ES cell marker genes. Subcutaneous transplantation of iPS cells into nude mice resulted in tumors containing a variety of tissues from all three germ layers. Following injection into blastocysts, iPS cells contributed to mouse embryonic development. These data demonstrate that pluripotent stem cells can be directly generated from fibroblast cultures by the addition of only a few defined factors.}, language = {English}, number = {4}, urldate = {2016-08-26}, journal = {Cell}, author = {Takahashi, Kazutoshi and Yamanaka, Shinya}, month = aug, year = {2006}, pmid = {16904174, 16904174}, pages = {663--676}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/47IZ9WIV/Takahashi et Yamanaka - 2006 - Induction of Pluripotent Stem Cells from Mouse Emb.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/N9BCVH52/S0092-8674(06)00976-7.html:text/html} } @article{yu_induced_2007, title = {Induced {Pluripotent} {Stem} {Cell} {Lines} {Derived} from {Human} {Somatic} {Cells}}, volume = {318}, copyright = {American Association for the Advancement of Science}, issn = {0036-8075, 1095-9203}, url = {http://science.sciencemag.org/content/318/5858/1917}, doi = {10.1126/science.1151526}, abstract = {Somatic cell nuclear transfer allows trans-acting factors present in the mammalian oocyte to reprogram somatic cell nuclei to an undifferentiated state. We show that four factors (OCT4, SOX2, NANOG, and LIN28) are sufficient to reprogram human somatic cells to pluripotent stem cells that exhibit the essential characteristics of embryonic stem (ES) cells. These induced pluripotent human stem cells have normal karyotypes, express telomerase activity, express cell surface markers and genes that characterize human ES cells, and maintain the developmental potential to differentiate into advanced derivatives of all three primary germ layers. Such induced pluripotent human cell lines should be useful in the production of new disease models and in drug development, as well as for applications in transplantation medicine, once technical limitations (for example, mutation through viral integration) are eliminated. Human fibroblasts transfected with four genes exhibit the properties of embryonic stem cells. Human fibroblasts transfected with four genes exhibit the properties of embryonic stem cells.}, language = {en}, number = {5858}, urldate = {2016-08-26}, journal = {Science}, author = {Yu, Junying and Vodyanik, Maxim A. and Smuga-Otto, Kim and Antosiewicz-Bourget, Jessica and Frane, Jennifer L. and Tian, Shulan and Nie, Jeff and Jonsdottir, Gudrun A. and Ruotti, Victor and Stewart, Ron and Slukvin, Igor I. and Thomson, James A.}, month = dec, year = {2007}, pmid = {18029452}, pages = {1917--1920}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/QJZJ4TMW/Yu et al. - 2007 - Induced Pluripotent Stem Cell Lines Derived from H.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/N5KDWEPM/1917.html:text/html} } @article{darnell_transcription_2002, title = {Transcription factors as targets for cancer therapy}, volume = {2}, copyright = {© 2002 Nature Publishing Group}, issn = {1474-175X}, url = {http://www.nature.com/nrc/journal/v2/n10/full/nrc906.html}, doi = {10.1038/nrc906}, abstract = {A limited list of transcription factors are overactive in most human cancer cells, which makes them targets for the development of anticancer drugs. That they are the most direct and hopeful targets for treating cancer is proposed, and this is supported by the fact that there are many more human oncogenes in signalling pathways than there are oncogenic transcription factors. But how could specific transcription-factor activity be inhibited?}, language = {en}, number = {10}, urldate = {2016-08-26}, journal = {Nature Reviews Cancer}, author = {Darnell, James E.}, month = oct, year = {2002}, pages = {740--749}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/G93Q5ETV/Darnell - 2002 - Transcription factors as targets for cancer therap.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/E7PDA294/nrc906.html:text/html} } @article{zaret_pioneer_2011, title = {Pioneer transcription factors: establishing competence for gene expression}, volume = {25}, issn = {0890-9369, 1549-5477}, shorttitle = {Pioneer transcription factors}, url = {http://genesdev.cshlp.org/content/25/21/2227}, doi = {10.1101/gad.176826.111}, abstract = {Transcription factors are adaptor molecules that detect regulatory sequences in the DNA and target the assembly of protein complexes that control gene expression. Yet much of the DNA in the eukaryotic cell is in nucleosomes and thereby occluded by histones, and can be further occluded by higher-order chromatin structures and repressor complexes. Indeed, genome-wide location analyses have revealed that, for all transcription factors tested, the vast majority of potential DNA-binding sites are unoccupied, demonstrating the inaccessibility of most of the nuclear DNA. This raises the question of how target sites at silent genes become bound de novo by transcription factors, thereby initiating regulatory events in chromatin. Binding cooperativity can be sufficient for many kinds of factors to simultaneously engage a target site in chromatin and activate gene expression. However, in cases in which the binding of a series of factors is sequential in time and thus not initially cooperative, special “pioneer transcription factors” can be the first to engage target sites in chromatin. Such initial binding can passively enhance transcription by reducing the number of additional factors that are needed to bind the DNA, culminating in activation. In addition, pioneer factor binding can actively open up the local chromatin and directly make it competent for other factors to bind. Passive and active roles for the pioneer factor FoxA occur in embryonic development, steroid hormone induction, and human cancers. Herein we review the field and describe how pioneer factors may enable cellular reprogramming.}, language = {en}, number = {21}, urldate = {2016-08-26}, journal = {Genes \& Development}, author = {Zaret, Kenneth S. and Carroll, Jason S.}, month = nov, year = {2011}, pmid = {22056668}, keywords = {cancer, development, pioneer factors, transcription, activation, competence, steroid hormone receptors}, pages = {2227--2241}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/8UMN6NNI/Zaret et Carroll - 2011 - Pioneer transcription factors establishing compet.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/JXSETAKT/2227.html:text/html} } @article{zhao_inferring_2009, title = {Inferring {Binding} {Energies} from {Selected} {Binding} {Sites}}, volume = {5}, issn = {1553-7358}, url = {http://journals.plos.org/ploscompbiol/article?id=10.1371/journal.pcbi.1000590}, doi = {10.1371/journal.pcbi.1000590}, abstract = {Author Summary The DNA binding sites of transcription factors that control gene expression are often predicted based on a collection of known or selected binding sites. The most commonly used methods for inferring the binding site pattern, or sequence motif, assume that the sites are selected in proportion to their affinity for the transcription factor, ignoring the effect of the transcription factor concentration. We have developed a new maximum likelihood approach, in a program called BEEML, that directly takes into account the transcription factor concentration as well as non-specific contributions to the binding affinity, and we show in simulation studies that it gives a much more accurate model of the transcription factor binding sites than previous methods. We also develop a new method for extracting binding sites for a transcription factor from a random pool of DNA sequences, called high-throughput SELEX (HT-SELEX), and we show that after a single round of selection BEEML can obtain an accurate model of the transcription factor binding sites.}, number = {12}, urldate = {2016-08-26}, journal = {PLOS Comput Biol}, author = {Zhao, Yue and Granas, David and Stormo, Gary D.}, year = {2009}, keywords = {Transcription Factors, biophysics, Sequence motif analysis, DNA-binding proteins, DNA sequence analysis, Binding analysis, Sequence analysis, Free energy}, pages = {e1000590}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9MID4X6P/Zhao et al. - 2009 - Inferring Binding Energies from Selected Binding S.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/54ET4E87/article.html:text/html} } @article{ellrott_identifying_2002, title = {Identifying transcription factor binding sites through {Markov} chain optimization}, volume = {18}, issn = {1367-4803, 1460-2059}, url = {http://bioinformatics.oxfordjournals.org/content/18/suppl_2/S100}, doi = {10.1093/bioinformatics/18.suppl_2.S100}, abstract = {Even though every cell in an organism contains the same genetic material, each cell does not express the same cohort of genes. Therefore, one of the major problems facing genomic research today is to determine not only which genes are differentially expressed and under what conditions, but also how the expression of those genes is regulated. The first step in determining differential gene expression is the binding of sequence-specific DNA binding proteins (i.e. transcription factors) to regulatory regions of the genes (i.e. promoters and enhancers). An important aspect to understanding how a given transcription factor functions is to know the entire gamut of binding sites and subsequently potential target genes that the factor may bind/regulate. In this study, we have developed a computer algorithm to scan genomic databases for transcription factor binding sites, based on a novel Markov chain optimization method, and used it to scan the human genome for sites that bind to hepatocyte nuclear factor 4 α (HNF4α). A list of 71 known HNF4α binding sites from the literature were used to train our Markov chain model. By looking at the window of 600 nucleotides around the transcription start site of each confirmed gene on the human genome, we identified 849 sites with varying binding potential and experimentally tested 109 of those sites for binding to HNF4α. Our results show that the program was very successful in identifying 77 new HNF4α binding sites with varying binding affinities (i.e. a 71\% success rate). Therefore, this computational method for searching genomic databases for potential transcription factor binding sites is a powerful tool for investigating mechanisms of differential gene regulation. Contact: jiang@cs.ucr.edu}, language = {en}, number = {suppl 2}, urldate = {2016-08-29}, journal = {Bioinformatics}, author = {Ellrott, Kyle and Yang, Chuhu and Sladek, Frances M. and Jiang, Tao}, month = oct, year = {2002}, pmid = {12385991}, pages = {S100--S109}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/5226R9D9/Ellrott et al. - 2002 - Identifying transcription factor binding sites thr.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/U4937D39/S100.html:text/html} } @article{granek_explicit_2005, title = {Explicit equilibrium modeling of transcription-factor binding and gene regulation}, volume = {6}, issn = {1474-760X}, url = {http://dx.doi.org/10.1186/gb-2005-6-10-r87}, doi = {10.1186/gb-2005-6-10-r87}, abstract = {We have developed a computational model that predicts the probability of transcription factor binding to any site in the genome. GOMER (generalizable occupancy model of expression regulation) calculates binding probabilities on the basis of position weight matrices, and incorporates the effects of cooperativity and competition by explicit calculation of coupled binding equilibria. GOMER can be used to test hypotheses regarding gene regulation that build upon this physically principled prediction of protein-DNA binding.}, urldate = {2016-08-29}, journal = {Genome Biology}, author = {Granek, Joshua A. and Clarke, Neil D.}, year = {2005}, pages = {R87}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UNX9KDTM/Granek et Clarke - 2005 - Explicit equilibrium modeling of transcription-fac.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7H3ZRUJ6/gb-2005-6-10-r87.html:text/html} } @article{berg_selection_1988, title = {Selection of {DNA} binding sites by regulatory proteins}, volume = {200}, issn = {0022-2836}, url = {http://www.sciencedirect.com/science/article/pii/0022283688904822}, doi = {10.1016/0022-2836(88)90482-2}, abstract = {The statistics of base-pair usage within known recognition sites for a particular DNA-binding protein can be used to estimate the relative protein binding affinities to these sites, as well as to sites containing any other combinations of base-pairs. As has been described elsewhere, the connection between base-pair statistics and binding free energy is made by an equal probability selection assumption; i.e. that all base-pair sequences that provide appropriate binding strength are equally likely to have been chosen as recognition sites in the course of evolution. This is analogous to a statistical-mechanical system where all configurations with the same energy are equally likely to occur. In this communication, we apply the statistical-mechanical selection theory to analyze the base-pair statistics of the known recognition sequences for the cyclic AMP receptor protein (CRP). The theoretical predictions are found to be in reasonable agreement with binding data for those sequences for which experimental binding information is available, thus lending support to the basic assumptions of the selection theory. On the basis of this agreement, we can predict the affinity for CRP binding to any base-pair sequence, albeit with a large statistical uncertainty. When the known recognition sites for CRP are ranked according to predicted binding affinities, we find that the ranking is consistent with the hypothesis that the level of function of these sites parallels their fractional saturation with CRP-cAMP under in-vivo conditions. When applied to the entire genome, the theory predicts the existence of a large number of randomly occurring “pseudosites” with strong binding affinity for CRP. It appears that most CRP molecules are engaged in non-productive binding at non-specific or pseudospecific sites under in-vivo conditions. In this sense, the specificity of the CRP binding site is very low. Relative specificity requirements for polymerases, repressors and activators are compared in light of the results of this and the first paper in this series.}, number = {4}, urldate = {2016-08-29}, journal = {Journal of Molecular Biology}, author = {Berg, Otto G. and von Hippel, Peter H.}, month = apr, year = {1988}, pages = {709--723}, file = {1-s2.0-0968000488900850-main.pdf:/home/romaingroux/.zotero/zotero/mgp9vo2c.default/zotero/storage/MN27QNMC/1-s2.0-0968000488900850-main.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/MN27QNMC/0022283688904822.html:text/html} } @article{huang_optimized_2006, title = {Optimized mixed {Markov} models for motif identification}, volume = {7}, issn = {1471-2105}, url = {http://dx.doi.org/10.1186/1471-2105-7-279}, doi = {10.1186/1471-2105-7-279}, abstract = {Identifying functional elements, such as transcriptional factor binding sites, is a fundamental step in reconstructing gene regulatory networks and remains a challenging issue, largely due to limited availability of training samples.}, urldate = {2016-08-31}, journal = {BMC Bioinformatics}, author = {Huang, Weichun and Umbach, David M. and Ohler, Uwe and Li, Leping}, year = {2006}, pages = {279}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RQARQ6ZZ/Huang et al. - 2006 - Optimized mixed Markov models for motif identifica.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/TF3D3CHE/1471-2105-7-279.html:text/html} } @article{maaskola_binding_2014, title = {Binding site discovery from nucleic acid sequences by discriminative learning of hidden {Markov} models}, volume = {42}, issn = {0305-1048, 1362-4962}, url = {http://nar.oxfordjournals.org/content/42/21/12995}, doi = {10.1093/nar/gku1083}, abstract = {We present a discriminative learning method for pattern discovery of binding sites in nucleic acid sequences based on hidden Markov models. Sets of positive and negative example sequences are mined for sequence motifs whose occurrence frequency varies between the sets. The method offers several objective functions, but we concentrate on mutual information of condition and motif occurrence. We perform a systematic comparison of our method and numerous published motif-finding tools. Our method achieves the highest motif discovery performance, while being faster than most published methods. We present case studies of data from various technologies, including ChIP-Seq, RIP-Chip and PAR-CLIP, of embryonic stem cell transcription factors and of RNA-binding proteins, demonstrating practicality and utility of the method. For the alternative splicing factor RBM10, our analysis finds motifs known to be splicing-relevant. The motif discovery method is implemented in the free software package Discrover. It is applicable to genome- and transcriptome-scale data, makes use of available repeat experiments and aside from binary contrasts also more complex data configurations can be utilized.}, language = {en}, number = {21}, urldate = {2016-08-31}, journal = {Nucleic Acids Research}, author = {Maaskola, Jonas and Rajewsky, Nikolaus}, month = dec, year = {2014}, pmid = {25389269}, pages = {12995--13011}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/M2JZH46C/Maaskola et Rajewsky - 2014 - Binding site discovery from nucleic acid sequences.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XRV4RKGA/12995.html:text/html} } -@article{zhao_improved_2012-1, +@article{zhao_improved_2012, title = {Improved {Models} for {Transcription} {Factor} {Binding} {Site} {Identification} {Using} {Nonindependent} {Interactions}}, volume = {191}, copyright = {Copyright © 2012 by the Genetics Society of America}, issn = {0016-6731, 1943-2631}, url = {http://www.genetics.org/content/191/3/781}, doi = {10.1534/genetics.112.138685}, abstract = {Identifying transcription factor (TF) binding sites is essential for understanding regulatory networks. The specificity of most TFs is currently modeled using position weight matrices (PWMs) that assume the positions within a binding site contribute independently to binding affinity for any site. Extensive, high-throughput quantitative binding assays let us examine, for the first time, the independence assumption for many TFs. We find that the specificity of most TFs is well fit with the simple PWM model, but in some cases more complex models are required. We introduce a binding energy model (BEM) that can include energy parameters for nonindependent contributions to binding affinity. We show that in most cases where a PWM is not sufficient, a BEM that includes energy parameters for adjacent dinucleotide contributions models the specificity very well. Having more accurate models of specificity greatly improves the interpretation of in vivo TF localization data, such as from chromatin immunoprecipitation followed by sequencing (ChIP-seq) experiments.}, language = {en}, number = {3}, urldate = {2016-08-31}, journal = {Genetics}, author = {Zhao, Yue and Ruan, Shuxiang and Pandey, Manishi and Stormo, Gary D.}, month = jul, year = {2012}, pmid = {22505627}, pages = {781--790}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/IV477UNE/Zhao et al. - 2012 - Improved Models for Transcription Factor Binding S.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/PZZ2SF6P/781.html:text/html} } @article{kulakovskiy_binding_2013, title = {From binding motifs in chip-seq data to improved models of transcription factor binding sites}, volume = {11}, issn = {0219-7200}, url = {http://www.worldscientific.com/doi/abs/10.1142/S0219720013400040}, doi = {10.1142/S0219720013400040}, abstract = {Chromatin immunoprecipitation followed by deep sequencing (ChIP-Seq) became a method of choice to locate DNA segments bound by different regulatory proteins. ChIP-Seq produces extremely valuable information to study transcriptional regulation. The wet-lab workflow is often supported by downstream computational analysis including construction of models of nucleotide sequences of transcription factor binding sites in DNA, which can be used to detect binding sites in ChIP-Seq data at a single base pair resolution. The most popular TFBS model is represented by positional weight matrix (PWM) with statistically independent positional weights of nucleotides in different columns; such PWMs are constructed from a gapless multiple local alignment of sequences containing experimentally identified TFBSs. Modern high-throughput techniques, including ChIP-Seq, provide enough data for careful training of advanced models containing more parameters than PWM. Yet, many suggested multiparametric models often provide only incremental improvement of TFBS recognition quality comparing to traditional PWMs trained on ChIP-Seq data. We present a novel computational tool, diChIPMunk, that constructs TFBS models as optimal dinucleotide PWMs, thus accounting for correlations between nucleotides neighboring in input sequences. diChIPMunk utilizes many advantages of ChIPMunk, its ancestor algorithm, accounting for ChIP-Seq base coverage profiles ("peak shape") and using the effective subsampling-based core procedure which allows processing of large datasets. We demonstrate that diPWMs constructed by diChIPMunk outperform traditional PWMs constructed by ChIPMunk from the same ChIP-Seq data. Software website: http://autosome.ru/dichipmunk/}, number = {01}, urldate = {2016-08-31}, journal = {Journal of Bioinformatics and Computational Biology}, author = {Kulakovskiy, Ivan and Levitsky, Victor and Oshchepkov, Dmitry and Bryzgalov, Leonid and Vorontsov, Ilya and Makeev, Vsevolod}, month = jan, year = {2013}, pages = {1340004}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UQPRI686/Kulakovskiy et al. - 2013 - From binding motifs in chip-seq data to improved m.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/IN3VXZCU/S0219720013400040.html:text/html} } @article{mathelier_jaspar_2014, title = {{JASPAR} 2014: an extensively expanded and updated open-access database of transcription factor binding profiles}, volume = {42}, issn = {0305-1048, 1362-4962}, shorttitle = {{JASPAR} 2014}, url = {http://nar.oxfordjournals.org/content/42/D1/D142}, doi = {10.1093/nar/gkt997}, abstract = {JASPAR (http://jaspar.genereg.net) is the largest open-access database of matrix-based nucleotide profiles describing the binding preference of transcription factors from multiple species. The fifth major release greatly expands the heart of JASPAR—the JASPAR CORE subcollection, which contains curated, non-redundant profiles—with 135 new curated profiles (74 in vertebrates, 8 in Drosophila melanogaster, 10 in Caenorhabditis elegans and 43 in Arabidopsis thaliana; a 30\% increase in total) and 43 older updated profiles (36 in vertebrates, 3 in D. melanogaster and 4 in A. thaliana; a 9\% update in total). The new and updated profiles are mainly derived from published chromatin immunoprecipitation-seq experimental datasets. In addition, the web interface has been enhanced with advanced capabilities in browsing, searching and subsetting. Finally, the new JASPAR release is accompanied by a new BioPython package, a new R tool package and a new R/Bioconductor data package to facilitate access for both manual and automated methods.}, language = {en}, number = {D1}, urldate = {2016-08-31}, journal = {Nucleic Acids Research}, author = {Mathelier, Anthony and Zhao, Xiaobei and Zhang, Allen W. and Parcy, François and Worsley-Hunt, Rebecca and Arenillas, David J. and Buchman, Sorana and Chen, Chih-yu and Chou, Alice and Ienasescu, Hans and Lim, Jonathan and Shyr, Casper and Tan, Ge and Zhou, Michelle and Lenhard, Boris and Sandelin, Albin and Wasserman, Wyeth W.}, month = jan, year = {2014}, pmid = {24194598}, pages = {D142--D147}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/AFFH4HPG/Mathelier et al. - 2014 - JASPAR 2014 an extensively expanded and updated o.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/23IJ7N8C/D142.html:text/html} } -@article{man_non-independence_2001-1, +@article{man_non-independence_2001, title = {Non-independence of {Mnt} repressor–operator interaction determined by a new quantitative multiple fluorescence relative affinity ({QuMFRA}) assay}, volume = {29}, issn = {0305-1048}, url = {http://www.ncbi.nlm.nih.gov/pmc/articles/PMC55749/}, abstract = {Salmonella bacteriophage repressor Mnt belongs to the ribbon–helix–helix class of transcription factors. Previous SELEX results suggested that interactions of Mnt with positions 16 and 17 of the operator DNA are not independent. Using a newly developed high-throughput quantitative multiple fluorescence relative affinity (QuMFRA) assay, we directly quantified the relative equilibrium binding constants (Kref) of Mnt to operators carrying all the possible dinucleotide combinations at these two positions. Results show that Mnt prefers binding to C, instead of wild-type A, at position 16 when wild-type C at position 17 is changed to other bases. The measured Kref values of double mutants were also higher than the values predicted from single mutants, demonstrating the non-independence of these two positions. The ability to produce a large number of quantitative binding data simultaneously and the potential to scale up makes QuMFRA a valuable tool for the large-scale study of macromolecular interaction.}, number = {12}, urldate = {2016-09-02}, journal = {Nucleic Acids Research}, author = {Man, Tsz-Kwong and Stormo, Gary D.}, month = jun, year = {2001}, pmid = {11410653}, pmcid = {PMC55749}, pages = {2471--2478}, file = {PubMed Central Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/JDFJKSJ4/Man et Stormo - 2001 - Non-independence of Mnt repressor–operator interac.pdf:application/pdf} } -@article{munteanu_cougerco-factors_2014, - title = {{COUGER}—co-factors associated with uniquely-bound genomic regions}, - volume = {42}, - issn = {0305-1048, 1362-4962}, - url = {http://nar.oxfordjournals.org/content/42/W1/W461}, - doi = {10.1093/nar/gku435}, - abstract = {Most transcription factors (TFs) belong to protein families that share a common DNA binding domain and have very similar DNA binding preferences. However, many paralogous TFs (i.e. members of the same TF family) perform different regulatory functions and interact with different genomic regions in the cell. A potential mechanism for achieving this differential in vivo specificity is through interactions with protein co-factors. Computational tools for studying the genomic binding profiles of paralogous TFs and identifying their putative co-factors are currently lacking. Here, we present an interactive web implementation of COUGER, a classification-based framework for identifying protein co-factors that might provide specificity to paralogous TFs. COUGER takes as input two sets of genomic regions bound by paralogous TFs, and it identifies a small set of putative co-factors that best distinguish the two sets of sequences. To achieve this task, COUGER uses a classification approach, with features that reflect the DNA-binding specificities of the putative co-factors. The identified co-factors are presented in a user-friendly output page, together with information that allows the user to understand and to explore the contributions of individual co-factor features. COUGER can be run as a stand-alone tool or through a web interface: http://couger.oit.duke.edu.}, - language = {en}, - number = {W1}, - urldate = {2016-09-27}, - journal = {Nucleic Acids Research}, - author = {Munteanu, Alina and Ohler, Uwe and Gordân, Raluca}, - month = jul, - year = {2014}, - pmid = {24861628}, - pages = {W461--W467}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7VJD97U6/Munteanu et al. - 2014 - COUGER—co-factors associated with uniquely-bound g.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/MN4JNW29/W461.html:text/html} -} - @article{ibrahim_jamm:_2015, title = {{JAMM}: a peak finder for joint analysis of {NGS} replicates}, volume = {31}, issn = {1367-4803, 1460-2059}, shorttitle = {{JAMM}}, url = {http://bioinformatics.oxfordjournals.org/content/31/1/48}, doi = {10.1093/bioinformatics/btu568}, abstract = {Motivation: Although peak finding in next-generation sequencing (NGS) datasets has been addressed extensively, there is no consensus on how to analyze and process biological replicates. Furthermore, most peak finders do not focus on accurate determination of enrichment site widths and are not widely applicable to different types of datasets. Results: We developed JAMM (Joint Analysis of NGS replicates via Mixture Model clustering): a peak finder that can integrate information from biological replicates, determine enrichment site widths accurately and resolve neighboring narrow peaks. JAMM is a universal peak finder that is applicable to different types of datasets. We show that JAMM is among the best performing peak finders in terms of site detection accuracy and in terms of accurate determination of enrichment sites widths. In addition, JAMM’s replicate integration improves peak spatial resolution, sorting and peak finding accuracy. Availability and implementation: JAMM is available for free and can run on Linux machines through the command line: http://code.google.com/p/jamm-peak-finder Contact: mahmoud.ibrahim@mdc-berlin.de or uwe.ohler@mdc-berlin.de. Supplementary information: Supplementary data are available at Bioinformatics online.}, language = {en}, number = {1}, urldate = {2016-10-17}, journal = {Bioinformatics}, author = {Ibrahim, Mahmoud M. and Lacadie, Scott A. and Ohler, Uwe}, month = jan, year = {2015}, pmid = {25223640}, pages = {48--55}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/IMV7KPV6/Ibrahim et al. - 2015 - JAMM a peak finder for joint analysis of NGS repl.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/VJKHWJP7/48.html:text/html} } -@article{munteanu_cougerco-factors_2014-1, +@article{munteanu_cougerco-factors_2014, title = {{COUGER}—co-factors associated with uniquely-bound genomic regions}, volume = {42}, issn = {0305-1048, 1362-4962}, url = {http://nar.oxfordjournals.org/content/42/W1/W461}, doi = {10.1093/nar/gku435}, abstract = {Most transcription factors (TFs) belong to protein families that share a common DNA binding domain and have very similar DNA binding preferences. However, many paralogous TFs (i.e. members of the same TF family) perform different regulatory functions and interact with different genomic regions in the cell. A potential mechanism for achieving this differential in vivo specificity is through interactions with protein co-factors. Computational tools for studying the genomic binding profiles of paralogous TFs and identifying their putative co-factors are currently lacking. Here, we present an interactive web implementation of COUGER, a classification-based framework for identifying protein co-factors that might provide specificity to paralogous TFs. COUGER takes as input two sets of genomic regions bound by paralogous TFs, and it identifies a small set of putative co-factors that best distinguish the two sets of sequences. To achieve this task, COUGER uses a classification approach, with features that reflect the DNA-binding specificities of the putative co-factors. The identified co-factors are presented in a user-friendly output page, together with information that allows the user to understand and to explore the contributions of individual co-factor features. COUGER can be run as a stand-alone tool or through a web interface: http://couger.oit.duke.edu.}, language = {en}, number = {W1}, urldate = {2016-10-17}, journal = {Nucleic Acids Research}, author = {Munteanu, Alina and Ohler, Uwe and Gordân, Raluca}, month = jul, year = {2014}, pmid = {24861628}, pages = {W461--W467}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GHRB6VBH/Munteanu et al. - 2014 - COUGER—co-factors associated with uniquely-bound g.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9A38J3KA/W461.html:text/html} } @article{perner_inference_2014-1, title = {Inference of interactions between chromatin modifiers and histone modifications: from {ChIP}-{Seq} data to chromatin-signaling}, volume = {42}, issn = {0305-1048, 1362-4962}, shorttitle = {Inference of interactions between chromatin modifiers and histone modifications}, url = {http://nar.oxfordjournals.org/content/42/22/13689}, doi = {10.1093/nar/gku1234}, abstract = {Chromatin modifiers and histone modifications are components of a chromatin-signaling network involved in transcription and its regulation. The interactions between chromatin modifiers and histone modifications are often unknown, are based on the analysis of few genes or are studied in vitro. Here, we apply computational methods to recover interactions between chromatin modifiers and histone modifications from genome-wide ChIP-Seq data. These interactions provide a high-confidence backbone of the chromatin-signaling network. Many recovered interactions have literature support; others provide hypotheses about yet unknown interactions. We experimentally verified two of these predicted interactions, leading to a link between H4K20me1 and members of the Polycomb Repressive Complexes 1 and 2. Our results suggest that our computationally derived interactions are likely to lead to novel biological insights required to establish the connectivity of the chromatin-signaling network involved in transcription and its regulation.}, language = {en}, number = {22}, urldate = {2016-10-17}, journal = {Nucleic Acids Research}, author = {Perner, Juliane and Lasserre, Julia and Kinkley, Sarah and Vingron, Martin and Chung, Ho-Ryun}, month = dec, year = {2014}, pmid = {25414326}, pages = {13689--13695}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/22APC2DQ/Perner et al. - 2014 - Inference of interactions between chromatin modifi.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/5AKI5GG2/13689.html:text/html} } @article{mendoza-parra_reconstructed_2016, title = {Reconstructed cell fate-regulatory programs in stem cells reveal hierarchies and key factors of neurogenesis}, issn = {1088-9051, 1549-5469}, url = {http://genome.cshlp.org/content/early/2016/09/20/gr.208926.116}, doi = {10.1101/gr.208926.116}, abstract = {An international, peer-reviewed genome sciences journal featuring outstanding original research that offers novel insights into the biology of all organisms}, language = {en}, urldate = {2016-10-17}, journal = {Genome Research}, author = {Mendoza-Parra, Marco-Antonio and Malysheva, Valeriya and Saleem, Mohamed Ashick Mohamed and Lieb, Michele and Godel, Aurelie and Gronemeyer, Hinrich}, month = sep, year = {2016}, pmid = {27650846}, pages = {gr.208926.116}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/FF6R7IRA/Mendoza-Parra et al. - 2016 - Reconstructed cell fate-regulatory programs in ste.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6G67CP2U/gr.208926.116.html:text/html} } -@article{mendoza-parra_reconstructed_2016-1, - title = {Reconstructed cell fate-regulatory programs in stem cells reveal hierarchies and key factors of neurogenesis}, - issn = {1088-9051, 1549-5469}, - url = {http://genome.cshlp.org/content/early/2016/09/20/gr.208926.116}, - doi = {10.1101/gr.208926.116}, - abstract = {An international, peer-reviewed genome sciences journal featuring outstanding original research that offers novel insights into the biology of all organisms}, - language = {en}, - urldate = {2016-10-17}, - journal = {Genome Research}, - author = {Mendoza-Parra, Marco-Antonio and Malysheva, Valeriya and Saleem, Mohamed Ashick Mohamed and Lieb, Michele and Godel, Aurelie and Gronemeyer, Hinrich}, - month = sep, - year = {2016}, - pmid = {27650846}, - pages = {gr.208926.116}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/AUZC6XII/Mendoza-Parra et al. - 2016 - Reconstructed cell fate-regulatory programs in ste.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/29H6XUNF/gr.208926.116.html:text/html} -} - @article{boeva_analysis_2016, title = {Analysis of {Genomic} {Sequence} {Motifs} for {Deciphering} {Transcription} {Factor} {Binding} and {Transcriptional} {Regulation} in {Eukaryotic} {Cells}}, url = {http://journal.frontiersin.org/article/10.3389/fgene.2016.00024/full}, doi = {10.3389/fgene.2016.00024}, abstract = {Eukaryotic genomes contain a variety of structured patterns: repetitive elements, binding sites of DNA and RNA associated proteins, splice sites, and so on. Often, these structured patterns can be formalized as motifs and described using a proper mathematical model such as position weight matrix and IUPAC consensus. Two key tasks are typically carried out for motifs in the context of the analysis of genomic sequences. These are: identification in a set of DNA regions of over-represented motifs from a particular motif database, and de novo discovery of over-represented motifs. Here we describe existing methodology to perform these two tasks for motifs characterizing transcription factor binding. When applied to the output of ChIP-seq and ChIP-exo experiments, or to promoter regions of co-modulated genes, motif analysis techniques allow for the prediction of transcription factor binding events and enable identification of transcriptional regulators and co-regulators. The usefulness of motif analysis is further exemplified in this review by how motif discovery improves peak calling in ChIP-seq and ChIP-exo experiments and, when coupled with information on gene expression, allows insights into physical mechanisms of transcriptional modulation.}, urldate = {2016-11-09}, journal = {Bioinformatics and Computational Biology}, author = {Boeva, Valentina}, year = {2016}, keywords = {Transcription Factors, Binding Sites, motif discovery, position-specific scoring matrices, regulation of gene transcription, ChIP-seq, binding motif models}, pages = {24}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/KDGW3PE5/Boeva - 2016 - Analysis of Genomic Sequence Motifs for Decipherin.pdf:application/pdf} } @article{kulakovskiy_deeper_2011, title = {A deeper look into transcription regulatory code by preferred pair distance templates for transcription factor binding sites}, volume = {27}, issn = {1367-4803, 1460-2059}, url = {http://bioinformatics.oxfordjournals.org/content/27/19/2621}, doi = {10.1093/bioinformatics/btr453}, abstract = {Motivation: Modern experimental methods provide substantial information on protein–DNA recognition. Studying arrangements of transcription factor binding sites (TFBSs) of interacting transcription factors (TFs) advances understanding of the transcription regulatory code. Results: We constructed binding motifs for TFs forming a complex with HIF-1α at the erythropoietin 3′-enhancer. Corresponding TFBSs were predicted in the segments around transcription start sites (TSSs) of all human genes. Using the genome-wide set of regulatory regions, we observed several strongly preferred distances between hypoxia-responsive element (HRE) and binding sites of a particular cofactor protein. The set of preferred distances was called as a preferred pair distance template (PPDT). PPDT dramatically depended on the TF and orientation of its binding sites relative to HRE. PPDT evaluated from the genome-wide set of regulatory sequences was used to detect significant PPDT-consistent binding site pairs in regulatory regions of hypoxia-responsive genes. We believe PPDT can help to reveal the layout of eukaryotic regulatory segments. Contact: ivan.kulakovskiy@gmail.com Supplementary information: Supplementary data are available at Bioinformatics online.}, language = {en}, number = {19}, urldate = {2016-11-25}, journal = {Bioinformatics}, author = {Kulakovskiy, I. V. and Belostotsky, A. A. and Kasianov, A. S. and Esipova, N. G. and Medvedeva, Y. A. and Eliseeva, I. A. and Makeev, V. J.}, month = oct, year = {2011}, pmid = {21852305}, pages = {2621--2624}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/VPI9SK28/Kulakovskiy et al. - 2011 - A deeper look into transcription regulatory code b.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/TSHP7AW7/2621.html:text/html} } @article{kulakovskiy_hocomoco:_2013, title = {{HOCOMOCO}: a comprehensive collection of human transcription factor binding sites models}, volume = {41}, issn = {0305-1048, 1362-4962}, shorttitle = {{HOCOMOCO}}, url = {http://nar.oxfordjournals.org/content/41/D1/D195}, doi = {10.1093/nar/gks1089}, abstract = {Transcription factor (TF) binding site (TFBS) models are crucial for computational reconstruction of transcription regulatory networks. In existing repositories, a TF often has several models (also called binding profiles or motifs), obtained from different experimental data. Having a single TFBS model for a TF is more pragmatic for practical applications. We show that integration of TFBS data from various types of experiments into a single model typically results in the improved model quality probably due to partial correction of source specific technique bias. We present the Homo sapiens comprehensive model collection (HOCOMOCO, http://autosome.ru/HOCOMOCO/, http://cbrc.kaust.edu.sa/hocomoco/) containing carefully hand-curated TFBS models constructed by integration of binding sequences obtained by both low- and high-throughput methods. To construct position weight matrices to represent these TFBS models, we used ChIPMunk software in four computational modes, including newly developed periodic positional prior mode associated with DNA helix pitch. We selected only one TFBS model per TF, unless there was a clear experimental evidence for two rather distinct TFBS models. We assigned a quality rating to each model. HOCOMOCO contains 426 systematically curated TFBS models for 401 human TFs, where 172 models are based on more than one data source.}, language = {en}, number = {D1}, urldate = {2016-11-25}, journal = {Nucleic Acids Research}, author = {Kulakovskiy, Ivan V. and Medvedeva, Yulia A. and Schaefer, Ulf and Kasianov, Artem S. and Vorontsov, Ilya E. and Bajic, Vladimir B. and Makeev, Vsevolod J.}, month = jan, year = {2013}, pmid = {23175603}, pages = {D195--D202}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4ZXU8QGZ/Kulakovskiy et al. - 2013 - HOCOMOCO a comprehensive collection of human tran.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UI3C8F8N/D195.html:text/html} } @article{kulakovskiy_hocomoco:_2016, title = {{HOCOMOCO}: expansion and enhancement of the collection of transcription factor binding sites models}, volume = {44}, issn = {0305-1048, 1362-4962}, shorttitle = {{HOCOMOCO}}, url = {http://nar.oxfordjournals.org/content/44/D1/D116}, doi = {10.1093/nar/gkv1249}, abstract = {Models of transcription factor (TF) binding sites provide a basis for a wide spectrum of studies in regulatory genomics, from reconstruction of regulatory networks to functional annotation of transcripts and sequence variants. While TFs may recognize different sequence patterns in different conditions, it is pragmatic to have a single generic model for each particular TF as a baseline for practical applications. Here we present the expanded and enhanced version of HOCOMOCO (http://hocomoco.autosome.ru and http://www.cbrc.kaust.edu.sa/hocomoco10), the collection of models of DNA patterns, recognized by transcription factors. HOCOMOCO now provides position weight matrix (PWM) models for binding sites of 601 human TFs and, in addition, PWMs for 396 mouse TFs. Furthermore, we introduce the largest up to date collection of dinucleotide PWM models for 86 (52) human (mouse) TFs. The update is based on the analysis of massive ChIP-Seq and HT-SELEX datasets, with the validation of the resulting models on in vivo data. To facilitate a practical application, all HOCOMOCO models are linked to gene and protein databases (Entrez Gene, HGNC, UniProt) and accompanied by precomputed score thresholds. Finally, we provide command-line tools for PWM and diPWM threshold estimation and motif finding in nucleotide sequences.}, language = {en}, number = {D1}, urldate = {2016-11-25}, journal = {Nucleic Acids Research}, author = {Kulakovskiy, Ivan V. and Vorontsov, Ilya E. and Yevshin, Ivan S. and Soboleva, Anastasiia V. and Kasianov, Artem S. and Ashoor, Haitham and Ba-alawi, Wail and Bajic, Vladimir B. and Medvedeva, Yulia A. and Kolpakov, Fedor A. and Makeev, Vsevolod J.}, month = jan, year = {2016}, pmid = {26586801}, pages = {D116--D125}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/2W77ZX4K/Kulakovskiy et al. - 2016 - HOCOMOCO expansion and enhancement of the collect.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/MZ3QRPWE/D116.html:text/html} } @article{kulakovskiy_deep_2010, title = {Deep and wide digging for binding motifs in {ChIP}-{Seq} data}, volume = {26}, issn = {1367-4803, 1460-2059}, url = {http://bioinformatics.oxfordjournals.org/content/26/20/2622}, doi = {10.1093/bioinformatics/btq488}, abstract = {Summary: ChIP-Seq data are a new challenge for motif discovery. Such a data typically consists of thousands of DNA segments with base-specific coverage values. We present a new version of our DNA motif discovery software ChIPMunk adapted for ChIP-Seq data. ChIPMunk is an iterative algorithm that combines greedy optimization with bootstrapping and uses coverage profiles as motif positional preferences. ChIPMunk does not require truncation of long DNA segments and it is practical for processing up to tens of thousands of data sequences. Comparison with traditional (MEME) or ChIP-Seq-oriented (HMS) motif discovery tools shows that ChIPMunk identifies the correct motifs with the same or better quality but works dramatically faster. Availability and implementation: ChIPMunk is freely available within the ru\_genetika Java package: http://line.imb.ac.ru/ChIPMunk. Web-based version is also available. Contact: ivan.kulakovskiy@gmail.com Supplementary information: Supplementary data are available at Bioinformatics online.}, language = {en}, number = {20}, urldate = {2016-11-25}, journal = {Bioinformatics}, author = {Kulakovskiy, I. V. and Boeva, V. A. and Favorov, A. V. and Makeev, V. J.}, month = oct, year = {2010}, pmid = {20736340}, pages = {2622--2623}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4IXGI69U/Kulakovskiy et al. - 2010 - Deep and wide digging for binding motifs in ChIP-S.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/FPC6UKKW/2622.html:text/html} } @article{boeva_exact_2007, title = {Exact p-value calculation for heterotypic clusters of regulatory motifs and its application in computational annotation of cis-regulatory modules}, volume = {2}, issn = {1748-7188}, url = {http://dx.doi.org/10.1186/1748-7188-2-13}, doi = {10.1186/1748-7188-2-13}, abstract = {cis-Regulatory modules (CRMs) of eukaryotic genes often contain multiple binding sites for transcription factors. The phenomenon that binding sites form clusters in CRMs is exploited in many algorithms to locate CRMs in a genome. This gives rise to the problem of calculating the statistical significance of the event that multiple sites, recognized by different factors, would be found simultaneously in a text of a fixed length. The main difficulty comes from overlapping occurrences of motifs. So far, no tools have been developed allowing the computation of p-values for simultaneous occurrences of different motifs which can overlap.}, urldate = {2016-11-30}, journal = {Algorithms for Molecular Biology}, author = {Boeva, Valentina and Clément, Julien and Régnier, Mireille and Roytberg, Mikhail A. and Makeev, Vsevolod J.}, year = {2007}, pages = {13}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/JGZCT7TD/Boeva et al. - 2007 - Exact p-value calculation for heterotypic clusters.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/8ZZ9BTCW/1748-7188-2-13.html:text/html} } @article{guo_high_2012, title = {High {Resolution} {Genome} {Wide} {Binding} {Event} {Finding} and {Motif} {Discovery} {Reveals} {Transcription} {Factor} {Spatial} {Binding} {Constraints}}, volume = {8}, issn = {1553-7358}, url = {http://journals.plos.org/ploscompbiol/article?id=10.1371/journal.pcbi.1002638}, doi = {10.1371/journal.pcbi.1002638}, - abstract = {Author Summary The letters in our genome spell words and phrases that control when each gene is activated. To understand how these words and phrases function in health and disease, we have developed a new computational method to determine what word positions in our genomic text are used by each genome regulatory protein, and how these active words are spaced relative to one another. Our method achieves exceptional spatial accuracy by integrating experimental data with the text of our genome to find the precise words that are regulated by each protein factor. Using this analysis we have discovered novel word spacings in the experimental data that suggest novel genome grammatical control constructs.}, - number = {8}, - urldate = {2016-11-30}, - journal = {PLOS Computational Biology}, - author = {Guo, Yuchun and Mahony, Shaun and Gifford, David K.}, - month = aug, - year = {2012}, - keywords = {Transcription Factors, Sequence motif analysis, Sequence alignment, Mammalian genomics, Genomic databases, Binding analysis, Cell binding assay, Cell binding}, - pages = {e1002638}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/QQ456JAQ/Guo et al. - 2012 - High Resolution Genome Wide Binding Event Finding .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/W83PTGJE/article.html:text/html} -} - -@article{starick_chip-exo_2015, - title = {{ChIP}-exo signal associated with {DNA}-binding motifs provides insight into the genomic binding of the glucocorticoid receptor and cooperating transcription factors}, - volume = {25}, - issn = {1088-9051, 1549-5469}, - url = {http://genome.cshlp.org/content/25/6/825}, - doi = {10.1101/gr.185157.114}, - abstract = {The classical DNA recognition sequence of the glucocorticoid receptor (GR) appears to be present at only a fraction of bound genomic regions. To identify sequences responsible for recruitment of this transcription factor (TF) to individual loci, we turned to the high-resolution ChIP-exo approach. We exploited this signal by determining footprint profiles of TF binding at single-base-pair resolution using ExoProfiler, a computational pipeline based on DNA binding motifs. When applied to our GR and the few available public ChIP-exo data sets, we find that ChIP-exo footprints are protein- and recognition sequence-specific signatures of genomic TF association. Furthermore, we show that ChIP-exo captures information about TFs other than the one directly targeted by the antibody in the ChIP procedure. Consequently, the shape of the ChIP-exo footprint can be used to discriminate between direct and indirect (tethering to other DNA-bound proteins) DNA association of GR. Together, our findings indicate that the absence of classical recognition sequences can be explained by direct GR binding to a broader spectrum of sequences than previously known, either as a homodimer or as a heterodimer binding together with a member of the ETS or TEAD families of TFs, or alternatively by indirect recruitment via FOX or STAT proteins. ChIP-exo footprints also bring structural insights and locate DNA:protein cross-link points that are compatible with crystal structures of the studied TFs. Overall, our generically applicable footprint-based approach uncovers new structural and functional insights into the diverse ways of genomic cooperation and association of TFs.}, - language = {en}, - number = {6}, - urldate = {2016-11-30}, - journal = {Genome Research}, - author = {Starick, Stephan R. and Ibn-Salem, Jonas and Jurk, Marcel and Hernandez, Céline and Love, Michael I. and Chung, Ho-Ryun and Vingron, Martin and Thomas-Chollier, Morgane and Meijsing, Sebastiaan H.}, - month = jun, - year = {2015}, - pmid = {25720775}, - pages = {825--835}, - file = {Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9FI2MFFE/825.html:text/html} + abstract = {Author Summary The letters in our genome spell words and phrases that control when each gene is activated. To understand how these words and phrases function in health and disease, we have developed a new computational method to determine what word positions in our genomic text are used by each genome regulatory protein, and how these active words are spaced relative to one another. Our method achieves exceptional spatial accuracy by integrating experimental data with the text of our genome to find the precise words that are regulated by each protein factor. Using this analysis we have discovered novel word spacings in the experimental data that suggest novel genome grammatical control constructs.}, + number = {8}, + urldate = {2016-11-30}, + journal = {PLOS Computational Biology}, + author = {Guo, Yuchun and Mahony, Shaun and Gifford, David K.}, + month = aug, + year = {2012}, + keywords = {Transcription Factors, Sequence motif analysis, Sequence alignment, Mammalian genomics, Genomic databases, Binding analysis, Cell binding assay, Cell binding}, + pages = {e1002638}, + file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/QQ456JAQ/Guo et al. - 2012 - High Resolution Genome Wide Binding Event Finding .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/W83PTGJE/article.html:text/html} } -@article{starick_chip-exo_2015-1, +@article{starick_chip-exo_2015, title = {{ChIP}-exo signal associated with {DNA}-binding motifs provides insight into the genomic binding of the glucocorticoid receptor and cooperating transcription factors}, volume = {25}, issn = {1088-9051, 1549-5469}, url = {http://genome.cshlp.org/content/25/6/825}, doi = {10.1101/gr.185157.114}, abstract = {An international, peer-reviewed genome sciences journal featuring outstanding original research that offers novel insights into the biology of all organisms}, language = {en}, number = {6}, urldate = {2016-11-30}, journal = {Genome Research}, author = {Starick, Stephan R. and Ibn-Salem, Jonas and Jurk, Marcel and Hernandez, Céline and Love, Michael I. and Chung, Ho-Ryun and Vingron, Martin and Thomas-Chollier, Morgane and Meijsing, Sebastiaan H.}, month = jun, year = {2015}, pmid = {25720775}, pages = {825--835}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/DBUJKDFD/Starick et al. - 2015 - ChIP-exo signal associated with DNA-binding motifs.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/89CTWNPR/825.full.html:text/html} } -@article{starick_chip-exo_2015-2, - title = {{ChIP}-exo signal associated with {DNA}-binding motifs provides insight into the genomic binding of the glucocorticoid receptor and cooperating transcription factors}, - volume = {25}, - issn = {1088-9051, 1549-5469}, - url = {http://genome.cshlp.org/content/25/6/825}, - doi = {10.1101/gr.185157.114}, - abstract = {The classical DNA recognition sequence of the glucocorticoid receptor (GR) appears to be present at only a fraction of bound genomic regions. To identify sequences responsible for recruitment of this transcription factor (TF) to individual loci, we turned to the high-resolution ChIP-exo approach. We exploited this signal by determining footprint profiles of TF binding at single-base-pair resolution using ExoProfiler, a computational pipeline based on DNA binding motifs. When applied to our GR and the few available public ChIP-exo data sets, we find that ChIP-exo footprints are protein- and recognition sequence-specific signatures of genomic TF association. Furthermore, we show that ChIP-exo captures information about TFs other than the one directly targeted by the antibody in the ChIP procedure. Consequently, the shape of the ChIP-exo footprint can be used to discriminate between direct and indirect (tethering to other DNA-bound proteins) DNA association of GR. Together, our findings indicate that the absence of classical recognition sequences can be explained by direct GR binding to a broader spectrum of sequences than previously known, either as a homodimer or as a heterodimer binding together with a member of the ETS or TEAD families of TFs, or alternatively by indirect recruitment via FOX or STAT proteins. ChIP-exo footprints also bring structural insights and locate DNA:protein cross-link points that are compatible with crystal structures of the studied TFs. Overall, our generically applicable footprint-based approach uncovers new structural and functional insights into the diverse ways of genomic cooperation and association of TFs.}, - language = {en}, - number = {6}, - urldate = {2016-11-30}, - journal = {Genome Research}, - author = {Starick, Stephan R. and Ibn-Salem, Jonas and Jurk, Marcel and Hernandez, Céline and Love, Michael I. and Chung, Ho-Ryun and Vingron, Martin and Thomas-Chollier, Morgane and Meijsing, Sebastiaan H.}, - month = jun, - year = {2015}, - pmid = {25720775}, - pages = {825--835}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/NC23VPZP/Starick et al. - 2015 - ChIP-exo signal associated with DNA-binding motifs.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/BVCUVC2R/825.html:text/html} -} - @article{jonkers_getting_2015, title = {Getting up to speed with transcription elongation by {RNA} polymerase {II}}, volume = {16}, copyright = {© 2015 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {1471-0072}, url = {http://www.nature.com/nrm/journal/v16/n3/full/nrm3953.html}, doi = {10.1038/nrm3953}, abstract = {Recent advances in sequencing techniques that measure nascent transcripts and that reveal the positioning of RNA polymerase II (Pol II) have shown that the pausing of Pol II in promoter-proximal regions and its release to initiate a phase of productive elongation are key steps in transcription regulation. Moreover, after the release of Pol II from the promoter-proximal region, elongation rates are highly dynamic throughout the transcription of a gene, and vary on a gene-by-gene basis. Interestingly, Pol II elongation rates affect co-transcriptional processes such as splicing, termination and genome stability. Increasing numbers of factors and regulatory mechanisms have been associated with the steps of transcription elongation by Pol II, revealing that elongation is a highly complex process. Elongation is thus now recognized as a key phase in the regulation of transcription by Pol II.}, language = {en}, number = {3}, urldate = {2016-12-16}, journal = {Nature Reviews Molecular Cell Biology}, author = {Jonkers, Iris and Lis, John T.}, month = mar, year = {2015}, keywords = {transcriptomics, transcription}, pages = {167--177}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/D6XBEGWR/Jonkers and Lis - 2015 - Getting up to speed with transcription elongation .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UCEUN62Q/nrm3953.html:text/html} } @article{heinz_selection_2015, title = {The selection and function of cell type-specific enhancers}, volume = {16}, copyright = {© 2015 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {1471-0072}, url = {http://www.nature.com/nrm/journal/v16/n3/full/nrm3949.html}, doi = {10.1038/nrm3949}, abstract = {The human body contains several hundred cell types, all of which share the same genome. In metazoans, much of the regulatory code that drives cell type-specific gene expression is located in distal elements called enhancers. Although mammalian genomes contain millions of potential enhancers, only a small subset of them is active in a given cell type. Cell type-specific enhancer selection involves the binding of lineage-determining transcription factors that prime enhancers. Signal-dependent transcription factors bind to primed enhancers, which enables these broadly expressed factors to regulate gene expression in a cell type-specific manner. The expression of genes that specify cell type identity and function is associated with densely spaced clusters of active enhancers known as super-enhancers. The functions of enhancers and super-enhancers are influenced by, and affect, higher-order genomic organization.}, language = {en}, number = {3}, urldate = {2016-12-16}, journal = {Nature Reviews Molecular Cell Biology}, author = {Heinz, Sven and Romanoski, Casey E. and Benner, Christopher and Glass, Christopher K.}, month = mar, year = {2015}, keywords = {Transcriptional regulatory elements, Transcription Factors, transcription}, pages = {144--154}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/2XKV3K9Z/Heinz et al. - 2015 - The selection and function of cell type-specific e.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/PB9S77UU/nrm3949.html:text/html} } @article{mavrich_barrier_2008, title = {A barrier nucleosome model for statistical positioning of nucleosomes throughout the yeast genome}, volume = {18}, issn = {1088-9051, 1549-5469}, url = {http://genome.cshlp.org/content/18/7/1073}, doi = {10.1101/gr.078261.108}, abstract = {Most nucleosomes are well-organized at the 5′ ends of S. cerevisiae genes where “−1” and “+1” nucleosomes bracket a nucleosome-free promoter region (NFR). How nucleosomal organization is specified by the genome is less clear. Here we establish and inter-relate rules governing genomic nucleosome organization by sequencing DNA from more than one million immunopurified S. cerevisiae nucleosomes (displayed at http://atlas.bx.psu.edu/). Evidence is presented that the organization of nucleosomes throughout genes is largely a consequence of statistical packing principles. The genomic sequence specifies the location of the −1 and +1 nucleosomes. The +1 nucleosome forms a barrier against which nucleosomes are packed, resulting in uniform positioning, which decays at farther distances from the barrier. We present evidence for a novel 3′ NFR that is present at {\textgreater}95\% of all genes. 3′ NFRs may be important for transcription termination and anti-sense initiation. We present a high-resolution genome-wide map of TFIIB locations that implicates 3′ NFRs in gene looping.}, language = {en}, number = {7}, urldate = {2016-12-21}, journal = {Genome Research}, author = {Mavrich, Travis N. and Ioshikhes, Ilya P. and Venters, Bryan J. and Jiang, Cizhong and Tomsho, Lynn P. and Qi, Ji and Schuster, Stephan C. and Albert, Istvan and Pugh, B. Franklin}, month = jul, year = {2008}, pmid = {18550805}, pages = {1073--1083}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Z3E3FSWP/Mavrich et al. - 2008 - A barrier nucleosome model for statistical positio.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9HHGETWS/1073.html:text/html} } @article{wasson_ensemble_2009, title = {An ensemble model of competitive multi-factor binding of the genome}, volume = {19}, issn = {1088-9051, 1549-5469}, url = {http://genome.cshlp.org/content/19/11/2101}, doi = {10.1101/gr.093450.109}, abstract = {Hundreds of different factors adorn the eukaryotic genome, binding to it in large number. These DNA binding factors (DBFs) include nucleosomes, transcription factors (TFs), and other proteins and protein complexes, such as the origin recognition complex (ORC). DBFs compete with one another for binding along the genome, yet many current models of genome binding do not consider different types of DBFs together simultaneously. Additionally, binding is a stochastic process that results in a continuum of binding probabilities at any position along the genome, but many current models tend to consider positions as being either binding sites or not. Here, we present a model that allows a multitude of DBFs, each at different concentrations, to compete with one another for binding sites along the genome. The result is an “occupancy profile,” a probabilistic description of the DNA occupancy of each factor at each position. We implement our model efficiently as the software package COMPETE. We demonstrate genome-wide and at specific loci how modeling nucleosome binding alters TF binding, and vice versa, and illustrate how factor concentration influences binding occupancy. Binding cooperativity between nearby TFs arises implicitly via mutual competition with nucleosomes. Our method applies not only to TFs, but also recapitulates known occupancy profiles of a well-studied replication origin with and without ORC binding. Importantly, the sequence preferences our model takes as input are derived from in vitro experiments. This ensures that the calculated occupancy profiles are the result of the forces of competition represented explicitly in our model and the inherent sequence affinities of the constituent DBFs.}, language = {en}, number = {11}, urldate = {2016-12-21}, journal = {Genome Research}, author = {Wasson, Todd and Hartemink, Alexander J.}, month = nov, year = {2009}, pmid = {19720867}, pages = {2101--2112}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/T8QQ3CRU/Wasson and Hartemink - 2009 - An ensemble model of competitive multi-factor bind.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/B2RHGVV5/2101.html:text/html} } @book{mcginty_robert_k._and_tan_song_fundamentals_2014, address = {New York}, edition = {2014}, title = {Fundamentals of {Chromatin}, chapter 1 {Histone}, {Nucleosomes} and {Chromatin} {Structure}}, isbn = {978-1-4614-8623-7}, url = {http://www.springer.com/biomed/human+genetics/book/978-1-4614-8623-7}, abstract = {Chromatin is the combination of \{DNA\} and proteins that make up the genetic material of chromosomes. It is essential for packaging \{DNA\}, regulation of gene expression, \{DNA\} replication and repair. The audience for this book includes ...}, publisher = {Jerry L. Workman and Susan M. Abmayr}, author = {{McGinty Robert K. and Tan Song}}, year = {2014} } -@book{noauthor_notitle_nodate-1 -} - -@book{noauthor_notitle_nodate-2 -} - -@incollection{robert_k._mcginty_fundamentals_nodate, - title = {Fundamentals of {Chromatin}}, - author = {{Robert K. McGinty}} -} - -@article{lee_initiation_2005, - title = {The initiation of liver development is dependent on {Foxa} transcription factors}, - volume = {435}, - copyright = {© 2005 Nature Publishing Group}, - issn = {0028-0836}, - url = {http://www.nature.com/nature/journal/v435/n7044/full/nature03649.html}, - doi = {10.1038/nature03649}, - abstract = {The specification of the vertebrate liver is thought to occur in a two-step process, beginning with the establishment of competence within the foregut endoderm for responding to organ-specific signals, followed by the induction of liver-specific genes. On the basis of expression and in vitro studies, it has been proposed that the Foxa transcription factors establish competence by opening compacted chromatin structures within liver-specific target genes. Here we show that Foxa1 and Foxa2 (forkhead box proteins A1 and A2) are required in concert for hepatic specification in mouse. In embryos deficient for both genes in the foregut endoderm, no liver bud is evident and expression of the hepatoblast marker alpha-fetoprotein (Afp) is lost. Furthermore, Foxa1/Foxa2-deficient endoderm cultured in the presence of exogenous fibroblast growth factor 2 (FGF2) fails to initiate expression of the liver markers albumin and transthyretin. Thus, Foxa1 and Foxa2 are required for the establishment of competence within the foregut endoderm and the onset of hepatogenesis.}, - language = {en}, - number = {7044}, - urldate = {2016-12-21}, - journal = {Nature}, - author = {Lee, Catherine S. and Friedman, Joshua R. and Fulmer, James T. and Kaestner, Klaus H.}, - month = jun, - year = {2005}, - pages = {944--947}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/SMGD4VAC/Lee et al. - 2005 - The initiation of liver development is dependent o.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/76XXCRTD/nature03649.html:text/html} -} - -@article{sekiya_direct_2011, - title = {Direct conversion of mouse fibroblasts to hepatocyte-like cells by defined factors}, - volume = {475}, - copyright = {© 2011 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, - issn = {0028-0836}, - url = {http://www.nature.com/nature/journal/v475/n7356/full/nature10263.html}, - doi = {10.1038/nature10263}, - abstract = {The location and timing of cellular differentiation must be stringently controlled for proper organ formation. Normally, hepatocytes differentiate from hepatic progenitor cells to form the liver during development. However, previous studies have shown that the hepatic program can also be activated in non-hepatic lineage cells after exposure to particular stimuli or fusion with hepatocytes. These unexpected findings suggest that factors critical to hepatocyte differentiation exist and become activated to induce hepatocyte-specific properties in different cell types. Here, by screening the effects of twelve candidate factors, we identify three specific combinations of two transcription factors, comprising Hnf4α plus Foxa1, Foxa2 or Foxa3, that can convert mouse embryonic and adult fibroblasts into cells that closely resemble hepatocytes in vitro. The induced hepatocyte-like (iHep) cells have multiple hepatocyte-specific features and reconstitute damaged hepatic tissues after transplantation. The generation of iHep cells may provide insights into the molecular nature of hepatocyte differentiation and potential therapies for liver diseases.}, - language = {en}, - number = {7356}, - urldate = {2016-12-21}, - journal = {Nature}, - author = {Sekiya, Sayaka and Suzuki, Atsushi}, - month = jul, - year = {2011}, - keywords = {biotechnology, medical research}, - pages = {390--393}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/WPKFXHX8/Sekiya and Suzuki - 2011 - Direct conversion of mouse fibroblasts to hepatocy.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/QBBU897A/nature10263.html:text/html} -} - @article{cirillo_opening_2002, title = {Opening of {Compacted} {Chromatin} by {Early} {Developmental} {Transcription} {Factors} {HNF}3 ({FoxA}) and {GATA}-4}, volume = {9}, issn = {1097-2765}, url = {http://www.sciencedirect.com/science/article/pii/S1097276502004598}, doi = {10.1016/S1097-2765(02)00459-8}, abstract = {The transcription factors HNF3 (FoxA) and GATA-4 are the earliest known to bind the albumin gene enhancer in liver precursor cells in embryos. To understand how they access sites in silent chromatin, we assembled nucleosome arrays containing albumin enhancer sequences and compacted them with linker histone. HNF3 and GATA-4, but not NF-1, C/EBP, and GAL4-AH, bound their sites in compacted chromatin and opened the local nucleosomal domain in the absence of ATP-dependent enzymes. The ability of HNF3 to open chromatin is mediated by a high affinity DNA binding site and by the C-terminal domain of the protein, which binds histones H3 and H4. Thus, factors that potentiate transcription in development are inherently capable of initiating chromatin opening events.}, number = {2}, urldate = {2016-12-21}, journal = {Molecular Cell}, author = {Cirillo, Lisa Ann and Lin, Frank Robert and Cuesta, Isabel and Friedman, Dara and Jarnik, Michal and Zaret, Kenneth S}, month = feb, year = {2002}, pages = {279--289}, file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ZWHQ5CF9/Cirillo et al. - 2002 - Opening of Compacted Chromatin by Early Developmen.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ZXQVJ2PE/S1097276502004598.html:text/html} } @article{cirillo_early_1999, title = {An {Early} {Developmental} {Transcription} {Factor} {Complex} that {Is} {More} {Stable} on {Nucleosome} {Core} {Particles} {Than} on {Free} {DNA}}, volume = {4}, issn = {1097-2765}, url = {http://www.sciencedirect.com/science/article/pii/S1097276500802257}, doi = {10.1016/S1097-2765(00)80225-7}, abstract = {In vivo footprinting studies have shown that transcription factor binding sites for HNF3 and GATA-4 are occupied on the albumin gene enhancer in embryonic endoderm, prior to the developmental activation of liver gene transcription. We have investigated how these factors can stably occupy silent chromatin. Remarkably, we find that HNF3, but not GATA-4 or a GAL4 control protein, binds far more stably to nucleosome core particles than to free DNA. In the presence of HNF3, GATA-4 binds stably to an HNF3-positioned nucleosome. Histone acetylation does not affect HNF3 binding. This is evidence for stable nucleosome binding by a transcription factor and shows that a winged helix protein is sufficient to initiate the assembly of an enhancer complex on nonacetylated nucleosomes.}, number = {6}, urldate = {2016-12-21}, journal = {Molecular Cell}, author = {Cirillo, Lisa Ann and Zaret, Kenneth S}, month = dec, year = {1999}, pages = {961--969}, file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/P56D6XMZ/Cirillo and Zaret - 1999 - An Early Developmental Transcription Factor Comple.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XI82F8KX/S1097276500802257.html:text/html} } -@article{sekiya_direct_2011-1, +@article{sekiya_direct_2011, title = {Direct conversion of mouse fibroblasts to hepatocyte-like cells by defined factors}, volume = {475}, copyright = {© 2011 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {0028-0836}, url = {http://www.nature.com/nature/journal/v475/n7356/abs/nature10263.html}, doi = {10.1038/nature10263}, abstract = {The location and timing of cellular differentiation must be stringently controlled for proper organ formation. Normally, hepatocytes differentiate from hepatic progenitor cells to form the liver during development. However, previous studies have shown that the hepatic program can also be activated in non-hepatic lineage cells after exposure to particular stimuli or fusion with hepatocytes. These unexpected findings suggest that factors critical to hepatocyte differentiation exist and become activated to induce hepatocyte-specific properties in different cell types. Here, by screening the effects of twelve candidate factors, we identify three specific combinations of two transcription factors, comprising Hnf4α plus Foxa1, Foxa2 or Foxa3, that can convert mouse embryonic and adult fibroblasts into cells that closely resemble hepatocytes in vitro. The induced hepatocyte-like (iHep) cells have multiple hepatocyte-specific features and reconstitute damaged hepatic tissues after transplantation. The generation of iHep cells may provide insights into the molecular nature of hepatocyte differentiation and potential therapies for liver diseases.}, language = {en}, number = {7356}, urldate = {2016-12-21}, journal = {Nature}, author = {Sekiya, Sayaka and Suzuki, Atsushi}, month = jul, year = {2011}, keywords = {biotechnology, medical research}, pages = {390--393}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/QXVHEIQK/Sekiya and Suzuki - 2011 - Direct conversion of mouse fibroblasts to hepatocy.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/VXXU93UV/nature10263.html:text/html} } @article{huang_induction_2011, title = {Induction of functional hepatocyte-like cells from mouse fibroblasts by defined factors}, volume = {475}, copyright = {© 2011 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {0028-0836}, url = {http://www.nature.com/nature/journal/v475/n7356/full/nature10116.html%3Fmessage-global%3Dremove}, doi = {10.1038/nature10116}, abstract = {The generation of functional hepatocytes independent of donor liver organs is of great therapeutic interest with regard to regenerative medicine and possible cures for liver disease. Induced hepatic differentiation has been achieved previously using embryonic stem cells or induced pluripotent stem cells. Particularly, hepatocytes generated from a patient/'s own induced pluripotent stem cells could theoretically avoid immunological rejection. However, the induction of hepatocytes from induced pluripotent stem cells is a complicated process that would probably be replaced with the arrival of improved technology. Overexpression of lineage-specific transcription factors directly converts terminally differentiated cells into some other lineages, including neurons, cardiomyocytes and blood progenitors; however, it remains unclear whether these lineage-converted cells could repair damaged tissues in vivo. Here we demonstrate the direct induction of functional hepatocyte-like (iHep) cells from mouse tail-tip fibroblasts by transduction of Gata4, Hnf1α and Foxa3, and inactivation of p19Arf. iHep cells show typical epithelial morphology, express hepatic genes and acquire hepatocyte functions. Notably, transplanted iHep cells repopulate the livers of fumarylacetoacetate-hydrolase-deficient (Fah-/-) mice and rescue almost half of recipients from death by restoring liver functions. Our study provides a novel strategy to generate functional hepatocyte-like cells for the purpose of liver engineering and regenerative medicine.}, language = {en}, number = {7356}, urldate = {2016-12-21}, journal = {Nature}, author = {Huang, Pengyu and He, Zhiying and Ji, Shuyi and Sun, Huawang and Xiang, Dao and Liu, Changcheng and Hu, Yiping and Wang, Xin and Hui, Lijian}, month = jul, year = {2011}, keywords = {stem cells, Cell Biology}, pages = {386--389}, file = {Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/G2NSW4FG/nature10116.html:text/html} } @article{lawrence_expectation_1990, title = {An expectation maximization ({EM}) algorithm for the identification and characterization of common sites in unaligned biopolymer sequences}, volume = {7}, issn = {0887-3585}, doi = {10.1002/prot.340070105}, abstract = {Statistical methodology for the identification and characterization of protein binding sites in a set of unaligned DNA fragments is presented. Each sequence must contain at least one common site. No alignment of the sites is required. Instead, the uncertainty in the location of the sites is handled by employing the missing information principle to develop an "expectation maximization" (EM) algorithm. This approach allows for the simultaneous identification of the sites and characterization of the binding motifs. The reliability of the algorithm increases with the number of fragments, but the computations increase only linearly. The method is illustrated with an example, using known cyclic adenosine monophosphate receptor protein (CRP) binding sites. The final motif is utilized in a search for undiscovered CRP binding sites.}, language = {eng}, number = {1}, journal = {Proteins}, author = {Lawrence, C. E. and Reilly, A. A.}, year = {1990}, pmid = {2184437}, keywords = {Algorithms, DNA-binding proteins, Base Sequence, Binding Sites, Escherichia coli, Information Systems, Molecular Sequence Data, Nucleic Acid Conformation, Receptors, Cyclic AMP, Statistics as Topic}, pages = {41--51}, file = {Lawrence90.pdf:/home/romaingroux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Lawrence90.pdf:application/pdf} } @article{schneider_sequence_1990, title = {Sequence logos: a new way to display consensus sequences}, volume = {18}, issn = {0305-1048, 1362-4962}, shorttitle = {Sequence logos}, url = {http://nar.oxfordjournals.org/content/18/20/6097}, doi = {10.1093/nar/18.20.6097}, abstract = {A graphical method is presented for displaying the patterns in a set of aligned sequences. The characters representing the sequence are stacked on top of each other for each position in the aligned sequences. The height of each letter is made proportional to Its frequency, and the letters are sorted so the most common one is on top. The height of the entire stack is then adjusted to signify the information content of the sequences at that position. From these ‘sequence logos’, one can determine not only the consensus sequence but also the relative frequency of bases and the information content (measured In bits) at every position in a site or sequence. The logo displays both significant residues and subtle sequence patterns.}, language = {en}, number = {20}, urldate = {2016-12-23}, journal = {Nucleic Acids Research}, author = {Schneider, Thomas D. and Stephens, R. Michael}, month = oct, year = {1990}, pmid = {2172928}, pages = {6097--6100}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/F4MJBIVJ/Schneider and Stephens - 1990 - Sequence logos a new way to display consensus seq.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XPZMIRWU/6097.html:text/html} } @article{stormo_dna_2000, title = {{DNA} binding sites: representation and discovery}, volume = {16}, issn = {1367-4803, 1460-2059}, shorttitle = {{DNA} binding sites}, url = {http://bioinformatics.oxfordjournals.org/content/16/1/16}, doi = {10.1093/bioinformatics/16.1.16}, language = {en}, number = {1}, urldate = {2016-12-27}, journal = {Bioinformatics}, author = {Stormo, Gary D.}, month = jan, year = {2000}, pmid = {10812473}, pages = {16--23}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/BWUSTADT/Stormo - 2000 - DNA binding sites representation and discovery.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/DEDTEW2G/16.html:text/html} } @article{whitington_inferring_2011, title = {Inferring transcription factor complexes from {ChIP}-seq data}, volume = {39}, issn = {0305-1048, 1362-4962}, url = {http://nar.oxfordjournals.org/content/39/15/e98}, doi = {10.1093/nar/gkr341}, abstract = {Chromatin immunoprecipitation followed by high-throughput sequencing (ChIP-seq) allows researchers to determine the genome-wide binding locations of individual transcription factors (TFs) at high resolution. This information can be interrogated to study various aspects of TF behaviour, including the mechanisms that control TF binding. Physical interaction between TFs comprises one important aspect of TF binding in eukaryotes, mediating tissue-specific gene expression. We have developed an algorithm, spaced motif analysis (SpaMo), which is able to infer physical interactions between the given TF and TFs bound at neighbouring sites at the DNA interface. The algorithm predicts TF interactions in half of the ChIP-seq data sets we test, with the majority of these predictions supported by direct evidence from the literature or evidence of homodimerization. High resolution motif spacing information obtained by this method can facilitate an improved understanding of individual TF complex structures. SpaMo can assist researchers in extracting maximum information relating to binding mechanisms from their TF ChIP-seq data. SpaMo is available for download and interactive use as part of the MEME Suite (http://meme.nbcr.net).}, language = {en}, number = {15}, urldate = {2016-12-28}, journal = {Nucleic Acids Research}, author = {Whitington, Tom and Frith, Martin C. and Johnson, James and Bailey, Timothy L.}, month = aug, year = {2011}, pmid = {21602262}, pages = {e98--e98}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/BPH3Q5R4/Whitington et al. - 2011 - Inferring transcription factor complexes from ChIP.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/TZPCKMJ3/e98.html:text/html} } @article{wolberger_multiprotein-dna_1999, title = {Multiprotein-{Dna} {Complexes} in {Transcriptional} {Regulation}}, volume = {28}, url = {http://dx.doi.org/10.1146/annurev.biophys.28.1.29}, doi = {10.1146/annurev.biophys.28.1.29}, abstract = {Transcription in eukaryotes is frequently regulated by a mechanism termed combinatorial control, whereby several different proteins must bind DNA in concert to achieve appropriate regulation of the downstream gene. X-ray crystallographic studies of multiprotein complexes bound to DNA have been carried out to investigate the molecular determinants of complex assembly and DNA binding. This work has provided important insights into the specific protein-protein and protein-DNA interactions that govern the assembly of multiprotein regulatory complexes. The results of these studies are reviewed here, and the general insights into the mechanism of combinatorial gene regulation are discussed.}, number = {1}, urldate = {2016-12-28}, journal = {Annual Review of Biophysics and Biomolecular Structure}, author = {Wolberger, Cynthia}, year = {1999}, pmid = {10410794}, keywords = {Gene regulation, transcription, protein-DNA interactions, crystal structure, combinatorial control}, pages = {29--56}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UBG5A8J8/Wolberger - 1999 - Multiprotein-Dna Complexes in Transcriptional Regu.pdf:application/pdf} } @article{ravasi_atlas_2010, title = {An {Atlas} of {Combinatorial} {Transcriptional} {Regulation} in {Mouse} and {Man}}, volume = {140}, issn = {0092-8674}, url = {http://www.sciencedirect.com/science/article/pii/S0092867410000796}, doi = {10.1016/j.cell.2010.01.044}, abstract = {Summary Combinatorial interactions among transcription factors are critical to directing tissue-specific gene expression. To build a global atlas of these combinations, we have screened for physical interactions among the majority of human and mouse DNA-binding transcription factors (TFs). The complete networks contain 762 human and 877 mouse interactions. Analysis of the networks reveals that highly connected TFs are broadly expressed across tissues, and that roughly half of the measured interactions are conserved between mouse and human. The data highlight the importance of TF combinations for determining cell fate, and they lead to the identification of a SMAD3/FLI1 complex expressed during development of immunity. The availability of large TF combinatorial networks in both human and mouse will provide many opportunities to study gene regulation, tissue differentiation, and mammalian evolution.}, number = {5}, urldate = {2016-12-28}, journal = {Cell}, author = {Ravasi, Timothy and Suzuki, Harukazu and Cannistraci, Carlo Vittorio and Katayama, Shintaro and Bajic, Vladimir B. and Tan, Kai and Akalin, Altuna and Schmeier, Sebastian and Kanamori-Katayama, Mutsumi and Bertin, Nicolas and Carninci, Piero and Daub, Carsten O. and Forrest, Alistair R. R. and Gough, Julian and Grimmond, Sean and Han, Jung-Hoon and Hashimoto, Takehiro and Hide, Winston and Hofmann, Oliver and Kamburov, Atanas and Kaur, Mandeep and Kawaji, Hideya and Kubosaki, Atsutaka and Lassmann, Timo and van Nimwegen, Erik and MacPherson, Cameron Ross and Ogawa, Chihiro and Radovanovic, Aleksandar and Schwartz, Ariel and Teasdale, Rohan D. and Tegnér, Jesper and Lenhard, Boris and Teichmann, Sarah A. and Arakawa, Takahiro and Ninomiya, Noriko and Murakami, Kayoko and Tagami, Michihira and Fukuda, Shiro and Imamura, Kengo and Kai, Chikatoshi and Ishihara, Ryoko and Kitazume, Yayoi and Kawai, Jun and Hume, David A. and Ideker, Trey and Hayashizaki, Yoshihide}, month = mar, year = {2010}, keywords = {DNA}, pages = {744--752}, file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/SHBZTQ2U/Ravasi et al. - 2010 - An Atlas of Combinatorial Transcriptional Regulati.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ZEKZPIRS/S0092867410000796.html:text/html} } @book{marsland_machine_2015, address = {Boca Raton}, edition = {Second Edition}, title = {Machine {Learning}, {An} algorithmic {Perspective}, {Chapter} 3 {Neurons}, {Neural} {Network} and {Linear} {Discriminants}}, isbn = {978-1-4398-8921-3}, url = {https://www.crcpress.com/Machine-Learning-An-Algorithmic-Perspective/Marsland/p/book/9781439889213}, publisher = {CRC Press}, author = {Marsland, Stephen}, year = {2015} } @article{hertz_identification_1990, title = {Identification of consensus patterns in unaligned {DNA} sequences known to be functionally related}, volume = {6}, issn = {0266-7061}, abstract = {We have developed a method for identifying consensus patterns in a set of unaligned DNA sequences known to bind a common protein or to have some other common biochemical function. The method is based on a matrix representation of binding site patterns. Each row of the matrix represents one of the four possible bases, each column represents one of the positions of the binding site and each element is determined by the frequency the indicated base occurs at the indicated position. The goal of the method is to find the most significant matrix--i.e. the one with the lowest probability of occurring by chance--out of all the matrices that can be formed from the set of related sequences. The reliability of the method improves with the number of sequences, while the time required increases only linearly with the number of sequences. To test this method, we analysed 11 DNA sequences containing promoters regulated by the Escherichia coli LexA protein. The matrices we found were consistent with the known consensus sequence, and could distinguish the generally accepted LexA binding sites from other DNA sequences.}, language = {eng}, number = {2}, journal = {Computer applications in the biosciences: CABIOS}, author = {Hertz, G. Z. and Hartzell, G. W. and Stormo, G. D.}, month = apr, year = {1990}, pmid = {2193692}, keywords = {DNA, Algorithms, Base Sequence, Binding Sites, Escherichia coli, Molecular Sequence Data, Bacterial Proteins, DNA, Bacterial, Genes, Bacterial, Pattern Recognition, Automated, Serine Endopeptidases, Software}, pages = {81--92}, file = {Hertz90.pdf:/home/romaingroux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Hertz90.pdf:application/pdf} } @article{shi_transcriptional_1991, title = {Transcriptional repression by {YY}1, a human {GLI}-{Krüippel}-related protein, and relief of repression by adenovirus {E}1A protein}, volume = {67}, issn = {0092-8674}, url = {http://www.sciencedirect.com/science/article/pii/0092867491901896}, doi = {10.1016/0092-8674(91)90189-6}, abstract = {A sequence within the transcription control region of the adeno-associated virus P5 promoter has been shown to mediate transcriptional activation by the adenovirus E1A protein. We report here that this same element mediates transcriptional repression in the abaence of E1A. Two cellular proteins have been found to bind to overlapping regions within this sequence element. One of these proteins, YY1, is responsible for the repression. E1A relieves repression exerted by YY1 and further activates transcription through its binding site. A YYl-specific cDNA has been isolated. Its sequence reveals YY1 to be a zinc finger protein that belongs to the GLI-Krüppel gene family. The product of the cDNA binds to YY1 sites. When fused to the GAL4 DNA-binding domain, it is capable of repressing transcription directed by a promoter that contains GAL4- binding sites, and E1A proteins can relieve the repression and activate transcription through the fusion protein.}, number = {2}, urldate = {2017-01-04}, journal = {Cell}, author = {Shi, Yang and Seto, Edward and Chang, Long-Sheng and Shenk, Thomas}, month = oct, year = {1991}, pages = {377--388}, file = {ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RSE2UKDF/0092867491901896.html:text/html;Shi et al 1991.pdf:/home/romaingroux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RSE2UKDF/Shi et al 1991.pdf:application/pdf} } -@article{schones_dynamic_2008-1, +@article{schones_dynamic_2008, title = {Dynamic {Regulation} of {Nucleosome} {Positioning} in the {Human} {Genome}}, volume = {132}, issn = {0092-8674}, url = {http://www.sciencedirect.com/science/article/pii/S0092867408002705}, doi = {10.1016/j.cell.2008.02.022}, abstract = {Summary The positioning of nucleosomes with respect to DNA plays an important role in regulating transcription. However, nucleosome mapping has been performed for only limited genomic regions in humans. We have generated genome-wide maps of nucleosome positions in both resting and activated human CD4+ T cells by direct sequencing of nucleosome ends using the Solexa high-throughput sequencing technique. We find that nucleosome phasing relative to the transcription start sites is directly correlated to RNA polymerase II (Pol II) binding. Furthermore, the first nucleosome downstream of a start site exhibits differential positioning in active and silent genes. TCR signaling induces extensive nucleosome reorganization in promoters and enhancers to allow transcriptional activation or repression. Our results suggest that H2A.Z-containing and modified nucleosomes are preferentially lost from the −1 nucleosome position. Our data provide a comprehensive view of the nucleosome landscape and its dynamic regulation in the human genome.}, number = {5}, urldate = {2017-01-05}, journal = {Cell}, author = {Schones, Dustin E. and Cui, Kairong and Cuddapah, Suresh and Roh, Tae-Young and Barski, Artem and Wang, Zhibin and Wei, Gang and Zhao, Keji}, month = mar, year = {2008}, keywords = {DNA, SIGNALING}, pages = {887--898}, file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/C63W6BPF/Schones et al. - 2008 - Dynamic Regulation of Nucleosome Positioning in th.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/U7WWVSTV/S0092867408002705.html:text/html} } @article{dreos_eukaryotic_2017, title = {The eukaryotic promoter database in its 30th year: focus on non-vertebrate organisms}, volume = {45}, issn = {0305-1048, 1362-4962}, shorttitle = {The eukaryotic promoter database in its 30th year}, url = {http://nar.oxfordjournals.org/content/45/D1/D51}, doi = {10.1093/nar/gkw1069}, abstract = {We present an update of the Eukaryotic Promoter Database EPD (http://epd.vital-it.ch), more specifically on the EPDnew division, which contains comprehensive organisms-specific transcription start site (TSS) collections automatically derived from next generation sequencing (NGS) data. Thanks to the abundant release of new high-throughput transcript mapping data (CAGE, TSS-seq, GRO-cap) the database could be extended to plant and fungal species. We further report on the expansion of the mass genome annotation (MGA) repository containing promoter-relevant chromatin profiling data and on improvements for the EPD entry viewers. Finally, we present a new data access tool, ChIP-Extract, which enables computational biologists to extract diverse types of promoter-associated data in numerical table formats that are readily imported into statistical analysis platforms such as R.}, language = {en}, number = {D1}, urldate = {2017-01-05}, journal = {Nucleic Acids Research}, author = {Dreos, René and Ambrosini, Giovanna and Groux, Romain and Cavin Périer, Rouaïda and Bucher, Philipp}, month = jan, year = {2017}, pmid = {27899657}, pages = {D51--D55}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/JMIFBMU3/Dreos et al. - 2017 - The eukaryotic promoter database in its 30th year.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/NESWBKE4/D51.html:text/html} } @article{shlyueva_transcriptional_2014, title = {Transcriptional enhancers: from properties to genome-wide predictions}, volume = {15}, copyright = {© 2014 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {1471-0056}, shorttitle = {Transcriptional enhancers}, url = {http://www.nature.com/nrg/journal/v15/n4/full/nrg3682.html}, doi = {10.1038/nrg3682}, abstract = {Cellular development, morphology and function are governed by precise patterns of gene expression. These are established by the coordinated action of genomic regulatory elements known as enhancers or cis-regulatory modules. More than 30 years after the initial discovery of enhancers, many of their properties have been elucidated; however, despite major efforts, we only have an incomplete picture of enhancers in animal genomes. In this Review, we discuss how properties of enhancer sequences and chromatin are used to predict enhancers in genome-wide studies. We also cover recently developed high-throughput methods that allow the direct testing and identification of enhancers on the basis of their activity. Finally, we discuss recent technological advances and current challenges in the field of regulatory genomics.}, language = {en}, number = {4}, urldate = {2017-01-06}, journal = {Nature Reviews Genetics}, author = {Shlyueva, Daria and Stampfel, Gerald and Stark, Alexander}, month = apr, year = {2014}, keywords = {Chromatin, Gene regulation, Transcriptional regulatory elements, Regulatory networks}, pages = {272--286}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/PPV2MDTW/Shlyueva et al. - 2014 - Transcriptional enhancers from properties to geno.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/5QXIK7V9/nrg3682.html:text/html} } @article{fu_insulator_2008, title = {The {Insulator} {Binding} {Protein} {CTCF} {Positions} 20 {Nucleosomes} around {Its} {Binding} {Sites} across the {Human} {Genome}}, volume = {4}, issn = {1553-7404}, url = {http://journals.plos.org/plosgenetics/article?id=10.1371/journal.pgen.1000138}, doi = {10.1371/journal.pgen.1000138}, abstract = {Author Summary The accessibility of genomic DNA to regulatory proteins and to the transcriptional machinery plays an important role in eukaryotic transcription regulation. Some regulatory proteins alter chromatin structures by evicting histones in selected loci. Nonetheless, no regulatory proteins have been reported to position nucleosomes genome-wide. The only genomic landmark that has been associated with well-positioned nucleosomes is the transcriptional start site (TSS)—several well-positioned nucleosomes are observed downstream of TSS genome-wide. Here we report that the CCCTC-binding factor (CTCF), a protein that binds insulator elements to prevent the spreading of heterochromatin and restricting transcriptional enhancers from activating unrelated promoters, possesses greater ability to position nucleosomes across the human genome than does the TSS. These well-positioned nucleosomes are highly enriched in a histone variant H2A.Z and 11 histone modifications. The nucleosomes enriched in the histone modifications previously implicated to correlate with active transcription tend to have less protected DNA against digestion by micrococcal nuclease, or greater DNA accessibility. This nucleosome-positioning ability is likely unique to CTCF, because it was not found in the other transcriptional factors we investigated. Thus we suggest that the binding of CTCF provides an anchor for positioning nucleosomes, and chromatin remodeling is an important aspect of CTCF function.}, number = {7}, urldate = {2017-01-10}, journal = {PLOS Genetics}, author = {Fu, Yutao and Sinha, Manisha and Peterson, Craig L. and Weng, Zhiping}, year = {2008}, keywords = {Chromatin, Transcription Factors, Nucleosomes, Histones, Nucleosome mapping, Histone modification, Insulators, DNA transcription}, pages = {e1000138}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GB4N7TQG/Fu et al. - 2008 - The Insulator Binding Protein CTCF Positions 20 Nu.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4KZ29XEU/article.html:text/html} } @article{boeva_novo_2010, title = {De novo motif identification improves the accuracy of predicting transcription factor binding sites in {ChIP}-{Seq} data analysis}, volume = {38}, issn = {0305-1048, 1362-4962}, url = {http://nar.oxfordjournals.org/content/38/11/e126}, doi = {10.1093/nar/gkq217}, abstract = {Dramatic progress in the development of next-generation sequencing technologies has enabled accurate genome-wide characterization of the binding sites of DNA-associated proteins. This technique, baptized as ChIP-Seq, uses a combination of chromatin immunoprecipitation and massively parallel DNA sequencing. Other published tools that predict binding sites from ChIP-Seq data use only positional information of mapped reads. In contrast, our algorithm MICSA (Motif Identification for ChIP-Seq Analysis) combines this source of positional information with information on motif occurrences to better predict binding sites of transcription factors (TFs). We proved the greater accuracy of MICSA with respect to several other tools by running them on datasets for the TFs NRSF, GABP, STAT1 and CTCF. We also applied MICSA on a dataset for the oncogenic TF EWS-FLI1. We discovered {\textgreater}2000 binding sites and two functionally different binding motifs. We observed that EWS-FLI1 can activate gene transcription when (i) its binding site is located in close proximity to the gene transcription start site (up to ∼150 kb), and (ii) it contains a microsatellite sequence. Furthermore, we observed that sites without microsatellites can also induce regulation of gene expression—positively as often as negatively—and at much larger distances (up to ∼1 Mb).}, language = {en}, number = {11}, urldate = {2017-01-11}, journal = {Nucleic Acids Research}, author = {Boeva, Valentina and Surdez, Didier and Guillon, Noëlle and Tirode, Franck and Fejes, Anthony P. and Delattre, Olivier and Barillot, Emmanuel}, month = jun, year = {2010}, pmid = {20375099}, pages = {e126--e126}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9CBMJ2JP/Boeva et al. - 2010 - De novo motif identification improves the accuracy.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/W6RIZBBF/e126.html:text/html} } -@article{siepel_evolutionarily_2005-1, - title = {Evolutionarily conserved elements in vertebrate, insect, worm, and yeast genomes}, - volume = {15}, - issn = {1088-9051, 1549-5469}, - url = {http://genome.cshlp.org/content/15/8/1034}, - doi = {10.1101/gr.3715005}, - abstract = {We have conducted a comprehensive search for conserved elements in vertebrate genomes, using genome-wide multiple alignments of five vertebrate species (human, mouse, rat, chicken, and Fugu rubripes). Parallel searches have been performed with multiple alignments of four insect species (three species of Drosophila and Anopheles gambiae), two species of Caenorhabditis, and seven species of Saccharomyces. Conserved elements were identified with a computer program called phastCons, which is based on a two-state phylogenetic hidden Markov model (phylo-HMM). PhastCons works by fitting a phylo-HMM to the data by maximum likelihood, subject to constraints designed to calibrate the model across species groups, and then predicting conserved elements based on this model. The predicted elements cover roughly 3\%–8\% of the human genome (depending on the details of the calibration procedure) and substantially higher fractions of the more compact Drosophila melanogaster (37\%–53\%), Caenorhabditis elegans (18\%–37\%), and Saccharaomyces cerevisiae (47\%–68\%) genomes. From yeasts to vertebrates, in order of increasing genome size and general biological complexity, increasing fractions of conserved bases are found to lie outside of the exons of known protein-coding genes. In all groups, the most highly conserved elements (HCEs), by log-odds score, are hundreds or thousands of bases long. These elements share certain properties with ultraconserved elements, but they tend to be longer and less perfectly conserved, and they overlap genes of somewhat different functional categories. In vertebrates, HCEs are associated with the 3′ UTRs of regulatory genes, stable gene deserts, and megabase-sized regions rich in moderately conserved noncoding sequences. Noncoding HCEs also show strong statistical evidence of an enrichment for RNA secondary structure.}, - language = {en}, - number = {8}, - urldate = {2017-01-18}, - journal = {Genome Research}, - author = {Siepel, Adam and Bejerano, Gill and Pedersen, Jakob S. and Hinrichs, Angie S. and Hou, Minmei and Rosenbloom, Kate and Clawson, Hiram and Spieth, John and Hillier, LaDeana W. and Richards, Stephen and Weinstock, George M. and Wilson, Richard K. and Gibbs, Richard A. and Kent, W. James and Miller, Webb and Haussler, David}, - month = aug, - year = {2005}, - pmid = {16024819}, - pages = {1034--1050}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/SN4RW9KZ/Siepel et al. - 2005 - Evolutionarily conserved elements in vertebrate, i.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XSQKJB4E/1034.html:text/html} -} - @article{boeva_nebulaweb_server_2012, title = {Nebula—a web\_server for advanced {ChIP}-seq data analysis}, volume = {28}, issn = {1367-4803}, url = {https://academic.oup.com/bioinformatics/article/28/19/2517/288900/Nebula-a-web-server-for-advanced-ChIP-seq-data}, doi = {10.1093/bioinformatics/bts463}, number = {19}, urldate = {2017-01-19}, journal = {Bioinformatics}, author = {Boeva, Valentina and Lermine, Alban and Barette, Camille and Guillouf, Christel and Barillot, Emmanuel}, month = oct, year = {2012}, pages = {2517--2519}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/H9ZFAN5U/Boeva et al. - 2012 - Nebula—a web-server for advanced ChIP-seq data ana.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/T5I9WCVM/Nebula-a-web-server-for-advanced-ChIP-seq-data.html:text/html} } @article{ambrosini_chip-seq_2016, title = {The {ChIP}-{Seq} tools and web server: a resource for analyzing {ChIP}-seq and other types of genomic data}, volume = {17}, issn = {1471-2164}, shorttitle = {The {ChIP}-{Seq} tools and web server}, url = {http://dx.doi.org/10.1186/s12864-016-3288-8}, doi = {10.1186/s12864-016-3288-8}, abstract = {ChIP-seq and related high-throughput chromatin profilig assays generate ever increasing volumes of highly valuable biological data. To make sense out of it, biologists need versatile, efficient and user-friendly tools for access, visualization and itegrative analysis of such data.}, urldate = {2017-01-25}, journal = {BMC Genomics}, author = {Ambrosini, Giovanna and Dreos, René and Kumar, Sunil and Bucher, Philipp}, year = {2016}, keywords = {transcription factor binding sites, ChIP-seq data analysis, Bioinformatics resources, Web server, Peak finding, Genomic context analysis, Histone modifications, DNA sequence motifs}, pages = {938}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/3TBE7A76/Ambrosini et al. - 2016 - The ChIP-Seq tools and web server a resource for .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/KQWCAIV7/s12864-016-3288-8.html:text/html} } @article{singer_ciita_2013, title = {{CIITA} and {Its} {Dual} {Roles} in {MHC} {Gene} {Transcription}}, volume = {4}, issn = {1664-3224}, url = {http://journal.frontiersin.org/article/10.3389/fimmu.2013.00476/abstract}, doi = {10.3389/fimmu.2013.00476}, abstract = {CIITA is a transcriptional co-activator that regulates γ-interferon-activated transcription of Major Histocompatibility Complex (MHC) class I and class II genes. As such, it plays a critical role in immune responses: CIITA deficiency results in aberrant MHC gene expression and consequently in autoimmune diseases such as Type II bare lymphocyte syndrome. Although CIITA does not bind DNA directly, it regulates MHC transcription in two distinct ways– as a transcriptional activator and as a general transcription factor. As an activator, CIITA nucleates an enhanceosome consisting of the DNA binding transcription factors RFX, CREB and NF-Y. As a general transcription factor, CIITA functionally replaces the TFIID component, TAF1. Like TAF1, CIITA possesses acetyltransferase (AT) and kinase activities, both of which contribute to proper transcription of MHC class I and II genes. The substrate specificity and regulation of the CIITA AT and kinase activities also parallel those of TAF1. In addition, CIITA is tightly regulated by its various regulatory domains that undergo phosphorylation and influence its targeted localization. Thus, a complex picture of the mechanisms regulating CIITA function is emerging suggesting that CIITA has dual roles in transcriptional regulation which are summarized in this review.}, language = {English}, urldate = {2017-01-30}, journal = {Frontiers in Immunology}, author = {Singer, Dinah S. and Devaiah, Ballachanda Nanjappa}, year = {2013}, keywords = {CIITA, MHC transcription, TAF1, enhanceosome, general transcription factors, NLRCATERPILLER}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Q6JDIC2G/Singer et Devaiah - 2013 - CIITA and Its Dual Roles in MHC Gene Transcription.pdf:application/pdf} } @article{vo_creb-binding_2001, title = {{CREB}-binding {Protein} and p300 in {Transcriptional} {Regulation}}, volume = {276}, issn = {0021-9258, 1083-351X}, url = {http://www.jbc.org/content/276/17/13505}, doi = {10.1074/jbc.R000025200}, language = {en}, number = {17}, urldate = {2017-01-30}, journal = {Journal of Biological Chemistry}, author = {Vo, Ngan and Goodman, Richard H.}, month = apr, year = {2001}, pmid = {11279224}, pages = {13505--13508}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/E88QGRXZ/Vo et Goodman - 2001 - CREB-binding Protein and p300 in Transcriptional R.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GAJPFEN3/13505.html:text/html} } @article{bailey_fitting_1994, title = {Fitting a mixture model by expectation maximization to discover motifs in biopolymers}, volume = {2}, issn = {1553-0833}, abstract = {The algorithm described in this paper discovers one or more motifs in a collection of DNA or protein sequences by using the technique of expectation maximization to fit a two-component finite mixture model to the set of sequences. Multiple motifs are found by fitting a mixture model to the data, probabilistically erasing the occurrences of the motif thus found, and repeating the process to find successive motifs. The algorithm requires only a set of unaligned sequences and a number specifying the width of the motifs as input. It returns a model of each motif and a threshold which together can be used as a Bayes-optimal classifier for searching for occurrences of the motif in other databases. The algorithm estimates how many times each motif occurs in each sequence in the dataset and outputs an alignment of the occurrences of the motif. The algorithm is capable of discovering several different motifs with differing numbers of occurrences in a single dataset.}, language = {eng}, journal = {Proceedings. International Conference on Intelligent Systems for Molecular Biology}, author = {Bailey, T. L. and Elkan, C.}, year = {1994}, pmid = {7584402}, keywords = {Animals, Humans, Algorithms, Sequence analysis, Biopolymers, Models, Theoretical}, pages = {28--36}, file = {Bailey_Elkan94.pdf:/home/romaingroux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Bailey_Elkan94.pdf:application/pdf} } @article{isakova_smile-seq_2017, title = {{SMiLE}-seq identifies binding motifs of single and dimeric transcription factors}, volume = {advance online publication}, copyright = {© 2017 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {1548-7091}, url = {http://www.nature.com/nmeth/journal/vaop/ncurrent/full/nmeth.4143.html}, doi = {10.1038/nmeth.4143}, abstract = {Resolving the DNA-binding specificities of transcription factors (TFs) is of critical value for understanding gene regulation. Here, we present a novel, semiautomated protein–DNA interaction characterization technology, selective microfluidics-based ligand enrichment followed by sequencing (SMiLE-seq). SMiLE-seq is neither limited by DNA bait length nor biased toward strong affinity binders; it probes the DNA-binding properties of TFs over a wide affinity range in a fast and cost-effective fashion. We validated SMiLE-seq by analyzing 58 full-length human, mouse, and Drosophila TFs from distinct structural classes. All tested TFs yielded DNA-binding models with predictive power comparable to or greater than that of other in vitro assays. De novo motif discovery on all JUN–FOS heterodimers and several nuclear receptor-TF complexes provided novel insights into partner-specific heterodimer DNA-binding preferences. We also successfully analyzed the DNA-binding properties of uncharacterized human C2H2 zinc-finger proteins and validated several using ChIP-exo.}, language = {en}, urldate = {2017-01-31}, journal = {Nature Methods}, author = {Isakova, Alina and Groux, Romain and Imbeault, Michael and Rainer, Pernille and Alpern, Daniel and Dainese, Riccardo and Ambrosini, Giovanna and Trono, Didier and Bucher, Philipp and Deplancke, Bart}, month = jan, year = {2017}, keywords = {Genomic analysis, Lab-on-a-chip}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/JBXIE44F/Isakova et al. - 2017 - SMiLE-seq identifies binding motifs of single and .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/EP3KB63D/nmeth.4143.html:text/html} } @book{marsland_machine_2015-1, address = {Boca Raton}, edition = {Second Edition}, title = {Machine {Learning}, {An} algorithmic {Perspective}, {Chapter} 7 {Probabilistic} {Learning}}, isbn = {978-1-4398-8921-3}, url = {https://www.crcpress.com/Machine-Learning-An-Algorithmic-Perspective/Marsland/p/book/9781439889213}, publisher = {CRC Press}, author = {Marsland, Stephen}, year = {2015} } @article{berger_universal_2009, title = {Universal protein-binding microarrays for the comprehensive characterization of the {DNA}-binding specificities of transcription factors}, volume = {4}, copyright = {© 2009 Nature Publishing Group}, issn = {1754-2189}, url = {http://www.nature.com/nprot/journal/v4/n3/full/nprot.2008.195.html}, doi = {10.1038/nprot.2008.195}, abstract = {Protein-binding microarray (PBM) technology provides a rapid, high-throughput means of characterizing the in vitro DNA-binding specificities of transcription factors (TFs). Using high-density, custom-designed microarrays containing all 10-mer sequence variants, one can obtain comprehensive binding-site measurements for any TF, regardless of its structural class or species of origin. Here, we present a protocol for the examination and analysis of TF-binding specificities at high resolution using such 'all 10-mer' universal PBMs. This procedure involves double-stranding a commercially synthesized DNA oligonucleotide array, binding a TF directly to the double-stranded DNA microarray and labeling the protein-bound microarray with a fluorophore-conjugated antibody. We describe how to computationally extract the relative binding preferences of the examined TF for all possible contiguous and gapped 8-mers over the full range of affinities, from highest affinity sites to nonspecific sites. Multiple proteins can be tested in parallel in separate chambers on a single microarray, enabling the processing of a dozen or more TFs in a single day.}, language = {en}, number = {3}, urldate = {2017-02-03}, journal = {Nature Protocols}, author = {Berger, Michael F. and Bulyk, Martha L.}, month = mar, year = {2009}, pages = {393--411}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/34HD9HV2/Berger et Bulyk - 2009 - Universal protein-binding microarrays for the comp.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/5EJI7WIQ/nprot.2008.195.html:text/html} } @article{jolma_multiplexed_2010, title = {Multiplexed massively parallel {SELEX} for characterization of human transcription factor binding specificities}, volume = {20}, issn = {1088-9051, 1549-5469}, url = {http://genome.cshlp.org/content/20/6/861}, doi = {10.1101/gr.100552.109}, abstract = {The genetic code—the binding specificity of all transfer-RNAs—defines how protein primary structure is determined by DNA sequence. DNA also dictates when and where proteins are expressed, and this information is encoded in a pattern of specific sequence motifs that are recognized by transcription factors. However, the DNA-binding specificity is only known for a small fraction of the ∼1400 human transcription factors (TFs). We describe here a high-throughput method for analyzing transcription factor binding specificity that is based on systematic evolution of ligands by exponential enrichment (SELEX) and massively parallel sequencing. The method is optimized for analysis of large numbers of TFs in parallel through the use of affinity-tagged proteins, barcoded selection oligonucleotides, and multiplexed sequencing. Data are analyzed by a new bioinformatic platform that uses the hundreds of thousands of sequencing reads obtained to control the quality of the experiments and to generate binding motifs for the TFs. The described technology allows higher throughput and identification of much longer binding profiles than current microarray-based methods. In addition, as our method is based on proteins expressed in mammalian cells, it can also be used to characterize DNA-binding preferences of full-length proteins or proteins requiring post-translational modifications. We validate the method by determining binding specificities of 14 different classes of TFs and by confirming the specificities for NFATC1 and RFX3 using ChIP-seq. Our results reveal unexpected dimeric modes of binding for several factors that were thought to preferentially bind DNA as monomers.}, language = {en}, number = {6}, urldate = {2017-02-03}, journal = {Genome Research}, author = {Jolma, Arttu and Kivioja, Teemu and Toivonen, Jarkko and Cheng, Lu and Wei, Gonghong and Enge, Martin and Taipale, Mikko and Vaquerizas, Juan M. and Yan, Jian and Sillanpää, Mikko J. and Bonke, Martin and Palin, Kimmo and Talukder, Shaheynoor and Hughes, Timothy R. and Luscombe, Nicholas M. and Ukkonen, Esko and Taipale, Jussi}, month = jun, year = {2010}, pmid = {20378718}, pages = {861--873}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/FJUK62JA/Jolma et al. - 2010 - Multiplexed massively parallel SELEX for character.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/MDXB4KDB/861.html:text/html} } @article{thompson_rna_2012, title = {{RNA} {Profiling} and {Chromatin} {Immunoprecipitation}-{Sequencing} {Reveal} that {PTF}1a {Stabilizes} {Pancreas} {Progenitor} {Identity} via the {Control} of {MNX}1/{HLXB}9 and a {Network} of {Other} {Transcription} {Factors}}, volume = {32}, issn = {0270-7306, 1098-5549}, url = {http://mcb.asm.org/content/32/6/1189}, doi = {10.1128/MCB.06318-11}, abstract = {Pancreas development is initiated by the specification and expansion of a small group of endodermal cells. Several transcription factors are crucial for progenitor maintenance and expansion, but their interactions and the downstream targets mediating their activity are poorly understood. Among those factors, PTF1a, a basic helix-loop-helix (bHLH) transcription factor which controls pancreas exocrine cell differentiation, maintenance, and functionality, is also needed for the early specification of pancreas progenitors. We used RNA profiling and chromatin immunoprecipitation (ChIP) sequencing to identify a set of targets in pancreas progenitors. We demonstrate that Mnx1, a gene that is absolutely required in pancreas progenitors, is a major direct target of PTF1a and is regulated by a distant enhancer element. Pdx1, Nkx6.1, and Onecut1 are also direct PTF1a targets whose expression is promoted by PTF1a. These proteins, most of which were previously shown to be necessary for pancreas bud maintenance or formation, form a transcription factor network that allows the maintenance of pancreas progenitors. In addition, we identify Bmp7, Nr5a2, RhoV, and P2rx1 as new targets of PTF1a in pancreas progenitors.}, language = {en}, number = {6}, urldate = {2017-02-03}, journal = {Molecular and Cellular Biology}, author = {Thompson, Nancy and Gésina, Emilie and Scheinert, Peter and Bucher, Philipp and Grapin-Botton, Anne}, month = mar, year = {2012}, pmid = {22232429}, pages = {1189--1199}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/3AAJMX28/Thompson et al. - 2012 - RNA Profiling and Chromatin Immunoprecipitation-Se.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/BCNGS5A6/1189.html:text/html} } @article{isakova_smile-seq_2017-1, title = {{SMiLE}-seq identifies binding motifs of single and dimeric transcription factors}, volume = {advance online publication}, copyright = {© 2017 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {1548-7091}, url = {http://www.nature.com/nmeth/journal/vaop/ncurrent/full/nmeth.4143.html}, doi = {10.1038/nmeth.4143}, abstract = {Resolving the DNA-binding specificities of transcription factors (TFs) is of critical value for understanding gene regulation. Here, we present a novel, semiautomated protein–DNA interaction characterization technology, selective microfluidics-based ligand enrichment followed by sequencing (SMiLE-seq). SMiLE-seq is neither limited by DNA bait length nor biased toward strong affinity binders; it probes the DNA-binding properties of TFs over a wide affinity range in a fast and cost-effective fashion. We validated SMiLE-seq by analyzing 58 full-length human, mouse, and Drosophila TFs from distinct structural classes. All tested TFs yielded DNA-binding models with predictive power comparable to or greater than that of other in vitro assays. De novo motif discovery on all JUN–FOS heterodimers and several nuclear receptor-TF complexes provided novel insights into partner-specific heterodimer DNA-binding preferences. We also successfully analyzed the DNA-binding properties of uncharacterized human C2H2 zinc-finger proteins and validated several using ChIP-exo.}, language = {en}, urldate = {2017-02-03}, journal = {Nature Methods}, author = {Isakova, Alina and Groux, Romain and Imbeault, Michael and Rainer, Pernille and Alpern, Daniel and Dainese, Riccardo and Ambrosini, Giovanna and Trono, Didier and Bucher, Philipp and Deplancke, Bart}, month = jan, year = {2017}, keywords = {Genomic analysis, Lab-on-a-chip}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/W72MXR9H/Isakova et al. - 2017 - SMiLE-seq identifies binding motifs of single and .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/C7I7TIXW/nmeth.4143.html:text/html} } @article{robertson_genome-wide_2007, title = {Genome-wide profiles of {STAT}1 {DNA} association using chromatin immunoprecipitation and massively parallel sequencing}, volume = {4}, copyright = {© 2007 Nature Publishing Group}, issn = {1548-7091}, url = {http://www.nature.com/nmeth/journal/v4/n8/full/nmeth1068.html}, doi = {10.1038/nmeth1068}, abstract = {We developed a method, ChIP-sequencing (ChIP-seq), combining chromatin immunoprecipitation (ChIP) and massively parallel sequencing to identify mammalian DNA sequences bound by transcription factors in vivo. We used ChIP-seq to map STAT1 targets in interferon-γ (IFN-γ)–stimulated and unstimulated human HeLa S3 cells, and compared the method's performance to ChIP-PCR and to ChIP-chip for four chromosomes. By ChIP-seq, using 15.1 and 12.9 million uniquely mapped sequence reads, and an estimated false discovery rate of less than 0.001, we identified 41,582 and 11,004 putative STAT1-binding regions in stimulated and unstimulated cells, respectively. Of the 34 loci known to contain STAT1 interferon-responsive binding sites, ChIP-seq found 24 (71\%). ChIP-seq targets were enriched in sequences similar to known STAT1 binding motifs. Comparisons with two ChIP-PCR data sets suggested that ChIP-seq sensitivity was between 70\% and 92\% and specificity was at least 95\%.}, language = {en}, number = {8}, urldate = {2017-02-05}, journal = {Nature Methods}, author = {Robertson, Gordon and Hirst, Martin and Bainbridge, Matthew and Bilenky, Misha and Zhao, Yongjun and Zeng, Thomas and Euskirchen, Ghia and Bernier, Bridget and Varhol, Richard and Delaney, Allen and Thiessen, Nina and Griffith, Obi L. and He, Ann and Marra, Marco and Snyder, Michael and Jones, Steven}, month = aug, year = {2007}, pages = {651--657}, file = {Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/59396VND/nmeth1068.html:text/html} } @article{schutz_mamot:_2008, title = {{MAMOT}: hidden {Markov} modeling tool}, volume = {24}, issn = {1367-4803}, shorttitle = {{MAMOT}}, url = {https://academic.oup.com/bioinformatics/article/24/11/1399/192734/MAMOT-hidden-Markov-modeling-tool}, doi = {10.1093/bioinformatics/btn201}, number = {11}, urldate = {2017-02-05}, journal = {Bioinformatics}, author = {Schütz, Frédéric and Delorenzi, Mauro}, month = jun, year = {2008}, pages = {1399--1400}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/WMUURNHG/Schütz et Delorenzi - 2008 - MAMOT hidden Markov modeling tool.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HHAXMX5Z/MAMOT-hidden-Markov-modeling-tool.html:text/html} } @article{donohoe_identification_2007, title = {Identification of a {Ctcf} {Cofactor}, {Yy}1, for the {X} {Chromosome} {Binary} {Switch}}, volume = {25}, issn = {1097-2765}, url = {https://www.sciencedirect.com/science/article/pii/S109727650600788X}, doi = {10.1016/j.molcel.2006.11.017}, abstract = {Summary -In mammals, inactivation of one X chromosome in the female equalizes gene dosages between XX females and XY males. Two noncoding loci, Tsix and Xite, together regulate X chromosome fate by controlling homologous chromosome pairing, counting, and mutually exclusive choice. Following choice, the asymmetry of Xite and Tsix expression drives divergent chromosome fates, but how this pattern becomes established is currently unknown. Although no proven trans-acting factors have been identified, a likely candidate is Ctcf, a chromatin insulator with essential function in autosomal imprinting. Here, we search for trans-factors and identify Yy1 as a required cofactor for Ctcf. Paired Ctcf-Yy1 elements are highly clustered within the counting/choice and imprinting domain of Tsix. A deficiency of Yy1 leads to aberrant Tsix and Xist expression, resulting in a deficit of male and female embryos. Yy1 and Ctcf associate through specific protein-protein interactions and together transactivate Tsix. We propose that the Ctcf-Yy1-Tsix complex functions as a key component of the X chromosome binary switch.}, - number = {1}, - urldate = {2017-02-07}, - journal = {Molecular Cell}, - author = {Donohoe, Mary E. and Zhang, Li-Feng and Xu, Na and Shi, Yang and Lee, Jeannie T.}, - month = jan, - year = {2007}, - keywords = {DNA, DEVBIO}, - pages = {43--56}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HBBFAT33/Donohoe et al. - 2007 - Identification of a Ctcf Cofactor, Yy1, for the X .pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/E6ZTI833/S109727650600788X.html:text/html} -} - -@article{donohoe_identification_2007-1, - title = {Identification of a {Ctcf} {Cofactor}, {Yy}1, for the {X} {Chromosome} {Binary} {Switch}}, - volume = {25}, - issn = {1097-2765}, - url = {https://www.sciencedirect.com/science/article/pii/S109727650600788X}, - doi = {10.1016/j.molcel.2006.11.017}, - abstract = {Summary In mammals, inactivation of one X chromosome in the female equalizes gene dosages between XX females and XY males. Two noncoding loci, Tsix and Xite, together regulate X chromosome fate by controlling homologous chromosome pairing, counting, and mutually exclusive choice. Following choice, the asymmetry of Xite and Tsix expression drives divergent chromosome fates, but how this pattern becomes established is currently unknown. Although no proven trans-acting factors have been identified, a likely candidate is Ctcf, a chromatin insulator with essential function in autosomal imprinting. Here, we search for trans-factors and identify Yy1 as a required cofactor for Ctcf. Paired Ctcf-Yy1 elements are highly clustered within the counting/choice and imprinting domain of Tsix. A deficiency of Yy1 leads to aberrant Tsix and Xist expression, resulting in a deficit of male and female embryos. Yy1 and Ctcf associate through specific protein-protein interactions and together transactivate Tsix. We propose that the Ctcf-Yy1-Tsix complex functions as a key component of the X chromosome binary switch.}, number = {1}, urldate = {2017-02-07}, journal = {Molecular Cell}, author = {Donohoe, Mary E. and Zhang, Li-Feng and Xu, Na and Shi, Yang and Lee, Jeannie T.}, month = jan, year = {2007}, keywords = {DNA, DEVBIO}, pages = {43--56}, file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/FUWNBNEA/Donohoe et al. - 2007 - Identification of a Ctcf Cofactor, Yy1, for the X .pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/SQSMKC36/S109727650600788X.html:text/html} } @article{stedman_cohesins_2008, title = {Cohesins localize with {CTCF} at the {KSHV} latency control region and at cellular c-myc and {H}19 {Igf}2 insulators}, volume = {27}, copyright = {Copyright © 2008 European Molecular Biology Organization}, issn = {0261-4189, 1460-2075}, url = {http://emboj.embopress.org/content/27/4/654}, doi = {10.1038/emboj.2008.1}, abstract = {Cohesins, which mediate sister chromatin cohesion, and CTCF, which functions at chromatin boundaries, play key roles in the structural and functional organization of chromosomes. We examined the binding of these two factors on the Kaposi's sarcoma‐associated herpesvirus (KSHV) episome during latent infection and found a striking colocalization within the control region of the major latency transcript responsible for expressing LANA (ORF73), vCyclin (ORF72), vFLIP (ORF71), and vmiRNAs. Deletion of the CTCF‐binding site from the viral genome disrupted cohesin binding, and crippled colony formation in 293 cells. Clonal instability correlated with elevated expression of lytic cycle gene products, notably the neighbouring promoter for K14 and vGPCR (ORF74). siRNA depletion of RAD21 from latently infected cells caused an increase in K14 and ORF74, and lytic inducers caused a rapid dissociation of RAD21 from the viral genome. RAD21 and SMC1 also associate with the cellular CTCF sites at mammalian c‐myc promoter and H19 / Igf2 imprinting control region. We conclude that cohesin subunits associate with viral and cellular CTCF sites involved in complex gene regulation and chromatin organization.}, language = {en}, number = {4}, urldate = {2017-02-07}, journal = {The EMBO Journal}, author = {Stedman, William and Kang, Hyojeung and Lin, Shu and Kissil, Joseph L. and Bartolomei, Marisa S. and Lieberman, Paul M.}, month = feb, year = {2008}, pmid = {18219272}, pages = {654--666}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6JPAWDK8/Stedman et al. - 2008 - Cohesins localize with CTCF at the KSHV latency co.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RXH9XCBG/654.html:text/html} } @article{orenstein_comparative_2014, title = {A comparative analysis of transcription factor binding models learned from {PBM}, {HT}-{SELEX} and {ChIP} data}, volume = {42}, issn = {0305-1048}, url = {https://academic.oup.com/nar/article/42/8/e63/1067315/A-comparative-analysis-of-transcription-factor}, doi = {10.1093/nar/gku117}, number = {8}, urldate = {2017-02-07}, journal = {Nucleic Acids Research}, author = {Orenstein, Yaron and Shamir, Ron}, month = apr, year = {2014}, pages = {e63--e63}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/KSRXNAZ6/Orenstein et Shamir - 2014 - A comparative analysis of transcription factor bin.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XAPXSRB5/gku117.html:text/html} } @article{guo_discovering_2010, title = {Discovering homotypic binding events at high spatial resolution}, volume = {26}, issn = {1367-4803}, url = {https://academic.oup.com/bioinformatics/article/26/24/3028/289014/Discovering-homotypic-binding-events-at-high}, doi = {10.1093/bioinformatics/btq590}, number = {24}, urldate = {2017-02-13}, journal = {Bioinformatics}, author = {Guo, Yuchun and Papachristoudis, Georgios and Altshuler, Robert C. and Gerber, Georg K. and Jaakkola, Tommi S. and Gifford, David K. and Mahony, Shaun}, month = dec, year = {2010}, pages = {3028--3034}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/NHTWZW37/Guo et al. - 2010 - Discovering homotypic binding events at high spati.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/G4B37CI9/btq590.html:text/html} } @article{roulet_high-throughput_2002, title = {High-throughput {SELEX}–{SAGE} method for quantitative modeling of transcription-factor binding sites}, volume = {20}, copyright = {© 2002 Nature Publishing Group}, issn = {1087-0156}, url = {http://www.nature.com/nbt/journal/v20/n8/full/nbt718.html}, doi = {10.1038/nbt718}, abstract = {The ability to determine the location and relative strength of all transcription-factor binding sites in a genome is important both for a comprehensive understanding of gene regulation and for effective promoter engineering in biotechnological applications. Here we present a bioinformatically driven experimental method to accurately define the DNA-binding sequence specificity of transcription factors. A generalized profile was used as a predictive quantitative model for binding sites, and its parameters were estimated from in vitro–selected ligands using standard hidden Markov model training algorithms. Computer simulations showed that several thousand low- to medium-affinity sequences are required to generate a profile of desired accuracy. To produce data on this scale, we applied high-throughput genomics methods to the biochemical problem addressed here. A method combining systematic evolution of ligands by exponential enrichment (SELEX) and serial analysis of gene expression (SAGE) protocols was coupled to an automated quality-controlled sequence extraction procedure based on Phred quality scores. This allowed the sequencing of a database of more than 10,000 potential DNA ligands for the CTF/NFI transcription factor. The resulting binding-site model defines the sequence specificity of this protein with a high degree of accuracy not achieved earlier and thereby makes it possible to identify previously unknown regulatory sequences in genomic DNA. A covariance analysis of the selected sites revealed non-independent base preferences at different nucleotide positions, providing insight into the binding mechanism.}, language = {en}, number = {8}, urldate = {2017-02-19}, journal = {Nature Biotechnology}, author = {Roulet, Emmanuelle and Busso, Stéphane and Camargo, Anamaria A. and Simpson, Andrew J. G. and Mermod, Nicolas and Bucher, Philipp}, month = aug, year = {2002}, pages = {831--835}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7G98EPPD/Roulet et al. - 2002 - High-throughput SELEX–SAGE method for quantitative.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GNXT26I9/nbt718.html:text/html} } @article{ghirlando_ctcf:_2016, - title = {{CTCF}: making the right connections}, - volume = {30}, - issn = {0890-9369, 1549-5477}, - shorttitle = {{CTCF}}, - url = {http://genesdev.cshlp.org/content/30/8/881}, - doi = {10.1101/gad.277863.116}, - abstract = {The role of the zinc finger protein CTCF in organizing the genome within the nucleus is now well established. Widely separated sites on DNA, occupied by both CTCF and the cohesin complex, make physical contacts that create large loop domains. Additional contacts between loci within those domains, often also mediated by CTCF, tend to be favored over contacts between loci in different domains. A large number of studies during the past 2 years have addressed the questions: How are these loops generated? What are the effects of disrupting them? Are there rules governing large-scale genome organization? It now appears that the strongest and evolutionarily most conserved of these CTCF interactions have specific rules for the orientation of the paired CTCF sites, implying the existence of a nonequilibrium mechanism of generation. Recent experiments that invert, delete, or inactivate one of a mating CTCF pair result in major changes in patterns of organization and gene expression in the surrounding regions. What remain to be determined are the detailed molecular mechanisms for re-establishing loop domains and maintaining them after replication and mitosis. As recently published data show, some mechanisms may involve interactions with noncoding RNAs as well as protein cofactors. Many CTCF sites are also involved in other functions such as modulation of RNA splicing and specific regulation of gene expression, and the relationship between these activities and loop formation is another unanswered question that should keep investigators occupied for some time.}, - language = {en}, - number = {8}, - urldate = {2017-02-23}, - journal = {Genes \& Development}, - author = {Ghirlando, Rodolfo and Felsenfeld, Gary}, - month = apr, - year = {2016}, - pmid = {27083996}, - keywords = {Chromatin, Insulators, topologically associated domains}, - pages = {881--891}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UBR9U954/Ghirlando et Felsenfeld - 2016 - CTCF making the right connections.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/N3SCBDXN/881.html:text/html} -} - -@article{ghirlando_ctcf:_2016-1, title = {{CTCF}: making the right connections}, volume = {30}, issn = {0890-9369, 1549-5477}, shorttitle = {{CTCF}}, url = {http://genesdev.cshlp.org/content/30/8/881}, doi = {10.1101/gad.277863.116}, abstract = {The role of the zinc finger protein CTCF in organizing the genome within the nucleus is now well established. Widely separated sites on DNA, occupied by both CTCF and the cohesin complex, make physical contacts that create large loop domains. Additional contacts between loci within those domains, often also mediated by CTCF, tend to be favored over contacts between loci in different domains. A large number of studies during the past 2 years have addressed the questions: How are these loops generated? What are the effects of disrupting them? Are there rules governing large-scale genome organization? It now appears that the strongest and evolutionarily most conserved of these CTCF interactions have specific rules for the orientation of the paired CTCF sites, implying the existence of a nonequilibrium mechanism of generation. Recent experiments that invert, delete, or inactivate one of a mating CTCF pair result in major changes in patterns of organization and gene expression in the surrounding regions. What remain to be determined are the detailed molecular mechanisms for re-establishing loop domains and maintaining them after replication and mitosis. As recently published data show, some mechanisms may involve interactions with noncoding RNAs as well as protein cofactors. Many CTCF sites are also involved in other functions such as modulation of RNA splicing and specific regulation of gene expression, and the relationship between these activities and loop formation is another unanswered question that should keep investigators occupied for some time.}, language = {en}, number = {8}, urldate = {2017-02-23}, journal = {Genes \& Development}, author = {Ghirlando, Rodolfo and Felsenfeld, Gary}, month = apr, year = {2016}, pmid = {27083996}, keywords = {Chromatin, Insulators, topologically associated domains}, pages = {881--891}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ASNKGH65/Ghirlando et Felsenfeld - 2016 - CTCF making the right connections.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4NW9GNZ5/881.html:text/html} } @article{van_helden_confidence_2016, title = {Confidence intervals are no salvation from the alleged fickleness of the {P} value}, volume = {13}, copyright = {© 2016 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {1548-7091}, url = {http://www.nature.com/nmeth/journal/v13/n8/full/nmeth.3932.html?WT.ec_id=NMETH-201608&spMailingID=51937223&spUserID=ODkwMTM2NjMzMgS2&spJobID=964115062&spReportId=OTY0MTE1MDYyS0}, doi = {10.1038/nmeth.3932}, language = {en}, number = {8}, urldate = {2017-02-27}, journal = {Nature Methods}, author = {van Helden, Jacques}, month = aug, year = {2016}, keywords = {Scientific community, Standards, Statistical methods}, pages = {605--606}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9K4SNU5Q/van Helden - 2016 - Confidence intervals are no salvation from the all.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Z3KUI6VQ/nmeth.3932.html:text/html} } @article{thomas-chollier_rsat:_2008, title = {{RSAT}: regulatory sequence analysis tools}, volume = {36}, issn = {0305-1048}, shorttitle = {{RSAT}}, url = {https://academic.oup.com/nar/article/36/suppl_2/W119/2506687/RSAT-regulatory-sequence-analysis-tools}, doi = {10.1093/nar/gkn304}, number = {suppl\_2}, urldate = {2017-02-27}, journal = {Nucleic Acids Research}, author = {Thomas-Chollier, Morgane and Sand, Olivier and Turatsinze, Jean-Valéry and Janky, Rekin's and Defrance, Matthieu and Vervisch, Eric and Brohée, Sylvain and van Helden, Jacques}, month = jul, year = {2008}, pages = {W119--W127}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/V565AVBF/Thomas-Chollier et al. - 2008 - RSAT regulatory sequence analysis tools.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GZBFC8BJ/RSAT-regulatory-sequence-analysis-tools.html:text/html} } @article{wilbanks_evaluation_2010-1, title = {Evaluation of {Algorithm} {Performance} in {ChIP}-{Seq} {Peak} {Detection}}, volume = {5}, issn = {1932-6203}, url = {http://journals.plos.org/plosone/article?id=10.1371/journal.pone.0011471}, doi = {10.1371/journal.pone.0011471}, abstract = {Next-generation DNA sequencing coupled with chromatin immunoprecipitation (ChIP-seq) is revolutionizing our ability to interrogate whole genome protein-DNA interactions. Identification of protein binding sites from ChIP-seq data has required novel computational tools, distinct from those used for the analysis of ChIP-Chip experiments. The growing popularity of ChIP-seq spurred the development of many different analytical programs (at last count, we noted 31 open source methods), each with some purported advantage. Given that the literature is dense and empirical benchmarking challenging, selecting an appropriate method for ChIP-seq analysis has become a daunting task. Herein we compare the performance of eleven different peak calling programs on common empirical, transcription factor datasets and measure their sensitivity, accuracy and usability. Our analysis provides an unbiased critical assessment of available technologies, and should assist researchers in choosing a suitable tool for handling ChIP-seq data.}, number = {7}, urldate = {2017-03-15}, journal = {PLOS ONE}, author = {Wilbanks, Elizabeth G. and Facciotti, Marc T.}, year = {2010}, keywords = {Transcription Factors, Sequence motif analysis, Algorithms, DNA-binding proteins, Computer software, Genomic databases, Sequence tagged site analysis, Human genomics}, pages = {e11471}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/J5VJPGWV/Wilbanks et Facciotti - 2010 - Evaluation of Algorithm Performance in ChIP-Seq Pe.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HWSDRPH6/article.html:text/html} } @article{nozaki_tight_2011-1, title = {Tight associations between transcription promoter type and epigenetic variation in histone positioning and modification}, volume = {12}, issn = {1471-2164}, url = {http://dx.doi.org/10.1186/1471-2164-12-416}, doi = {10.1186/1471-2164-12-416}, abstract = {Transcription promoters are fundamental genomic cis-elements controlling gene expression. They can be classified into two types by the degree of imprecision of their transcription start sites: peak promoters, which initiate transcription from a narrow genomic region; and broad promoters, which initiate transcription from a wide-ranging region. Eukaryotic transcription initiation is suggested to be associated with the genomic positions and modifications of nucleosomes. For instance, it has been recently shown that histone with H3K9 acetylation (H3K9ac) is more likely to be distributed around broad promoters rather than peak promoters; it can thus be inferred that there is an association between histone H3K9 and promoter architecture.}, urldate = {2017-03-17}, journal = {BMC Genomics}, author = {Nozaki, Tadasu and Yachie, Nozomu and Ogawa, Ryu and Kratz, Anton and Saito, Rintaro and Tomita, Masaru}, year = {2011}, pages = {416}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/VIU8E9VW/Nozaki et al. - 2011 - Tight associations between transcription promoter .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HTUH5TZD/1471-2164-12-416.html:text/html} } @article{the_fantom_consortium_and_the_riken_pmi_and_clst_dgt_promoter-level_2014, title = {A promoter-level mammalian expression atlas}, volume = {507}, copyright = {© 2014 Nature Publishing Group, a division of Macmillan Publishers Limited. All Rights Reserved.}, issn = {0028-0836}, url = {http://www.nature.com/nature/journal/v507/n7493/full/nature13182.html}, doi = {10.1038/nature13182}, abstract = {Regulated transcription controls the diversity, developmental pathways and spatial organization of the hundreds of cell types that make up a mammal. Using single-molecule cDNA sequencing, we mapped transcription start sites (TSSs) and their usage in human and mouse primary cells, cell lines and tissues to produce a comprehensive overview of mammalian gene expression across the human body. We find that few genes are truly ‘housekeeping’, whereas many mammalian promoters are composite entities composed of several closely separated TSSs, with independent cell-type-specific expression profiles. TSSs specific to different cell types evolve at different rates, whereas promoters of broadly expressed genes are the most conserved. Promoter-based expression analysis reveals key transcription factors defining cell states and links them to binding-site motifs. The functions of identified novel transcripts can be predicted by coexpression and sample ontology enrichment analyses. The functional annotation of the mammalian genome 5 (FANTOM5) project provides comprehensive expression profiles and functional annotation of mammalian cell-type-specific transcriptomes with wide applications in biomedical research.}, language = {en}, number = {7493}, urldate = {2017-03-17}, journal = {Nature}, author = {{The FANTOM Consortium and the RIKEN PMI and CLST (dgt)}}, month = mar, year = {2014}, keywords = {Gene regulation, transcriptomics, Gene regulatory networks, Multicellular systems}, pages = {462--470}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XRAKAQX9/The FANTOM Consortium and the RIKEN PMI and CLST (dgt) - 2014 - A promoter-level mammalian expression atlas.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/QJQ6K929/nature13182.html:text/html} } @article{spivakov_analysis_2012, title = {Analysis of variation at transcription factor binding sites in {Drosophila} and humans}, volume = {13}, issn = {1474-760X}, url = {http://dx.doi.org/10.1186/gb-2012-13-9-r49}, doi = {10.1186/gb-2012-13-9-r49}, abstract = {Advances in sequencing technology have boosted population genomics and made it possible to map the positions of transcription factor binding sites (TFBSs) with high precision. Here we investigate TFBS variability by combining transcription factor binding maps generated by ENCODE, modENCODE, our previously published data and other sources with genomic variation data for human individuals and Drosophila isogenic lines.}, urldate = {2017-03-24}, journal = {Genome Biology}, author = {Spivakov, Mikhail and Akhtar, Junaid and Kheradpour, Pouya and Beal, Kathryn and Girardot, Charles and Koscielny, Gautier and Herrero, Javier and Kellis, Manolis and Furlong, Eileen EM and Birney, Ewan}, year = {2012}, pages = {R49}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/S2XFQGBR/Spivakov et al. - 2012 - Analysis of variation at transcription factor bind.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/K43SM4MK/gb-2012-13-9-r49.html:text/html} } -@article{wilbanks_evaluation_2010-2, - title = {Evaluation of {Algorithm} {Performance} in {ChIP}-{Seq} {Peak} {Detection}}, - volume = {5}, - issn = {1932-6203}, - url = {http://journals.plos.org/plosone/article?id=10.1371/journal.pone.0011471}, - doi = {10.1371/journal.pone.0011471}, - abstract = {Next-generation DNA sequencing coupled with chromatin immunoprecipitation (ChIP-seq) is revolutionizing our ability to interrogate whole genome protein-DNA interactions. Identification of protein binding sites from ChIP-seq data has required novel computational tools, distinct from those used for the analysis of ChIP-Chip experiments. The growing popularity of ChIP-seq spurred the development of many different analytical programs (at last count, we noted 31 open source methods), each with some purported advantage. Given that the literature is dense and empirical benchmarking challenging, selecting an appropriate method for ChIP-seq analysis has become a daunting task. Herein we compare the performance of eleven different peak calling programs on common empirical, transcription factor datasets and measure their sensitivity, accuracy and usability. Our analysis provides an unbiased critical assessment of available technologies, and should assist researchers in choosing a suitable tool for handling ChIP-seq data.}, - number = {7}, - urldate = {2017-03-24}, - journal = {PLOS ONE}, - author = {Wilbanks, Elizabeth G. and Facciotti, Marc T.}, - year = {2010}, - keywords = {Transcription Factors, Sequence motif analysis, Algorithms, DNA-binding proteins, Computer software, Genomic databases, Sequence tagged site analysis, Human genomics}, - pages = {e11471}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/3TSKDV8D/Wilbanks et Facciotti - 2010 - Evaluation of Algorithm Performance in ChIP-Seq Pe.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/MUGACFTS/article.html:text/html} -} - @article{landt_chip-seq_2012-1, title = {{ChIP}-seq guidelines and practices of the {ENCODE} and {modENCODE} consortia}, volume = {22}, issn = {1088-9051, 1549-5469}, url = {http://genome.cshlp.org/content/22/9/1813}, doi = {10.1101/gr.136184.111}, abstract = {Chromatin immunoprecipitation (ChIP) followed by high-throughput DNA sequencing (ChIP-seq) has become a valuable and widely used approach for mapping the genomic location of transcription-factor binding and histone modifications in living cells. Despite its widespread use, there are considerable differences in how these experiments are conducted, how the results are scored and evaluated for quality, and how the data and metadata are archived for public use. These practices affect the quality and utility of any global ChIP experiment. Through our experience in performing ChIP-seq experiments, the ENCODE and modENCODE consortia have developed a set of working standards and guidelines for ChIP experiments that are updated routinely. The current guidelines address antibody validation, experimental replication, sequencing depth, data and metadata reporting, and data quality assessment. We discuss how ChIP quality, assessed in these ways, affects different uses of ChIP-seq data. All data sets used in the analysis have been deposited for public viewing and downloading at the ENCODE (http://encodeproject.org/ENCODE/) and modENCODE (http://www.modencode.org/) portals.}, language = {en}, number = {9}, urldate = {2017-03-24}, journal = {Genome Research}, author = {Landt, Stephen G. and Marinov, Georgi K. and Kundaje, Anshul and Kheradpour, Pouya and Pauli, Florencia and Batzoglou, Serafim and Bernstein, Bradley E. and Bickel, Peter and Brown, James B. and Cayting, Philip and Chen, Yiwen and DeSalvo, Gilberto and Epstein, Charles and Fisher-Aylor, Katherine I. and Euskirchen, Ghia and Gerstein, Mark and Gertz, Jason and Hartemink, Alexander J. and Hoffman, Michael M. and Iyer, Vishwanath R. and Jung, Youngsook L. and Karmakar, Subhradip and Kellis, Manolis and Kharchenko, Peter V. and Li, Qunhua and Liu, Tao and Liu, X. Shirley and Ma, Lijia and Milosavljevic, Aleksandar and Myers, Richard M. and Park, Peter J. and Pazin, Michael J. and Perry, Marc D. and Raha, Debasish and Reddy, Timothy E. and Rozowsky, Joel and Shoresh, Noam and Sidow, Arend and Slattery, Matthew and Stamatoyannopoulos, John A. and Tolstorukov, Michael Y. and White, Kevin P. and Xi, Simon and Farnham, Peggy J. and Lieb, Jason D. and Wold, Barbara J. and Snyder, Michael}, month = sep, year = {2012}, pmid = {22955991}, pages = {1813--1831}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/N7CG2BSN/Landt et al. - 2012 - ChIP-seq guidelines and practices of the ENCODE an.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/REBXQDRA/1813.html:text/html} } @article{lai_archalign:_2010, title = {{ArchAlign}: coordinate-free chromatin alignment reveals novel architectures}, volume = {11}, issn = {1474-760X}, shorttitle = {{ArchAlign}}, url = {http://dx.doi.org/10.1186/gb-2010-11-12-r126}, doi = {10.1186/gb-2010-11-12-r126}, abstract = {To facilitate identification and characterization of genomic functional elements, we have developed a chromatin architecture alignment algorithm (ArchAlign). ArchAlign identifies shared chromatin structural patterns from high-resolution chromatin structural datasets derived from next-generation sequencing or tiled microarray approaches for user defined regions of interest. We validated ArchAlign using well characterized functional elements, and used it to explore the chromatin structural architecture at CTCF binding sites in the human genome. ArchAlign is freely available at http://www.acsu.buffalo.edu/{\textasciitilde}mjbuck/ArchAlign.html .}, urldate = {2017-04-13}, journal = {Genome Biology}, author = {Lai, William KM and Buck, Michael J.}, year = {2010}, pages = {R126}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ARFHNX3Q/Lai et Buck - 2010 - ArchAlign coordinate-free chromatin alignment rev.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/J7EV6WKM/gb-2010-11-12-r126.html:text/html} } -@article{lai_archalign:_2010-1, - title = {{ArchAlign}: coordinate-free chromatin alignment reveals novel architectures}, - volume = {11}, - issn = {1474-760X}, - shorttitle = {{ArchAlign}}, - url = {http://dx.doi.org/10.1186/gb-2010-11-12-r126}, - doi = {10.1186/gb-2010-11-12-r126}, - abstract = {To facilitate identification and characterization of genomic functional elements, we have developed a chromatin architecture alignment algorithm (ArchAlign). ArchAlign identifies shared chromatin structural patterns from high-resolution chromatin structural datasets derived from next-generation sequencing or tiled microarray approaches for user defined regions of interest. We validated ArchAlign using well characterized functional elements, and used it to explore the chromatin structural architecture at CTCF binding sites in the human genome. ArchAlign is freely available at http://www.acsu.buffalo.edu/{\textasciitilde}mjbuck/ArchAlign.html .}, - urldate = {2017-04-13}, - journal = {Genome Biology}, - author = {Lai, William KM and Buck, Michael J.}, - year = {2010}, - pages = {R126}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/5MSBRBFM/Lai et Buck - 2010 - ArchAlign coordinate-free chromatin alignment rev.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XFPI2FGV/gb-2010-11-12-r126.html:text/html} -} - @article{deplancke_genetics_2016, title = {The {Genetics} of {Transcription} {Factor} {DNA} {Binding} {Variation}}, volume = {166}, issn = {0092-8674, 1097-4172}, url = {http://www.cell.com/cell/abstract/S0092-8674(16)30918-7}, doi = {10.1016/j.cell.2016.07.012}, abstract = {Most complex trait-associated variants are located in non-coding regulatory regions of the genome, where they have been shown to disrupt transcription factor (TF)-DNA binding motifs. Variable TF-DNA interactions are therefore increasingly considered as key drivers of phenotypic variation. However, recent genome-wide studies revealed that the majority of variable TF-DNA binding events are not driven by sequence alterations in the motif of the studied TF. This observation implies that the molecular mechanisms underlying TF-DNA binding variation and, by extrapolation, inter-individual phenotypic variation are more complex than originally anticipated. Here, we summarize the findings that led to this important paradigm shift and review proposed mechanisms for local, proximal, or distal genetic variation-driven variable TF-DNA binding. In addition, we discuss the biomedical implications of these findings for our ability to dissect the molecular role(s) of non-coding genetic variants in complex traits, including disease susceptibility.}, language = {English}, number = {3}, urldate = {2017-06-22}, journal = {Cell}, author = {Deplancke, Bart and Alpern, Daniel and Gardeux, Vincent}, month = jul, year = {2016}, pmid = {27471964}, pages = {538--554}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/T7E8QFWA/Deplancke et al. - 2016 - The Genetics of Transcription Factor DNA Binding V.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/V7R8ZBU4/S0092-8674(16)30918-7.html:text/html} } @article{birney_allele-specific_2010, title = {Allele-specific and heritable chromatin signatures in humans}, volume = {19}, issn = {0964-6906}, url = {https://academic.oup.com/hmg/article/19/R2/R204/640861/Allele-specific-and-heritable-chromatin-signatures}, doi = {10.1093/hmg/ddq404}, number = {R2}, urldate = {2017-07-12}, journal = {Human Molecular Genetics}, author = {Birney, Ewan and Lieb, Jason D. and Furey, Terrence S. and Crawford, Gregory E. and Iyer, Vishwanath R.}, month = oct, year = {2010}, pages = {R204--R209}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/M7K7MBWQ/Birney et al. - 2010 - Allele-specific and heritable chromatin signatures.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/8ED43FEZ/ddq404.html:text/html} } @article{nielsen_catchprofiles:_2012, title = {{CATCHprofiles}: {Clustering} and {Alignment} {Tool} for {ChIP} {Profiles}}, volume = {7}, issn = {1932-6203}, shorttitle = {{CATCHprofiles}}, url = {http://journals.plos.org/plosone/article?id=10.1371/journal.pone.0028272}, doi = {10.1371/journal.pone.0028272}, abstract = {Chromatin Immuno Precipitation (ChIP) profiling detects in vivo protein-DNA binding, and has revealed a large combinatorial complexity in the binding of chromatin associated proteins and their post-translational modifications. To fully explore the spatial and combinatorial patterns in ChIP-profiling data and detect potentially meaningful patterns, the areas of enrichment must be aligned and clustered, which is an algorithmically and computationally challenging task. We have developed CATCHprofiles, a novel tool for exhaustive pattern detection in ChIP profiling data. CATCHprofiles is built upon a computationally efficient implementation for the exhaustive alignment and hierarchical clustering of ChIP profiling data. The tool features a graphical interface for examination and browsing of the clustering results. CATCHprofiles requires no prior knowledge about functional sites, detects known binding patterns “ab initio”, and enables the detection of new patterns from ChIP data at a high resolution, exemplified by the detection of asymmetric histone and histone modification patterns around H2A.Z-enriched sites. CATCHprofiles' capability for exhaustive analysis combined with its ease-of-use makes it an invaluable tool for explorative research based on ChIP profiling data. CATCHprofiles and the CATCH algorithm run on all platforms and is available for free through the CATCH website: http://catch.cmbi.ru.nl/. User support is available by subscribing to the mailing list catch-users@bioinformatics.org.}, number = {1}, urldate = {2017-07-20}, journal = {PLOS ONE}, author = {Nielsen, Fiona G. G. and Markus, Kasper Galschiøt and Friborg, Rune Møllegaard and Favrholdt, Lene Monrad and Stunnenberg, Hendrik G. and Huynen, Martijn}, month = jan, year = {2012}, keywords = {Sequence alignment, Algorithms, DNA-binding proteins, Nucleosomes, Histones, Genome analysis, Histone modification, Genomic signal processing}, pages = {e28272}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/C5N4PK8T/Nielsen et al. - 2012 - CATCHprofiles Clustering and Alignment Tool for C.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UKZNEK7P/article.html:text/html} } @article{dalton_clustering_2009, title = {Clustering {Algorithms}: {On} {Learning}, {Validation}, {Performance}, and {Applications} to {Genomics}}, volume = {10}, issn = {1389-2029}, shorttitle = {Clustering {Algorithms}}, url = {http://www.ncbi.nlm.nih.gov/pmc/articles/PMC2766793/}, doi = {10.2174/138920209789177601}, abstract = {The development of microarray technology has enabled scientists to measure the expression of thousands of genes simultaneously, resulting in a surge of interest in several disciplines throughout biology and medicine. While data clustering has been used for decades in image processing and pattern recognition, in recent years it has joined this wave of activity as a popular technique to analyze microarrays. To illustrate its application to genomics, clustering applied to genes from a set of microarray data groups together those genes whose expression levels exhibit similar behavior throughout the samples, and when applied to samples it offers the potential to discriminate pathologies based on their differential patterns of gene expression. Although clustering has now been used for many years in the context of gene expression microarrays, it has remained highly problematic. The choice of a clustering algorithm and validation index is not a trivial one, more so when applying them to high throughput biological or medical data. Factors to consider when choosing an algorithm include the nature of the application, the characteristics of the objects to be analyzed, the expected number and shape of the clusters, and the complexity of the problem versus computational power available. In some cases a very simple algorithm may be appropriate to tackle a problem, but many situations may require a more complex and powerful algorithm better suited for the job at hand. In this paper, we will cover the theoretical aspects of clustering, including error and learning, followed by an overview of popular clustering algorithms and classical validation indices. We also discuss the relative performance of these algorithms and indices and conclude with examples of the application of clustering to computational biology.}, number = {6}, journal = {Current Genomics}, author = {Dalton, Lori and Ballarin, Virginia and Brun, Marcel}, month = sep, year = {2009}, pmid = {20190957}, pmcid = {PMC2766793}, pages = {430--445}, file = {PubMed Central Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9CNCMQR7/Dalton et al. - 2009 - Clustering Algorithms On Learning, Validation, Pe.pdf:application/pdf} } @article{rodriguez_clustering_2014, title = {Clustering by fast search and find of density peaks}, volume = {344}, copyright = {Copyright © 2014, American Association for the Advancement of Science}, issn = {0036-8075, 1095-9203}, url = {http://science.sciencemag.org/content/344/6191/1492}, doi = {10.1126/science.1242072}, abstract = {Discerning clusters of data points Cluster analysis is used in many disciplines to group objects according to a defined measure of distance. Numerous algorithms exist, some based on the analysis of the local density of data points, and others on predefined probability distributions. Rodriguez and Laio devised a method in which the cluster centers are recognized as local density maxima that are far away from any points of higher density. The algorithm depends only on the relative densities rather than their absolute values. The authors tested the method on a series of data sets, and its performance compared favorably to that of established techniques. Science, this issue p. 1492 Cluster analysis is aimed at classifying elements into categories on the basis of their similarity. Its applications range from astronomy to bioinformatics, bibliometrics, and pattern recognition. We propose an approach based on the idea that cluster centers are characterized by a higher density than their neighbors and by a relatively large distance from points with higher densities. This idea forms the basis of a clustering procedure in which the number of clusters arises intuitively, outliers are automatically spotted and excluded from the analysis, and clusters are recognized regardless of their shape and of the dimensionality of the space in which they are embedded. We demonstrate the power of the algorithm on several test cases. Local density of points is ranked and analyzed to categorize data. Local density of points is ranked and analyzed to categorize data.}, language = {en}, number = {6191}, urldate = {2017-08-07}, journal = {Science}, author = {Rodriguez, Alex and Laio, Alessandro}, month = jun, year = {2014}, pmid = {24970081}, pages = {1492--1496}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/A8TS2M3Z/Rodriguez et Laio - 2014 - Clustering by fast search and find of density peak.pdf:application/pdf;Rodriguez.SM.pdf:/home/romaingroux/.zotero/zotero/mgp9vo2c.default/zotero/storage/A8TS2M3Z/Rodriguez.SM.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/BFPAPNRQ/1492.html:text/html} } @article{grant_fimo:_2011, title = {{FIMO}: scanning for occurrences of a given motif}, volume = {27}, issn = {1367-4803}, shorttitle = {{FIMO}}, url = {https://academic.oup.com/bioinformatics/article/27/7/1017/232614/FIMO-scanning-for-occurrences-of-a-given-motif}, doi = {10.1093/bioinformatics/btr064}, abstract = {Summary: A motif is a short DNA or protein sequence that contributes to the biological function of the sequence in which it resides. Over the past several decades, many computational methods have been described for identifying, characterizing and searching with sequence motifs. Critical to nearly any motif-based sequence analysis pipeline is the ability to scan a sequence database for occurrences of a given motif described by a position-specific frequency matrix.Results: We describe Find Individual Motif Occurrences (FIMO), a software tool for scanning DNA or protein sequences with motifs described as position-specific scoring matrices. The program computes a log-likelihood ratio score for each position in a given sequence database, uses established dynamic programming methods to convert this score to a P-value and then applies false discovery rate analysis to estimate a q-value for each position in the given sequence. FIMO provides output in a variety of formats, including HTML, XML and several Santa Cruz Genome Browser formats. The program is efficient, allowing for the scanning of DNA sequences at a rate of 3.5 Mb/s on a single CPU.Availability and Implementation: FIMO is part of the MEME Suite software toolkit. A web server and source code are available at http://meme.sdsc.edu.Contact:t.bailey@imb.uq.edu.au; t.bailey@imb.uq.edu.auSupplementary information:Supplementary data are available at Bioinformatics online.}, number = {7}, urldate = {2017-08-30}, journal = {Bioinformatics}, author = {Grant, Charles E. and Bailey, Timothy L. and Noble, William Stafford}, month = apr, year = {2011}, pages = {1017--1018}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/EJG8BJ8F/Grant et al. - 2011 - FIMO scanning for occurrences of a given motif.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/DIAU79C4/btr064.html:text/html} } @article{beckstette_fast_2006, title = {Fast index based algorithms and software for matching position specific scoring matrices}, volume = {7}, issn = {1471-2105}, url = {https://doi.org/10.1186/1471-2105-7-389}, doi = {10.1186/1471-2105-7-389}, abstract = {In biological sequence analysis, position specific scoring matrices (PSSMs) are widely used to represent sequence motifs in nucleotide as well as amino acid sequences. Searching with PSSMs in complete genomes or large sequence databases is a common, but computationally expensive task.}, journal = {BMC Bioinformatics}, author = {Beckstette, Michael and Homann, Robert and Giegerich, Robert and Kurtz, Stefan}, month = aug, year = {2006}, pages = {389}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/DVPWJ2C6/Beckstette et al. - 2006 - Fast index based algorithms and software for match.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/REDQ96S6/1471-2105-7-389.html:text/html} } @article{raykov_what_2016, title = {What to {Do} {When} {K}-{Means} {Clustering} {Fails}: {A} {Simple} yet {Principled} {Alternative} {Algorithm}}, volume = {11}, issn = {1932-6203}, shorttitle = {What to {Do} {When} {K}-{Means} {Clustering} {Fails}}, url = {http://journals.plos.org/plosone/article?id=10.1371/journal.pone.0162259}, doi = {10.1371/journal.pone.0162259}, abstract = {The K-means algorithm is one of the most popular clustering algorithms in current use as it is relatively fast yet simple to understand and deploy in practice. Nevertheless, its use entails certain restrictive assumptions about the data, the negative consequences of which are not always immediately apparent, as we demonstrate. While more flexible algorithms have been developed, their widespread use has been hindered by their computational and technical complexity. Motivated by these considerations, we present a flexible alternative to K-means that relaxes most of the assumptions, whilst remaining almost as fast and simple. This novel algorithm which we call MAP-DP (maximum a-posteriori Dirichlet process mixtures), is statistically rigorous as it is based on nonparametric Bayesian Dirichlet process mixture modeling. This approach allows us to overcome most of the limitations imposed by K-means. The number of clusters K is estimated from the data instead of being fixed a-priori as in K-means. In addition, while K-means is restricted to continuous data, the MAP-DP framework can be applied to many kinds of data, for example, binary, count or ordinal data. Also, it can efficiently separate outliers from the data. This additional flexibility does not incur a significant computational overhead compared to K-means with MAP-DP convergence typically achieved in the order of seconds for many practical problems. Finally, in contrast to K-means, since the algorithm is based on an underlying statistical model, the MAP-DP framework can deal with missing data and enables model testing such as cross validation in a principled way. We demonstrate the simplicity and effectiveness of this algorithm on the health informatics problem of clinical sub-typing in a cluster of diseases known as parkinsonism.}, number = {9}, urldate = {2017-10-20}, journal = {PLOS ONE}, author = {Raykov, Yordan P. and Boukouvalas, Alexis and Baig, Fahd and Little, Max A.}, month = sep, year = {2016}, keywords = {Algorithms, Parkinson disease, Radii, Clustering algorithms, Myoclonus, Eyes, Permutation, Random variables}, pages = {e0162259}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/SD4VR3ZM/Raykov et al. - 2016 - What to Do When K-Means Clustering Fails A Simple.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/SCJRU8B8/article.html:text/html} } @article{porro_functional_2014, title = {Functional characterization of the {TERRA} transcriptome at damaged telomeres}, volume = {5}, copyright = {2014 Nature Publishing Group}, issn = {2041-1723}, url = {https://www.nature.com/articles/ncomms6379}, doi = {10.1038/ncomms6379}, abstract = {{\textless}p{\textgreater} -Telomere uncapping in senescent cells is accompanied by loss of the TRF2 telomere capping factor and upregulation of the long noncoding RNA TERRA. Here the authors characterize the TERRA transcriptome and show that TERRA upregulation may promote SUV39H1 recruitment, H3K9 trimethylation and telomere end-to-end fusions.{\textless}/p{\textgreater}}, - language = {en}, - urldate = {2017-11-21}, - journal = {Nature Communications}, - author = {Porro, Antonio and Feuerhahn, Sascha and Delafontaine, Julien and Riethman, Harold and Rougemont, Jacques and Lingner, Joachim}, - month = oct, - year = {2014}, - pages = {ncomms6379}, - file = {Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/8NVZJNUN/ncomms6379.html:text/html} -} - -@article{porro_functional_2014-1, - title = {Functional characterization of the {TERRA} transcriptome at damaged telomeres}, - volume = {5}, - copyright = {2014 Nature Publishing Group}, - issn = {2041-1723}, - url = {https://www.nature.com/articles/ncomms6379}, - doi = {10.1038/ncomms6379}, - abstract = {{\textless}p{\textgreater} -Telomere uncapping in senescent cells is accompanied by loss of the TRF2 telomere capping factor and upregulation of the long noncoding RNA TERRA. Here the authors characterize the TERRA transcriptome and show that TERRA upregulation may promote SUV39H1 recruitment, H3K9 trimethylation and telomere end-to-end fusions.{\textless}/p{\textgreater}}, - language = {en}, - urldate = {2017-11-21}, - journal = {Nature Communications}, - author = {Porro, Antonio and Feuerhahn, Sascha and Delafontaine, Julien and Riethman, Harold and Rougemont, Jacques and Lingner, Joachim}, - month = oct, - year = {2014}, - pages = {ncomms6379}, - file = {Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/N865WZ9D/ncomms6379.html:text/html} -} - -@misc{noauthor_article_nodate, - title = {Article {Metrics} - {Functional} characterization of the {TERRA} transcriptome at damaged telomeres {\textbar} {Nature} {Communications}}, - copyright = {©2017 Macmillan Publishers Limited. All Rights Reserved.}, - url = {https://www.nature.com/articles/ncomms6379/metrics}, - abstract = {Functional characterization of the TERRA transcriptome at damaged telomeres}, - urldate = {2017-11-21}, - file = {Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7N7ND2WM/metrics.html:text/html} -} - -@article{porro_functional_2014-2, - title = {Functional characterization of the {TERRA} transcriptome at damaged telomeres}, - volume = {5}, - copyright = {2014 Nature Publishing Group}, - issn = {2041-1723}, - url = {https://www.nature.com/articles/ncomms6379}, - doi = {10.1038/ncomms6379}, - abstract = {{\textless}p{\textgreater} Telomere uncapping in senescent cells is accompanied by loss of the TRF2 telomere capping factor and upregulation of the long noncoding RNA TERRA. Here the authors characterize the TERRA transcriptome and show that TERRA upregulation may promote SUV39H1 recruitment, H3K9 trimethylation and telomere end-to-end fusions.{\textless}/p{\textgreater}}, language = {en}, urldate = {2017-11-21}, journal = {Nature Communications}, author = {Porro, Antonio and Feuerhahn, Sascha and Delafontaine, Julien and Riethman, Harold and Rougemont, Jacques and Lingner, Joachim}, month = oct, year = {2014}, pages = {ncomms6379}, file = {Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/C3H58PDX/ncomms6379.html:text/html} } @article{das_survey_2007, title = {A survey of {DNA} motif finding algorithms}, volume = {8}, issn = {1471-2105}, url = {https://doi.org/10.1186/1471-2105-8-S7-S21}, doi = {10.1186/1471-2105-8-S7-S21}, abstract = {Unraveling the mechanisms that regulate gene expression is a major challenge in biology. An important task in this challenge is to identify regulatory elements, especially the binding sites in deoxyribonucleic acid (DNA) for transcription factors. These binding sites are short DNA segments that are called motifs. Recent advances in genome sequence availability and in high-throughput gene expression analysis technologies have allowed for the development of computational methods for motif finding. As a result, a large number of motif finding algorithms have been implemented and applied to various motif models over the past decade. This survey reviews the latest developments in DNA motif finding algorithms.}, number = {7}, journal = {BMC Bioinformatics}, author = {Das, Modan K. and Dai, Ho-Kwok}, month = nov, year = {2007}, pages = {S21}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/TENU8HJ8/Das et Dai - 2007 - A survey of DNA motif finding algorithms.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/FSHUHRF4/1471-2105-8-S7-S21.html:text/html} } @article{haberle_promoter_2016, series = {Transcriptional {Enhancers}}, title = {Promoter architectures and developmental gene regulation}, volume = {57}, issn = {1084-9521}, url = {http://www.sciencedirect.com/science/article/pii/S1084952116300143}, doi = {10.1016/j.semcdb.2016.01.014}, abstract = {Core promoters are minimal regions sufficient to direct accurate initiation of transcription and are crucial for regulation of gene expression. They are highly diverse in terms of associated core promoter motifs, underlying sequence composition and patterns of transcription initiation. Distinctive features of promoters are also seen at the chromatin level, including nucleosome positioning patterns and presence of specific histone modifications. Recent advances in identifying and characterizing promoters using next-generation sequencing-based technologies have provided the basis for their classification into functional groups and have shed light on their modes of regulation, with important implications for transcriptional regulation in development. This review discusses the methodology and the results of genome-wide studies that provided insight into the diversity of RNA polymerase II promoter architectures in vertebrates and other Metazoa, and the association of these architectures with distinct modes of regulation in embryonic development and differentiation.}, journal = {Seminars in Cell \& Developmental Biology}, author = {Haberle, Vanja and Lenhard, Boris}, month = sep, year = {2016}, keywords = {Transcriptional regulation, Core promoter, Transcription start sites, CAGE, Promoter types, Overlapping codes}, pages = {11--23}, file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/U9NFEUEZ/Haberle et Lenhard - 2016 - Promoter architectures and developmental gene regu.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/H7H6IJF4/S1084952116300143.html:text/html} } -@article{haberle_promoter_2016-1, - series = {Transcriptional {Enhancers}}, - title = {Promoter architectures and developmental gene regulation}, - volume = {57}, - issn = {1084-9521}, - url = {http://www.sciencedirect.com/science/article/pii/S1084952116300143}, - doi = {10.1016/j.semcdb.2016.01.014}, - abstract = {Core promoters are minimal regions sufficient to direct accurate initiation of transcription and are crucial for regulation of gene expression. They are highly diverse in terms of associated core promoter motifs, underlying sequence composition and patterns of transcription initiation. Distinctive features of promoters are also seen at the chromatin level, including nucleosome positioning patterns and presence of specific histone modifications. Recent advances in identifying and characterizing promoters using next-generation sequencing-based technologies have provided the basis for their classification into functional groups and have shed light on their modes of regulation, with important implications for transcriptional regulation in development. This review discusses the methodology and the results of genome-wide studies that provided insight into the diversity of RNA polymerase II promoter architectures in vertebrates and other Metazoa, and the association of these architectures with distinct modes of regulation in embryonic development and differentiation.}, - journal = {Seminars in Cell \& Developmental Biology}, - author = {Haberle, Vanja and Lenhard, Boris}, - month = sep, - year = {2016}, - keywords = {Transcriptional regulation, Core promoter, Transcription start sites, CAGE, Promoter types, Overlapping codes}, - pages = {11--23}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/EA3DNP6U/Haberle et Lenhard - 2016 - Promoter architectures and developmental gene regu.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/NM9EJ8GH/S1084952116300143.html:text/html} -} - -@article{haberle_promoter_2016-2, - series = {Transcriptional {Enhancers}}, - title = {Promoter architectures and developmental gene regulation}, - volume = {57}, - issn = {1084-9521}, - url = {http://www.sciencedirect.com/science/article/pii/S1084952116300143}, - doi = {10.1016/j.semcdb.2016.01.014}, - abstract = {Core promoters are minimal regions sufficient to direct accurate initiation of transcription and are crucial for regulation of gene expression. They are highly diverse in terms of associated core promoter motifs, underlying sequence composition and patterns of transcription initiation. Distinctive features of promoters are also seen at the chromatin level, including nucleosome positioning patterns and presence of specific histone modifications. Recent advances in identifying and characterizing promoters using next-generation sequencing-based technologies have provided the basis for their classification into functional groups and have shed light on their modes of regulation, with important implications for transcriptional regulation in development. This review discusses the methodology and the results of genome-wide studies that provided insight into the diversity of RNA polymerase II promoter architectures in vertebrates and other Metazoa, and the association of these architectures with distinct modes of regulation in embryonic development and differentiation.}, - journal = {Seminars in Cell \& Developmental Biology}, - author = {Haberle, Vanja and Lenhard, Boris}, - month = sep, - year = {2016}, - keywords = {Transcriptional regulation, Core promoter, Transcription start sites, CAGE, Promoter types, Overlapping codes}, - pages = {11--23}, - file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/672CF6I6/Haberle et Lenhard - 2016 - Promoter architectures and developmental gene regu.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/VZF2P9ES/S1084952116300143.html:text/html} -} - @article{lenhard_metazoan_2012, title = {Metazoan promoters: emerging characteristics and insights into transcriptional regulation}, volume = {13}, copyright = {2012 Nature Publishing Group}, issn = {1471-0064}, shorttitle = {Metazoan promoters}, url = {https://www.nature.com/articles/nrg3163}, doi = {10.1038/nrg3163}, abstract = {Promoters are crucial for gene regulation. They vary greatly in terms of associated regulatory elements, sequence motifs, the choice of transcription start sites and other features. Several technologies that harness next-generation sequencing have enabled recent advances in identifying promoters and their features, helping researchers who are investigating functional categories of promoters and their modes of regulation. Additional features of promoters that are being characterized include types of histone modifications, nucleosome positioning, RNA polymerase pausing and novel small RNAs. In this Review, we discuss recent findings relating to metazoan promoters and how these findings are leading to a revised picture of what a gene promoter is and how it works.}, language = {en}, number = {4}, urldate = {2018-02-20}, journal = {Nature Reviews Genetics}, author = {Lenhard, Boris and Sandelin, Albin and Carninci, Piero}, month = apr, year = {2012}, pages = {233--245}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/3A4V79DS/Lenhard et al. - 2012 - Metazoan promoters emerging characteristics and i.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/WQFCRVTM/nrg3163.html:text/html} } @article{yang_prevalence_2007, title = {Prevalence of the initiator over the {TATA} box in human and yeast genes and identification of {DNA} motifs enriched in human {TATA}-less core promoters}, volume = {389}, issn = {0378-1119}, url = {http://www.sciencedirect.com/science/article/pii/S0378111906006238}, doi = {10.1016/j.gene.2006.09.029}, abstract = {The core promoter of eukaryotic genes is the minimal DNA region that recruits the basal transcription machinery to direct efficient and accurate transcription initiation. The fraction of human and yeast genes that contain specific core promoter elements such as the TATA box and the initiator (INR) remains unclear and core promoter motifs specific for TATA-less genes remain to be identified. Here, we present genome-scale computational analyses indicating that ∼76\% of human core promoters lack TATA-like elements, have a high GC content, and are enriched in Sp1-binding sites. We further identify two motifs – M3 (SCGGAAGY) and M22 (TGCGCANK) – that occur preferentially in human TATA-less core promoters. About 24\% of human genes have a TATA-like element and their promoters are generally AT-rich; however, only ∼10\% of these TATA-containing promoters have the canonical TATA box (TATAWAWR). In contrast, ∼46\% of human core promoters contain the consensus INR (YYANWYY) and ∼30\% are INR-containing TATA-less genes. Significantly, ∼46\% of human promoters lack both TATA-like and consensus INR elements. Surprisingly, mammalian-type INR sequences are present – and tend to cluster – in the transcription start site (TSS) region of ∼40\% of yeast core promoters and the frequency of specific core promoter types appears to be conserved in yeast and human genomes. Gene Ontology analyses reveal that TATA-less genes in humans, as in yeast, are frequently involved in basic “housekeeping” processes, while TATA-containing genes are more often highly regulated, such as by biotic or stress stimuli. These results reveal unexpected similarities in the occurrence of specific core promoter types and in their associated biological processes in yeast and humans and point to novel vertebrate-specific DNA motifs that might play a selective role in TATA-independent transcription.}, number = {1}, journal = {Gene}, author = {Yang, Chuhu and Bolotin, Eugene and Jiang, Tao and Sladek, Frances M. and Martinez, Ernest}, month = mar, year = {2007}, keywords = {transcription, Genome-wide computational analysis, Core promoter elements, Sp1, ELK-1, M22, Motif distribution}, pages = {52--65}, file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9PU5KSBT/Yang et al. - 2007 - Prevalence of the initiator over the TATA box in h.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/8PZSB8IF/S0378111906006238.html:text/html} } @article{ye_seqminer:_2011, title = {{seqMINER}: an integrated {ChIP}-seq data interpretation platform}, volume = {39}, issn = {0305-1048}, shorttitle = {{seqMINER}}, url = {https://academic.oup.com/nar/article/39/6/e35/2411697}, doi = {10.1093/nar/gkq1287}, abstract = {In a single experiment, chromatin immunoprecipitation combined with high throughput sequencing (ChIP-seq) provides genome-wide information about a given covalent histone modification or transcription factor occupancy. However, time efficient bioinformatics resources for extracting biological meaning out of these gigabyte-scale datasets are often a limiting factor for data interpretation by biologists. We created an integrated portable ChIP-seq data interpretation platform called seqMINER, with optimized performances for efficient handling of multiple genome-wide datasets. seqMINER allows comparison and integration of multiple ChIP-seq datasets and extraction of qualitative as well as quantitative information. seqMINER can handle the biological complexity of most experimental situations and proposes methods to the user for data classification according to the analysed features. In addition, through multiple graphical representations, seqMINER allows visualization and modelling of general as well as specific patterns in a given dataset. To demonstrate the efficiency of seqMINER, we have carried out a comprehensive analysis of genome-wide chromatin modification data in mouse embryonic stem cells to understand the global epigenetic landscape and its change through cellular differentiation.}, language = {en}, number = {6}, urldate = {2018-02-21}, journal = {Nucleic Acids Research}, author = {Ye, Tao and Krebs, Arnaud R. and Choukrallah, Mohamed-Amin and Keime, Celine and Plewniak, Frederic and Davidson, Irwin and Tora, Laszlo}, month = mar, year = {2011}, pages = {e35--e35}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4RHT8HUV/Ye et al. - 2011 - seqMINER an integrated ChIP-seq data interpretati.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UCQ448QG/2411697.html:text/html} } @article{castro-mondragon_rsat_2017, title = {{RSAT} matrix-clustering: dynamic exploration and redundancy reduction of transcription factor binding motif collections}, volume = {45}, issn = {0305-1048}, shorttitle = {{RSAT} matrix-clustering}, url = {https://academic.oup.com/nar/article/45/13/e119/3862068}, doi = {10.1093/nar/gkx314}, abstract = {Transcription factor (TF) databases contain multitudes of binding motifs (TFBMs) from various sources, from which non-redundant collections are derived by manual curation. The advent of high-throughput methods stimulated the production of novel collections with increasing numbers of motifs. Meta-databases, built by merging these collections, contain redundant versions, because available tools are not suited to automatically identify and explore biologically relevant clusters among thousands of motifs. Motif discovery from genome-scale data sets (e.g. ChIP-seq) also produces redundant motifs, hampering the interpretation of results. We present matrix-clustering, a versatile tool that clusters similar TFBMs into multiple trees, and automatically creates non-redundant TFBM collections. A feature unique to matrix-clustering is its dynamic visualisation of aligned TFBMs, and its capability to simultaneously treat multiple collections from various sources. We demonstrate that matrix-clustering considerably simplifies the interpretation of combined results from multiple motif discovery tools, and highlights biologically relevant variations of similar motifs. We also ran a large-scale application to cluster ∼11 000 motifs from 24 entire databases, showing that matrix-clustering correctly groups motifs belonging to the same TF families, and drastically reduced motif redundancy. matrix-clustering is integrated within the RSAT suite (http://rsat.eu/), accessible through a user-friendly web interface or command-line for its integration in pipelines.}, language = {en}, number = {13}, urldate = {2018-03-21}, journal = {Nucleic Acids Research}, author = {Castro-Mondragon, Jaime Abraham and Jaeger, Sébastien and Thieffry, Denis and Thomas-Chollier, Morgane and van Helden, Jacques}, month = jul, year = {2017}, pages = {e119--e119}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/5ZSJZ2JK/Castro-Mondragon et al. - 2017 - RSAT matrix-clustering dynamic exploration and re.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/X54R4KMJ/3862068.html:text/html} } @article{li_cd-hit:_2006, title = {Cd-hit: a fast program for clustering and comparing large sets of protein or nucleotide sequences}, volume = {22}, issn = {1367-4803}, shorttitle = {Cd-hit}, url = {https://academic.oup.com/bioinformatics/article/22/13/1658/194225}, doi = {10.1093/bioinformatics/btl158}, abstract = {Motivation: In 2001 and 2002, we published two papers (Bioinformatics, 17, 282–283, Bioinformatics, 18, 77–82) describing an ultrafast protein sequence clustering program called cd-hit. This program can efficiently cluster a huge protein database with millions of sequences. However, the applications of the underlying algorithm are not limited to only protein sequences clustering, here we present several new programs using the same algorithm including cd-hit-2d, cd-hit-est and cd-hit-est-2d. Cd-hit-2d compares two protein datasets and reports similar matches between them; cd-hit-est clusters a DNA/RNA sequence database and cd-hit-est-2d compares two nucleotide datasets. All these programs can handle huge datasets with millions of sequences and can be hundreds of times faster than methods based on the popular sequence comparison and database search tools, such as BLAST.Availability:Contact:liwz@sdsc.edu}, language = {en}, number = {13}, urldate = {2018-03-21}, journal = {Bioinformatics}, author = {Li, Weizhong and Godzik, Adam}, month = jul, year = {2006}, pages = {1658--1659}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/8PTNE6P7/Li et Godzik - 2006 - Cd-hit a fast program for clustering and comparin.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/C8G49ZEK/194225.html:text/html} } @article{bucher_weight_1990, title = {Weight matrix descriptions of four eukaryotic {RNA} polymerase {II} promoter elements derived from 502 unrelated promoter sequences}, volume = {212}, issn = {0022-2836}, url = {http://www.sciencedirect.com/science/article/pii/0022283690902239}, doi = {10.1016/0022-2836(90)90223-9}, abstract = {Optimized weight matrices defining four major eukaryotic promoter elements, the TATA-box, cap signal, CCAAT-, and GC-box, are presented; they were derived by comparative sequence analysis of 502 unrelated RNA polymerase II promoter regions. The new TATA-box and cap signal descriptions differ in several respects from the only hitherto available base frequency Tables. The CCAAT-box matrix, obtained with no prior assumption but CCAAT being the core of the motif, reflects precisely the sequence specificity of the recently discovered nuclear factor NY-I/CP1 but does not include typical recognition sequences of two other purported CCAAT-binding proteins, CTF and CBP. The GC-box description is longer than the previously proposed consensus sequences but is consistent with Sp1 protein-DNA binding data. The notion of a CACCC element distinct from the GC-box seems not to be justified any longer in view of the new weight matrix. Unlike the two fixed-distance elements, neither the CCAAT- nor the GC-box occurs at significantly high frequency in the upstream regions of non-vertebrate genes. Preliminary attempts to predict promoters with the aid of the new signal descriptions were unexpectedly successful. The new TATA-box matrix locates eukaryotic transcription initiation sites as reliably as do the best currently available methods to map Escherichia coli promoters. This analysis was made possible by the recently established Eukaryotic Promoter Database (EPD) of the EMBL Nucleotide Sequence Data Library. In order to derive the weight matrices, a novel algorithm has been devised that is generally applicable to sequence motifs positionally correlated with a biologically defined position in the sequences. The signal must be sufficiently over-represented in a particular region relative to the given site, but need not be present in all members of the input sequence collection. The algorithm iteratively redefines the set of putative motif representatives from which a weight matrix is derived, so as to maximize a quantitative measure of local over-representation, an optimization criterion that naturally combines structural and positional constancy. A comprehensive description of the technique is presented in Methods and Data.}, number = {4}, journal = {Journal of Molecular Biology}, author = {Bucher, Philipp}, month = apr, year = {1990}, pages = {563--578}, file = {Bucher90.pdf:/home/romaingroux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Bucher90.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/KSDSN7JT/0022283690902239.html:text/html} } @article{buenrostro_transposition_2013, title = {Transposition of native chromatin for fast and sensitive epigenomic profiling of open chromatin, {DNA}-binding proteins and nucleosome position}, volume = {10}, copyright = {2013 Nature Publishing Group}, issn = {1548-7105}, url = {https://www.nature.com/articles/nmeth.2688}, doi = {10.1038/nmeth.2688}, abstract = {We describe an assay for transposase-accessible chromatin using sequencing (ATAC-seq), based on direct in vitro transposition of sequencing adaptors into native chromatin, as a rapid and sensitive method for integrative epigenomic analysis. ATAC-seq captures open chromatin sites using a simple two-step protocol with 500–50,000 cells and reveals the interplay between genomic locations of open chromatin, DNA-binding proteins, individual nucleosomes and chromatin compaction at nucleotide resolution. We discovered classes of DNA-binding factors that strictly avoided, could tolerate or tended to overlap with nucleosomes. Using ATAC-seq maps of human CD4+ T cells from a proband obtained on consecutive days, we demonstrated the feasibility of analyzing an individual's epigenome on a timescale compatible with clinical decision-making.}, language = {en}, number = {12}, urldate = {2018-03-23}, journal = {Nature Methods}, author = {Buenrostro, Jason D. and Giresi, Paul G. and Zaba, Lisa C. and Chang, Howard Y. and Greenleaf, William J.}, month = dec, year = {2013}, pages = {1213--1218}, file = {Buenrostro et al. - 2013 - Supplemental.pdf:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/A62IVVST/Buenrostro et al. - 2013 - Supplemental.pdf:application/pdf;Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/A62IVVST/Buenrostro et al. - 2013 - Transposition of native chromatin for fast and sen.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/B4S85K35/nmeth.html:text/html} } -@article{andersson_human_2015, - title = {Human {Gene} {Promoters} {Are} {Intrinsically} {Bidirectional}}, - volume = {60}, - issn = {1097-2765}, - url = {http://www.cell.com/molecular-cell/abstract/S1097-2765(15)00806-0}, - doi = {10.1016/j.molcel.2015.10.015}, - language = {English}, - number = {3}, - urldate = {2018-04-03}, - journal = {Molecular Cell}, - author = {Andersson, Robin and Chen, Yun and Core, Leighton and Lis, John T. and Sandelin, Albin and Jensen, Torben Heick}, - month = nov, - year = {2015}, - pmid = {26545074}, - pages = {346--347}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/VW6MCTID/Andersson et al. - 2015 - Human Gene Promoters Are Intrinsically Bidirection.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6SPGS4R2/S1097-2765(15)00806-0.html:text/html} -} - @article{duttke_human_2015-1, title = {Human {Promoters} {Are} {Intrinsically} {Directional}}, volume = {57}, issn = {1097-2765}, url = {http://www.cell.com/molecular-cell/abstract/S1097-2765(14)01007-7}, doi = {10.1016/j.molcel.2014.12.029}, language = {English}, number = {4}, urldate = {2018-04-03}, journal = {Molecular Cell}, author = {Duttke, Sascha H. C. and Lacadie, Scott A. and Ibrahim, Mahmoud M. and Glass, Christopher K. and Corcoran, David L. and Benner, Christopher and Heinz, Sven and Kadonaga, James T. and Ohler, Uwe}, month = feb, year = {2015}, pmid = {25639469}, pages = {674--684}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/72BCMJ2J/Duttke et al. - 2015 - Human Promoters Are Intrinsically Directional.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/K2P9ZEZV/S1097-2765(14)01007-7.html:text/html} } -@misc{noauthor_pooled_nodate, - title = {Pooled {ChIP}-{Seq} {Links} {Variation} in {Transcription} {Factor} {Binding} to {Complex} {Disease} {Risk}: {Cell}}, - url = {http://www.cell.com/cell/fulltext/S0092-8674(16)30339-7}, - urldate = {2018-04-11} -} - @article{tehranchi_pooled_2016, title = {Pooled {ChIP}-{Seq} {Links} {Variation} in {Transcription} {Factor} {Binding} to {Complex} {Disease} {Risk}}, volume = {165}, issn = {0092-8674, 1097-4172}, url = {http://www.cell.com/cell/abstract/S0092-8674(16)30339-7}, doi = {10.1016/j.cell.2016.03.041}, language = {English}, number = {3}, urldate = {2018-04-11}, journal = {Cell}, author = {Tehranchi, Ashley K. and Myrthil, Marsha and Martin, Trevor and Hie, Brian L. and Golan, David and Fraser, Hunter B.}, month = apr, year = {2016}, pmid = {27087447}, pages = {730--741}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/DIHDRW7A/Tehranchi et al. - 2016 - Pooled ChIP-Seq Links Variation in Transcription F.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/WW7SSNNZ/S0092-8674(16)30339-7.html:text/html} } @article{stormo_identifying_1989, title = {Identifying protein-binding sites from unaligned {DNA} fragments.}, volume = {86}, issn = {0027-8424}, url = {https://www.ncbi.nlm.nih.gov/pmc/articles/PMC286650/}, abstract = {The ability to determine important features within DNA sequences from the sequences alone is becoming essential as large-scale sequencing projects are being undertaken. We present a method that can be applied to the problem of identifying the recognition pattern for a DNA-binding protein given only a collection of sequenced DNA fragments, each known to contain somewhere within it a binding site for that protein. Information about the position or orientation of the binding sites within those fragments is not needed. The method compares the "information content" of a large number of possible binding site alignments to arrive at a matrix representation of the binding site pattern. The specificity of the protein is represented as a matrix, rather than a consensus sequence, allowing patterns that are typical of regulatory protein-binding sites to be identified. The reliability of the method improves as the number of sequences increases, but the time required increases only linearly with the number of sequences. An example, using known cAMP receptor protein-binding sites, illustrates the method.}, number = {4}, journal = {Proceedings of the National Academy of Sciences of the United States of America}, author = {Stormo, G D and Hartzell, G W}, month = feb, year = {1989}, pmid = {2919167}, pmcid = {PMC286650}, pages = {1183--1187}, file = {PubMed Central Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/P8H57Z5V/Stormo et Hartzell - 1989 - Identifying protein-binding sites from unaligned D.pdf:application/pdf} } @article{li_sequence_2002, title = {Sequence clustering strategies improve remote homology recognitions while reducing search times}, volume = {15}, issn = {1741-0126}, url = {https://academic.oup.com/peds/article/15/8/643/1532107}, doi = {10.1093/protein/15.8.643}, abstract = {Abstract. Sequence databases are rapidly growing, thereby increasing the coverage of protein sequence space, but this coverage is uneven because most sequencin}, language = {en}, number = {8}, urldate = {2018-06-21}, journal = {Protein Engineering, Design and Selection}, author = {Li, Weizhong and Jaroszewski, Lukasz and Godzik, Adam}, month = aug, year = {2002}, pages = {643--649}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/8UE54UA8/Li et al. - 2002 - Sequence clustering strategies improve remote homo.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/D343QNAZ/1532107.html:text/html} } @article{schaid_genome-wide_2018, title = {From genome-wide associations to candidate causal variants by statistical fine-mapping}, volume = {19}, copyright = {2018 Macmillan Publishers Ltd., part of Springer Nature}, issn = {1471-0064}, url = {https://www.nature.com/articles/s41576-018-0016-z}, doi = {10.1038/s41576-018-0016-z}, abstract = {Fine-mapping is the process by which a trait-associated region from a genome-wide association study (GWAS) is analysed to identify the particular genetic variants that are likely to causally influence the examined trait. This Review discusses the diverse statistical approaches to fine-mapping and their foundations, strengths and limitations, including integration of trans-ethnic human population data and functional annotations.}, language = {en}, number = {8}, urldate = {2018-07-17}, journal = {Nature Reviews Genetics}, author = {Schaid, Daniel J. and Chen, Wenan and Larson, Nicholas B.}, month = aug, year = {2018}, pages = {491--504}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9DTQSD64/Schaid et al. - 2018 - From genome-wide associations to candidate causal .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HF3NTMN5/s41576-018-0016-z.html:text/html} } @article{andreatta_gibbscluster:_2017, title = {{GibbsCluster}: unsupervised clustering and alignment of peptide sequences}, volume = {45}, issn = {0305-1048}, shorttitle = {{GibbsCluster}}, url = {https://academic.oup.com/nar/article/45/W1/W458/3605637}, doi = {10.1093/nar/gkx248}, abstract = {Abstract. Receptor interactions with short linear peptide fragments (ligands) are at the base of many biological signaling processes. Conserved and information}, language = {en}, number = {W1}, urldate = {2018-08-07}, journal = {Nucleic Acids Research}, author = {Andreatta, Massimo and Alvarez, Bruno and Nielsen, Morten}, month = jul, year = {2017}, pages = {W458--W463}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GVGDMPB9/Andreatta et al. - 2017 - GibbsCluster unsupervised clustering and alignmen.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/TFSVZ862/3605637.html:text/html} } @article{andreatta_simultaneous_2013, title = {Simultaneous alignment and clustering of peptide data using a {Gibbs} sampling approach}, volume = {29}, issn = {1367-4803}, url = {https://academic.oup.com/bioinformatics/article/29/1/8/272260}, doi = {10.1093/bioinformatics/bts621}, abstract = {Abstract. Motivation: Proteins recognizing short peptide fragments play a central role in cellular signaling. As a result of high-throughput technologies, pept}, language = {en}, number = {1}, urldate = {2018-08-08}, journal = {Bioinformatics}, author = {Andreatta, Massimo and Lund, Ole and Nielsen, Morten}, month = jan, year = {2013}, pages = {8--14}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UHJ8FJM4/Andreatta et al. - 2013 - Simultaneous alignment and clustering of peptide d.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/2ZQ6BW86/272260.html:text/html} } @article{lawrence_detecting_1993, title = {Detecting subtle sequence signals: a {Gibbs} sampling strategy for multiple alignment}, volume = {262}, copyright = {© 1993}, issn = {0036-8075, 1095-9203}, shorttitle = {Detecting subtle sequence signals}, url = {http://science.sciencemag.org/content/262/5131/208}, doi = {10.1126/science.8211139}, abstract = {A wealth of protein and DNA sequence data is being generated by genome projects and other sequencing efforts. A crucial barrier to deciphering these sequences and understanding the relations among them is the difficulty of detecting subtle local residue patterns common to multiple sequences. Such patterns frequently reflect similar molecular structures and biological properties. A mathematical definition of this "local multiple alignment" problem suitable for full computer automation has been used to develop a new and sensitive algorithm, based on the statistical method of iterative sampling. This algorithm finds an optimized local alignment model for N sequences in N-linear time, requiring only seconds on current workstations, and allows the simultaneous detection and optimization of multiple patterns and pattern repeats. The method is illustrated as applied to helix-turn-helix proteins, lipocalins, and prenyltransferases.}, language = {en}, number = {5131}, urldate = {2018-08-15}, journal = {Science}, author = {Lawrence, C. E. and Altschul, S. F. and Boguski, M. S. and Liu, J. S. and Neuwald, A. F. and Wootton, J. C.}, month = oct, year = {1993}, pmid = {8211139}, pages = {208--214}, file = {Lawrence93.pdf:/home/romaingroux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Lawrence93.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/327XWVSX/208.html:text/html} } -@article{leisch_article_nodate, - title = {@{Article}\{, author = \{{Friedrich} {Leisch}\}, title = \{{A} {Toolbox} for {K}-{Centroids} {Cluster} {Analysis}\}, journal = \{{Computational} {Statistics} and {Data} {Analysis}\}, year = \{2006\}, volume = \{51\}, number = \{2\}, pages = \{526--544\}, \}}, - author = {Leisch, Friedrich} -} - @article{rosenbloom_encode_2013, title = {{ENCODE} {Data} in the {UCSC} {Genome} {Browser}: year 5 update}, volume = {41}, issn = {0305-1048}, shorttitle = {{ENCODE} {Data} in the {UCSC} {Genome} {Browser}}, url = {https://academic.oup.com/nar/article/41/D1/D56/1066727}, doi = {10.1093/nar/gks1172}, abstract = {Abstract. The Encyclopedia of DNA Elements (ENCODE), http://encodeproject.org, has completed its fifth year of scientific collaboration to create a comprehensi}, language = {en}, number = {D1}, urldate = {2018-09-24}, journal = {Nucleic Acids Research}, author = {Rosenbloom, Kate R. and Sloan, Cricket A. and Malladi, Venkat S. and Dreszer, Timothy R. and Learned, Katrina and Kirkup, Vanessa M. and Wong, Matthew C. and Maddren, Morgan and Fang, Ruihua and Heitner, Steven G. and Lee, Brian T. and Barber, Galt P. and Harte, Rachel A. and Diekhans, Mark and Long, Jeffrey C. and Wilder, Steven P. and Zweig, Ann S. and Karolchik, Donna and Kuhn, Robert M. and Haussler, David and Kent, W. James}, month = jan, year = {2013}, pages = {D56--D63}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HXMKXF6F/Rosenbloom et al. - 2013 - ENCODE Data in the UCSC Genome Browser year 5 upd.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UV7N94N9/1066727.html:text/html} } @article{bailey_meme_2009, title = {{MEME} {Suite}: tools for motif discovery and searching}, volume = {37}, issn = {0305-1048}, shorttitle = {{MEME} {Suite}}, url = {https://academic.oup.com/nar/article/37/suppl_2/W202/1135092}, doi = {10.1093/nar/gkp335}, abstract = {Abstract. The MEME Suite web server provides a unified portal for online discovery and analysis of sequence motifs representing features such as DNA binding si}, language = {en}, number = {suppl\_2}, urldate = {2018-09-25}, journal = {Nucleic Acids Research}, author = {Bailey, Timothy L. and Boden, Mikael and Buske, Fabian A. and Frith, Martin and Grant, Charles E. and Clementi, Luca and Ren, Jingyuan and Li, Wilfred W. and Noble, William S.}, month = jul, year = {2009}, pages = {W202--W208}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/FSJB5Q2B/Bailey et al. - 2009 - MEME Suite tools for motif discovery and searchin.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/84WXK6RS/1135092.html:text/html} } @article{dreos_mga_2018, title = {{MGA} repository: a curated data resource for {ChIP}-seq and other genome annotated data}, volume = {46}, issn = {0305-1048}, shorttitle = {{MGA} repository}, url = {https://academic.oup.com/nar/article/46/D1/D175/4563313}, doi = {10.1093/nar/gkx995}, abstract = {Abstract. The Mass Genome Annotation (MGA) repository is a resource designed to store published next generation sequencing data and other genome annotation dat}, language = {en}, number = {D1}, urldate = {2018-10-02}, journal = {Nucleic Acids Research}, author = {Dreos, René and Ambrosini, Giovanna and Groux, Romain and Périer, Rouayda Cavin and Bucher, Philipp}, month = jan, year = {2018}, pages = {D175--D180}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/B3GGR38V/Dréos et al. - 2018 - MGA repository a curated data resource for ChIP-s.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9VUC447P/4563313.html:text/html} } @article{ambrosini_pwmscan:_2018, title = {{PWMScan}: a fast tool for scanning entire genomes with a position-specific weight matrix}, volume = {34}, issn = {1367-4803}, shorttitle = {{PWMScan}}, url = {https://academic.oup.com/bioinformatics/article/34/14/2483/4921176}, doi = {10.1093/bioinformatics/bty127}, abstract = {AbstractSummary. Transcription factors regulate gene expression by binding to specific short DNA sequences of 5–20 bp to regulate the rate of transcription of}, language = {en}, number = {14}, urldate = {2018-10-31}, journal = {Bioinformatics}, author = {Ambrosini, Giovanna and Groux, Romain and Bucher, Philipp}, month = jul, year = {2018}, pages = {2483--2484}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7BG8Z46H/Ambrosini et al. - 2018 - PWMScan a fast tool for scanning entire genomes w.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/KDHTMW7B/4921176.html:text/html} } @article{kulakovskiy_hocomoco:_2018, title = {{HOCOMOCO}: towards a complete collection of transcription factor binding models for human and mouse via large-scale {ChIP}-{Seq} analysis}, volume = {46}, issn = {0305-1048}, shorttitle = {{HOCOMOCO}}, url = {https://academic.oup.com/nar/article/46/D1/D252/4616875}, doi = {10.1093/nar/gkx1106}, abstract = {Abstract. We present a major update of the HOCOMOCO collection that consists of patterns describing DNA binding specificities for human and mouse transcription}, language = {en}, number = {D1}, urldate = {2018-10-31}, journal = {Nucleic Acids Research}, author = {Kulakovskiy, Ivan V. and Vorontsov, Ilya E. and Yevshin, Ivan S. and Sharipov, Ruslan N. and Fedorova, Alla D. and Rumynskiy, Eugene I. and Medvedeva, Yulia A. and Magana-Mora, Arturo and Bajic, Vladimir B. and Papatsenko, Dmitry A. and Kolpakov, Fedor A. and Makeev, Vsevolod J.}, month = jan, year = {2018}, pages = {D252--D259}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/M43KTC5T/Kulakovskiy et al. - 2018 - HOCOMOCO towards a complete collection of transcr.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/99VQ7MZK/4616875.html:text/html} } @article{khan_jaspar_2018, title = {{JASPAR} 2018: update of the open-access database of transcription factor binding profiles and its web framework}, volume = {46}, issn = {0305-1048}, shorttitle = {{JASPAR} 2018}, url = {https://academic.oup.com/nar/article/46/D1/D260/4621338}, doi = {10.1093/nar/gkx1126}, abstract = {Abstract. JASPAR (http://jaspar.genereg.net) is an open-access database of curated, non-redundant transcription factor (TF)-binding profiles stored as position}, language = {en}, number = {D1}, urldate = {2018-10-31}, journal = {Nucleic Acids Research}, author = {Khan, Aziz and Fornes, Oriol and Stigliani, Arnaud and Gheorghe, Marius and Castro-Mondragon, Jaime A. and van der Lee, Robin and Bessy, Adrien and Chèneby, Jeanne and Kulkarni, Shubhada R. and Tan, Ge and Baranasic, Damir and Arenillas, David J. and Sandelin, Albin and Vandepoele, Klaas and Lenhard, Boris and Ballester, Benoît and Wasserman, Wyeth W. and Parcy, François and Mathelier, Anthony}, month = jan, year = {2018}, pages = {D260--D266}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/TZUMWSCF/Khan et al. - 2018 - JASPAR 2018 update of the open-access database of.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/EUQZE2J9/4621338.html:text/html} } @article{chatr-aryamontri_biogrid_2017, title = {The {BioGRID} interaction database: 2017 update}, volume = {45}, issn = {0305-1048}, shorttitle = {The {BioGRID} interaction database}, url = {https://academic.oup.com/nar/article/45/D1/D369/2681732}, doi = {10.1093/nar/gkw1102}, abstract = {Abstract. The Biological General Repository for Interaction Datasets (BioGRID: https://thebiogrid.org) is an open access database dedicated to the annotation a}, language = {en}, number = {D1}, urldate = {2018-10-31}, journal = {Nucleic Acids Research}, author = {Chatr-aryamontri, Andrew and Oughtred, Rose and Boucher, Lorrie and Rust, Jennifer and Chang, Christie and Kolas, Nadine K. and O'Donnell, Lara and Oster, Sara and Theesfeld, Chandra and Sellam, Adnane and Stark, Chris and Breitkreutz, Bobby-Joe and Dolinski, Kara and Tyers, Mike}, month = jan, year = {2017}, pages = {D369--D379}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/V5XI5JI8/Chatr-aryamontri et al. - 2017 - The BioGRID interaction database 2017 update.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/R63HKK9T/2681732.html:text/html} } @article{djebali_landscape_2012, title = {Landscape of transcription in human cells}, volume = {489}, copyright = {2012 Nature Publishing Group}, issn = {1476-4687}, url = {https://www.nature.com/articles/nature11233}, doi = {10.1038/nature11233}, abstract = {Eukaryotic cells make many types of primary and processed RNAs that are found either in specific subcellular compartments or throughout the cells. A complete catalogue of these RNAs is not yet available and their characteristic subcellular localizations are also poorly understood. Because RNA represents the direct output of the genetic information encoded by genomes and a significant proportion of a cell’s regulatory capabilities are focused on its synthesis, processing, transport, modification and translation, the generation of such a catalogue is crucial for understanding genome function. Here we report evidence that three-quarters of the human genome is capable of being transcribed, as well as observations about the range and levels of expression, localization, processing fates, regulatory regions and modifications of almost all currently annotated and thousands of previously unannotated RNAs. These observations, taken together, prompt a redefinition of the concept of a gene.}, language = {en}, number = {7414}, urldate = {2018-11-12}, journal = {Nature}, author = {Djebali, Sarah and Davis, Carrie A. and Merkel, Angelika and Dobin, Alex and Lassmann, Timo and Mortazavi, Ali and Tanzer, Andrea and Lagarde, Julien and Lin, Wei and Schlesinger, Felix and Xue, Chenghai and Marinov, Georgi K. and Khatun, Jainab and Williams, Brian A. and Zaleski, Chris and Rozowsky, Joel and Röder, Maik and Kokocinski, Felix and Abdelhamid, Rehab F. and Alioto, Tyler and Antoshechkin, Igor and Baer, Michael T. and Bar, Nadav S. and Batut, Philippe and Bell, Kimberly and Bell, Ian and Chakrabortty, Sudipto and Chen, Xian and Chrast, Jacqueline and Curado, Joao and Derrien, Thomas and Drenkow, Jorg and Dumais, Erica and Dumais, Jacqueline and Duttagupta, Radha and Falconnet, Emilie and Fastuca, Meagan and Fejes-Toth, Kata and Ferreira, Pedro and Foissac, Sylvain and Fullwood, Melissa J. and Gao, Hui and Gonzalez, David and Gordon, Assaf and Gunawardena, Harsha and Howald, Cedric and Jha, Sonali and Johnson, Rory and Kapranov, Philipp and King, Brandon and Kingswood, Colin and Luo, Oscar J. and Park, Eddie and Persaud, Kimberly and Preall, Jonathan B. and Ribeca, Paolo and Risk, Brian and Robyr, Daniel and Sammeth, Michael and Schaffer, Lorian and See, Lei-Hoon and Shahab, Atif and Skancke, Jorgen and Suzuki, Ana Maria and Takahashi, Hazuki and Tilgner, Hagen and Trout, Diane and Walters, Nathalie and Wang, Huaien and Wrobel, John and Yu, Yanbao and Ruan, Xiaoan and Hayashizaki, Yoshihide and Harrow, Jennifer and Gerstein, Mark and Hubbard, Tim and Reymond, Alexandre and Antonarakis, Stylianos E. and Hannon, Gregory and Giddings, Morgan C. and Ruan, Yijun and Wold, Barbara and Carninci, Piero and Guigó, Roderic and Gingeras, Thomas R.}, month = sep, year = {2012}, pages = {101--108}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/C2Q2SUSC/Djebali et al. - 2012 - Landscape of transcription in human cells.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XJEIHF3I/nature11233.html:text/html} } @article{hesselberth_global_2009, title = {Global mapping of protein-{DNA} interactions \textit{in vivo} by digital genomic footprinting}, volume = {6}, copyright = {2009 Nature Publishing Group}, issn = {1548-7105}, url = {https://www.nature.com/articles/nmeth.1313}, doi = {10.1038/nmeth.1313}, abstract = {The orchestrated binding of transcriptional activators and repressors to specific DNA sequences in the context of chromatin defines the regulatory program of eukaryotic genomes. We developed a digital approach to assay regulatory protein occupancy on genomic DNA in vivo by dense mapping of individual DNase I cleavages from intact nuclei using massively parallel DNA sequencing. Analysis of {\textgreater}23 million cleavages across the Saccharomyces cerevisiae genome revealed thousands of protected regulatory protein footprints, enabling de novo derivation of factor binding motifs and the identification of hundreds of new binding sites for major regulators. We observed striking correspondence between single-nucleotide resolution DNase I cleavage patterns and protein-DNA interactions determined by crystallography. The data also yielded a detailed view of larger chromatin features including positioned nucleosomes flanking factor binding regions. Digital genomic footprinting should be a powerful approach to delineate the cis-regulatory framework of any organism with an available genome sequence.}, language = {en}, number = {4}, urldate = {2018-11-14}, journal = {Nature Methods}, author = {Hesselberth, Jay R. and Chen, Xiaoyu and Zhang, Zhihong and Sabo, Peter J. and Sandstrom, Richard and Reynolds, Alex P. and Thurman, Robert E. and Neph, Shane and Kuehn, Michael S. and Noble, William S. and Fields, Stanley and Stamatoyannopoulos, John A.}, month = apr, year = {2009}, pages = {283--289}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ZV93EHPT/Hesselberth et al. - 2009 - Global mapping of protein-DNA interactions iin v.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/8G6VRRWP/nmeth.html:text/html} } @article{hon_chromasig:_2008, title = {{ChromaSig}: {A} {Probabilistic} {Approach} to {Finding} {Common} {Chromatin} {Signatures} in the {Human} {Genome}}, volume = {4}, issn = {1553-7358}, shorttitle = {{ChromaSig}}, url = {https://journals.plos.org/ploscompbiol/article?id=10.1371/journal.pcbi.1000201}, doi = {10.1371/journal.pcbi.1000201}, abstract = {Computational methods to identify functional genomic elements using genetic information have been very successful in determining gene structure and in identifying a handful of cis-regulatory elements. But the vast majority of regulatory elements have yet to be discovered, and it has become increasingly apparent that their discovery will not come from using genetic information alone. Recently, high-throughput technologies have enabled the creation of information-rich epigenetic maps, most notably for histone modifications. However, tools that search for functional elements using this epigenetic information have been lacking. Here, we describe an unsupervised learning method called ChromaSig to find, in an unbiased fashion, commonly occurring chromatin signatures in both tiling microarray and sequencing data. Applying this algorithm to nine chromatin marks across a 1\% sampling of the human genome in HeLa cells, we recover eight clusters of distinct chromatin signatures, five of which correspond to known patterns associated with transcriptional promoters and enhancers. Interestingly, we observe that the distinct chromatin signatures found at enhancers mark distinct functional classes of enhancers in terms of transcription factor and coactivator binding. In addition, we identify three clusters of novel chromatin signatures that contain evolutionarily conserved sequences and potential cis-regulatory elements. Applying ChromaSig to a panel of 21 chromatin marks mapped genomewide by ChIP-Seq reveals 16 classes of genomic elements marked by distinct chromatin signatures. Interestingly, four classes containing enrichment for repressive histone modifications appear to be locally heterochromatic sites and are enriched in quickly evolving regions of the genome. The utility of this approach in uncovering novel, functionally significant genomic elements will aid future efforts of genome annotation via chromatin modifications.}, language = {en}, number = {10}, urldate = {2018-11-20}, journal = {PLOS Computational Biology}, author = {Hon, Gary and Ren, Bing and Wang, Wei}, month = oct, year = {2008}, keywords = {Chromatin, Transcription Factors, Sequence motif analysis, Histones, Histone modification, Chromatin modification, HeLa cells, T cells}, pages = {e1000201}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/K6CUWFD9/Hon et al. - 2008 - ChromaSig A Probabilistic Approach to Finding Com.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UJZ2MCBQ/article.html:text/html} } @inproceedings{arthur_k-means++:_2007, address = {Philadelphia, PA, USA}, series = {{SODA} '07}, title = {K-means++: {The} {Advantages} of {Careful} {Seeding}}, isbn = {978-0-89871-624-5}, shorttitle = {K-means++}, url = {http://dl.acm.org/citation.cfm?id=1283383.1283494}, abstract = {The k-means method is a widely used clustering technique that seeks to minimize the average squared distance between points in the same cluster. Although it offers no accuracy guarantees, its simplicity and speed are very appealing in practice. By augmenting k-means with a very simple, randomized seeding technique, we obtain an algorithm that is Θ(logk)-competitive with the optimal clustering. Preliminary experiments show that our augmentation improves both the speed and the accuracy of k-means, often quite dramatically.}, booktitle = {Proceedings of the {Eighteenth} {Annual} {ACM}-{SIAM} {Symposium} on {Discrete} {Algorithms}}, publisher = {Society for Industrial and Applied Mathematics}, author = {Arthur, David and Vassilvitskii, Sergei}, year = {2007}, pages = {1027--1035}, file = {ACM Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/62ET8WNZ/Arthur et Vassilvitskii - 2007 - K-means++ The Advantages of Careful Seeding.pdf:application/pdf} } @article{lake_integrative_2018, title = {Integrative single-cell analysis of transcriptional and epigenetic states in the human adult brain}, volume = {36}, copyright = {2017 Nature Publishing Group}, issn = {1546-1696}, url = {https://www.nature.com/articles/nbt.4038}, doi = {10.1038/nbt.4038}, abstract = {Detailed characterization of the cell types in the human brain requires scalable experimental approaches to examine multiple aspects of the molecular state of individual cells, as well as computational integration of the data to produce unified cell-state annotations. Here we report improved high-throughput methods for single-nucleus droplet-based sequencing (snDrop-seq) and single-cell transposome hypersensitive site sequencing (scTHS-seq). We used each method to acquire nuclear transcriptomic and DNA accessibility maps for {\textgreater}60,000 single cells from human adult visual cortex, frontal cortex, and cerebellum. Integration of these data revealed regulatory elements and transcription factors that underlie cell-type distinctions, providing a basis for the study of complex processes in the brain, such as genetic programs that coordinate adult remyelination. We also mapped disease-associated risk variants to specific cellular populations, which provided insights into normal and pathogenic cellular processes in the human brain. This integrative multi-omics approach permits more detailed single-cell interrogation of complex organs and tissues.}, language = {en}, number = {1}, urldate = {2018-12-03}, journal = {Nature Biotechnology}, author = {Lake, Blue B. and Chen, Song and Sos, Brandon C. and Fan, Jean and Kaeser, Gwendolyn E. and Yung, Yun C. and Duong, Thu E. and Gao, Derek and Chun, Jerold and Kharchenko, Peter V. and Zhang, Kun}, month = jan, year = {2018}, pages = {70--80}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/HKGMDM7S/Lake et al. - 2018 - Integrative single-cell analysis of transcriptiona.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Z795VVN2/nbt.html:text/html} } @article{gardeux_asap:_2017, title = {{ASAP}: a web-based platform for the analysis and interactive visualization of single-cell {RNA}-seq data}, volume = {33}, issn = {1367-4803}, shorttitle = {{ASAP}}, url = {https://academic.oup.com/bioinformatics/article/33/19/3123/3852081}, doi = {10.1093/bioinformatics/btx337}, abstract = {AbstractMotivation. Single-cell RNA-sequencing (scRNA-seq) allows whole transcriptome profiling of thousands of individual cells, enabling the molecular explor}, language = {en}, number = {19}, urldate = {2018-12-03}, journal = {Bioinformatics}, author = {Gardeux, Vincent and David, Fabrice P. A. and Shajkofci, Adrian and Schwalie, Petra C. and Deplancke, Bart}, month = oct, year = {2017}, pages = {3123--3125}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GCZ8VF92/Gardeux et al. - 2017 - ASAP a web-based platform for the analysis and in.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/I8CFAWH8/3852081.html:text/html} } @article{conway_xenometool_2012, title = {Xenome—a tool for classifying reads from xenograft samples}, volume = {28}, issn = {1367-4803}, url = {https://academic.oup.com/bioinformatics/article/28/12/i172/269972}, doi = {10.1093/bioinformatics/bts236}, abstract = {Abstract. Motivation: Shotgun sequence read data derived from xenograft material contains a mixture of reads arising from the host and reads arising from the g}, language = {en}, number = {12}, urldate = {2018-12-04}, journal = {Bioinformatics}, author = {Conway, Thomas and Wazny, Jeremy and Bromage, Andrew and Tymms, Martin and Sooraj, Dhanya and Williams, Elizabeth D. and Beresford-Smith, Bryan}, month = jun, year = {2012}, pages = {i172--i178}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6IWBVCKR/Conway et al. - 2012 - Xenome—a tool for classifying reads from xenograft.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/E48ISGNC/269972.html:text/html} } @article{ernst_chromhmm:_2012, title = {{ChromHMM}: automating chromatin-state discovery and characterization}, volume = {9}, copyright = {2012 Nature Publishing Group}, issn = {1548-7105}, shorttitle = {{ChromHMM}}, url = {https://www.nature.com/articles/nmeth.1906}, doi = {10.1038/nmeth.1906}, abstract = {ChromHMM: automating chromatin-state discovery and characterization}, language = {en}, number = {3}, urldate = {2018-12-04}, journal = {Nature Methods}, author = {Ernst, Jason and Kellis, Manolis}, month = mar, year = {2012}, pages = {215--216}, file = {Ernst et Kellis - 2012 supplementals .pdf:/home/romaingroux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ADS9BET6/Ernst et Kellis - 2012 supplementals .pdf:application/pdf;Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ADS9BET6/Ernst et Kellis - 2012 - ChromHMM automating chromatin-state discovery and.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7PGXJ6UM/nmeth.html:text/html} } @article{hwang_single-cell_2018, title = {Single-cell {RNA} sequencing technologies and bioinformatics pipelines}, volume = {50}, copyright = {2018 The Author(s)}, issn = {2092-6413}, url = {https://www.nature.com/articles/s12276-018-0071-8}, doi = {10.1038/s12276-018-0071-8}, abstract = {Showing which genes are expressed, or switched on, in individual cells may help to reveal the first signs of disease. Each cell in an organism contains the same genetic information, but cell type and behavior depend on which genes are expressed. Previously, researchers could only sequence cells in batches, averaging the results, but technological improvements now allow sequencing of the genes expressed in an individual cell, known as single-cell RNA sequencing (scRNA-seq). Ji Hyun Lee (Kyung Hee University, Seoul) and Duhee Bang and Byungjin Hwang (Yonsei University, Seoul) have reviewed the available scRNA-seq technologies and the strategies available to analyze the large quantities of data produced. They conclude that scRNA-seq will impact both basic and medical science, from illuminating drug resistance in cancer to revealing the complex pathways of cell differentiation during development.}, language = {En}, number = {8}, urldate = {2018-12-04}, journal = {Experimental \& Molecular Medicine}, author = {Hwang, Byungjin and Lee, Ji Hyun and Bang, Duhee}, month = aug, year = {2018}, pages = {96}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/MISMSQTX/Hwang et al. - 2018 - Single-cell RNA sequencing technologies and bioinf.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/STGSTEGK/s12276-018-0071-8.html:text/html} } @article{angerer_single_2017, series = {Big data acquisition and analysis • {Pharmacology} and drug discovery}, title = {Single cells make big data: {New} challenges and opportunities in transcriptomics}, volume = {4}, issn = {2452-3100}, shorttitle = {Single cells make big data}, url = {http://www.sciencedirect.com/science/article/pii/S245231001730077X}, doi = {10.1016/j.coisb.2017.07.004}, abstract = {Recent technological advances have enabled unprecedented insight into transcriptomics at the level of single cells. Single cell transcriptomics enables the measurement of transcriptomic information of thousands of single cells in a single experiment. The volume and complexity of resulting data make it a paradigm of big data. Consequently, the field is presented with new scientific and, in particular, analytical challenges where currently no scalable solutions exist. At the same time, exciting opportunities arise from increased resolution of single-cell RNA sequencing data and improved statistical power of ever growing datasets. Big single cell RNA sequencing data promises valuable insights into cellular heterogeneity which may significantly improve our understanding of biology and human disease. This review focuses on single cell transcriptomics and highlights the inherent opportunities and challenges in the context of big data analytics.}, journal = {Current Opinion in Systems Biology}, author = {Angerer, Philipp and Simon, Lukas and Tritschler, Sophie and Wolf, F. Alexander and Fischer, David and Theis, Fabian J.}, month = aug, year = {2017}, keywords = {Machine learning, Single-cell RNA-seq, Big data, Single-cell transcriptomics}, pages = {85--91}, file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/62SIJ6H6/Angerer et al. - 2017 - Single cells make big data New challenges and opp.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/VA9KMV8I/S245231001730077X.html:text/html} } @article{poirion_single-cell_2016, title = {Single-{Cell} {Transcriptomics} {Bioinformatics} and {Computational} {Challenges}}, volume = {7}, issn = {1664-8021}, url = {https://www.frontiersin.org/articles/10.3389/fgene.2016.00163/full}, doi = {10.3389/fgene.2016.00163}, abstract = {The emerging single-cell RNA-Seq (scRNA-Seq) technology holds the promise to revolutionize our understanding of diseases and associated biological processes at an unprecedented resolution. It opens the door to reveal the intercellular heterogeneity and has been employed to a variety of applications, ranging from characterizing cancer cells subpopulations to elucidating tumor resistance mechanisms. Parallel to improving experimental protocols to deal with technological issues, deriving new analytical methods to reveal the complexity in scRNA-Seq data is just as challenging. Here we review the current state-of-the-art bioinformatics tools and methods for scRNA-Seq analysis, as well as addressing some critical analytical challenges that the field faces.}, language = {English}, urldate = {2018-12-04}, journal = {Frontiers in Genetics}, author = {Poirion, Olivier B. and Zhu, Xun and Ching, Travers and Garmire, Lana}, year = {2016}, keywords = {bioinformatics, single-cell genomics, Single-Cell Analysis, heterogeneity, microevolution}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/J8JGKVTK/Poirion et al. - 2016 - Single-Cell Transcriptomics Bioinformatics and Com.pdf:application/pdf} } @article{guo_sincera:_2015, title = {{SINCERA}: {A} {Pipeline} for {Single}-{Cell} {RNA}-{Seq} {Profiling} {Analysis}}, volume = {11}, issn = {1553-7358}, shorttitle = {{SINCERA}}, url = {https://journals.plos.org/ploscompbiol/article?id=10.1371/journal.pcbi.1004575}, doi = {10.1371/journal.pcbi.1004575}, abstract = {A major challenge in developmental biology is to understand the genetic and cellular processes/programs driving organ formation and differentiation of the diverse cell types that comprise the embryo. While recent studies using single cell transcriptome analysis illustrate the power to measure and understand cellular heterogeneity in complex biological systems, processing large amounts of RNA-seq data from heterogeneous cell populations creates the need for readily accessible tools for the analysis of single-cell RNA-seq (scRNA-seq) profiles. The present study presents a generally applicable analytic pipeline (SINCERA: a computational pipeline for SINgle CEll RNA-seq profiling Analysis) for processing scRNA-seq data from a whole organ or sorted cells. The pipeline supports the analysis for: 1) the distinction and identification of major cell types; 2) the identification of cell type specific gene signatures; and 3) the determination of driving forces of given cell types. We applied this pipeline to the RNA-seq analysis of single cells isolated from embryonic mouse lung at E16.5. Through the pipeline analysis, we distinguished major cell types of fetal mouse lung, including epithelial, endothelial, smooth muscle, pericyte, and fibroblast-like cell types, and identified cell type specific gene signatures, bioprocesses, and key regulators. SINCERA is implemented in R, licensed under the GNU General Public License v3, and freely available from CCHMC PBGE website, https://research.cchmc.org/pbge/sincera.html.}, language = {en}, number = {11}, urldate = {2018-12-05}, journal = {PLOS Computational Biology}, author = {Guo, Minzhe and Wang, Hui and Potter, S. Steven and Whitsett, Jeffrey A. and Xu, Yan}, month = nov, year = {2015}, keywords = {Gene regulation, Gene expression, Centrality, Epithelial cells, Lung development, Gene prediction, Transcriptional control, Regulator genes}, pages = {e1004575}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RX9EBPZX/Guo et al. - 2015 - SINCERA A Pipeline for Single-Cell RNA-Seq Profil.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ZPINKUFR/article.html:text/html} } @article{satija_spatial_2015, title = {Spatial reconstruction of single-cell gene expression data}, volume = {33}, copyright = {2015 Nature Publishing Group}, issn = {1546-1696}, url = {https://www.nature.com/articles/nbt.3192}, doi = {10.1038/nbt.3192}, abstract = {Spatial localization is a key determinant of cellular fate and behavior, but methods for spatially resolved, transcriptome-wide gene expression profiling across complex tissues are lacking. RNA staining methods assay only a small number of transcripts, whereas single-cell RNA-seq, which measures global gene expression, separates cells from their native spatial context. Here we present Seurat, a computational strategy to infer cellular localization by integrating single-cell RNA-seq data with in situ RNA patterns. We applied Seurat to spatially map 851 single cells from dissociated zebrafish (Danio rerio) embryos and generated a transcriptome-wide map of spatial patterning. We confirmed Seurat's accuracy using several experimental approaches, then used the strategy to identify a set of archetypal expression patterns and spatial markers. Seurat correctly localizes rare subpopulations, accurately mapping both spatially restricted and scattered groups. Seurat will be applicable to mapping cellular localization within complex patterned tissues in diverse systems.}, language = {en}, number = {5}, urldate = {2018-12-05}, journal = {Nature Biotechnology}, author = {Satija, Rahul and Farrell, Jeffrey A. and Gennert, David and Schier, Alexander F. and Regev, Aviv}, month = may, year = {2015}, pages = {495--502}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/IPFURHTU/Satija et al. - 2015 - Spatial reconstruction of single-cell gene express.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/Q4FSVTQ5/nbt.html:text/html} } @article{finak_mast:_2015, title = {{MAST}: a flexible statistical framework for assessing transcriptional changes and characterizing heterogeneity in single-cell {RNA} sequencing data}, volume = {16}, issn = {1474-760X}, shorttitle = {{MAST}}, url = {https://doi.org/10.1186/s13059-015-0844-5}, doi = {10.1186/s13059-015-0844-5}, abstract = {Single-cell transcriptomics reveals gene expression heterogeneity but suffers from stochastic dropout and characteristic bimodal expression distributions in which expression is either strongly non-zero or non-detectable. We propose a two-part, generalized linear model for such bimodal data that parameterizes both of these features. We argue that the cellular detection rate, the fraction of genes expressed in a cell, should be adjusted for as a source of nuisance variation. Our model provides gene set enrichment analysis tailored to single-cell data. It provides insights into how networks of co-expressed genes evolve across an experimental treatment. MAST is available at https://github.com/RGLab/MAST.}, number = {1}, journal = {Genome Biology}, author = {Finak, Greg and McDavid, Andrew and Yajima, Masanao and Deng, Jingyuan and Gersuk, Vivian and Shalek, Alex K. and Slichter, Chloe K. and Miller, Hannah W. and McElrath, M. Juliana and Prlic, Martin and Linsley, Peter S. and Gottardo, Raphael}, month = dec, year = {2015}, pages = {278}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/F86SBQ72/Finak et al. - 2015 - MAST a flexible statistical framework for assessi.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/KMMCHHVM/s13059-015-0844-5.html:text/html} } @article{fan_characterizing_2016, title = {Characterizing transcriptional heterogeneity through pathway and gene set overdispersion analysis}, volume = {13}, copyright = {2016 Nature Publishing Group}, issn = {1548-7105}, url = {https://www.nature.com/articles/nmeth.3734}, doi = {10.1038/nmeth.3734}, abstract = {The transcriptional state of a cell reflects a variety of biological factors, from cell-type-specific features to transient processes such as the cell cycle, all of which may be of interest. However, identifying such aspects from noisy single-cell RNA-seq data remains challenging. We developed pathway and gene set overdispersion analysis (PAGODA) to resolve multiple, potentially overlapping aspects of transcriptional heterogeneity by testing gene sets for coordinated variability among measured cells.}, language = {en}, number = {3}, urldate = {2018-12-05}, journal = {Nature Methods}, author = {Fan, Jean and Salathia, Neeraj and Liu, Rui and Kaeser, Gwendolyn E. and Yung, Yun C. and Herman, Joseph L. and Kaper, Fiona and Fan, Jian-Bing and Zhang, Kun and Chun, Jerold and Kharchenko, Peter V.}, month = mar, year = {2016}, pages = {241--244}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/IHVKTAAS/Fan et al. - 2016 - Characterizing transcriptional heterogeneity throu.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7ZP93GHG/nmeth.html:text/html} } @article{kiselev_sc3:_2017, title = {{SC}3: consensus clustering of single-cell {RNA}-seq data}, volume = {14}, copyright = {2017 Nature Publishing Group}, issn = {1548-7105}, shorttitle = {{SC}3}, url = {https://www.nature.com/articles/nmeth.4236}, doi = {10.1038/nmeth.4236}, abstract = {Single-cell RNA-seq enables the quantitative characterization of cell types based on global transcriptome profiles. We present single-cell consensus clustering (SC3), a user-friendly tool for unsupervised clustering, which achieves high accuracy and robustness by combining multiple clustering solutions through a consensus approach (http://bioconductor.org/packages/SC3). We demonstrate that SC3 is capable of identifying subclones from the transcriptomes of neoplastic cells collected from patients.}, language = {en}, number = {5}, urldate = {2018-12-05}, journal = {Nature Methods}, author = {Kiselev, Vladimir Yu and Kirschner, Kristina and Schaub, Michael T. and Andrews, Tallulah and Yiu, Andrew and Chandra, Tamir and Natarajan, Kedar N. and Reik, Wolf and Barahona, Mauricio and Green, Anthony R. and Hemberg, Martin}, month = may, year = {2017}, pages = {483--486}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RJHM5C3T/Kiselev et al. - 2017 - SC3 consensus clustering of single-cell RNA-seq d.pdf:application/pdf;Kiselev et al. - 2017 - Supplementals.pdf:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/62HT7SUC/Kiselev et al. - 2017 - Supplementals.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/FKGFKJWC/nmeth.html:text/html} } @article{gonzalez-blas_cis-topic_2018, title = {Cis-topic modelling of single cell epigenomes}, copyright = {© 2018, Posted by Cold Spring Harbor Laboratory. The copyright holder for this pre-print is the author. All rights reserved. The material may not be redistributed, re-used or adapted without the author's permission.}, url = {https://www.biorxiv.org/content/early/2018/07/16/370346}, doi = {10.1101/370346}, abstract = {Single-cell epigenomics provides new opportunities to decipher genomic regulatory programs from heterogeneous samples and dynamic processes. We present a probabilistic framework called cisTopic, to simultaneously discover "cis-regulatory topics" and stable cell states from sparse single-cell epigenomics data. After benchmarking cisTopic on single-cell ATAC-seq data, single-cell DNA methylation data, and semi-simulated single-cell ChIP-seq data, we use cisTopic to predict regulatory programs in the human brain and validate these by aligning them with co-expression networks derived from single-cell RNA-seq data. Next, we performed a time-series single-cell ATAC-seq experiment after SOX10 perturbations in melanoma cultures, where cisTopic revealed dynamic regulatory topics driven by SOX10 and AP-1. Finally, machine learning and enhancer modelling approaches allowed to predict cell type specific SOX10 and SOX9 binding sites based on topic specific co-regulatory motifs. cisTopic is available as an R/Bioconductor package at http://github.com/aertslab/cistopic.}, language = {en}, urldate = {2018-12-10}, journal = {bioRxiv}, author = {González-Blas, Carmen Bravo and Minnoye, Liesbeth and Papasokrati, Dafni and Aibar, Sara and Hulselmans, Gert and Christiaens, Valerie and Davie, Kristofer and Wouters, Jasper and Aerts, Stein}, month = jul, year = {2018}, pages = {370346}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6YTUEV8W/González-Blas et al. - 2018 - Cis-topic modelling of single cell epigenomes.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/H72ELCGI/370346.html:text/html} } @article{aibar_scenic:_2017, title = {{SCENIC}: single-cell regulatory network inference and clustering}, volume = {14}, copyright = {2017 Nature Publishing Group}, issn = {1548-7105}, shorttitle = {{SCENIC}}, url = {https://www.nature.com/articles/nmeth.4463}, doi = {10.1038/nmeth.4463}, abstract = {We present SCENIC, a computational method for simultaneous gene regulatory network reconstruction and cell-state identification from single-cell RNA-seq data (http://scenic.aertslab.org). On a compendium of single-cell data from tumors and brain, we demonstrate that cis-regulatory analysis can be exploited to guide the identification of transcription factors and cell states. SCENIC provides critical biological insights into the mechanisms driving cellular heterogeneity.}, language = {en}, number = {11}, urldate = {2018-12-10}, journal = {Nature Methods}, author = {Aibar, Sara and González-Blas, Carmen Bravo and Moerman, Thomas and Huynh-Thu, Vân Anh and Imrichova, Hana and Hulselmans, Gert and Rambow, Florian and Marine, Jean-Christophe and Geurts, Pierre and Aerts, Jan and van den Oord, Joost and Atak, Zeynep Kalender and Wouters, Jasper and Aerts, Stein}, month = nov, year = {2017}, pages = {1083--1086}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/SXK75H8W/Aibar et al. - 2017 - SCENIC single-cell regulatory network inference a.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/LZTL22E5/nmeth.html:text/html} } @article{zerbino_ensembl_2015, title = {The {Ensembl} {Regulatory} {Build}}, volume = {16}, issn = {1465-6906}, url = {https://doi.org/10.1186/s13059-015-0621-5}, doi = {10.1186/s13059-015-0621-5}, abstract = {Most genomic variants associated with phenotypic traits or disease do not fall within gene coding regions, but in regulatory regions, rendering their interpretation difficult. We collected public data on epigenetic marks and transcription factor binding in human cell types and used it to construct an intuitive summary of regulatory regions in the human genome. We verified it against independent assays for sensitivity. The Ensembl Regulatory Build will be progressively enriched when more data is made available. It is freely available on the Ensembl browser, from the Ensembl Regulation MySQL database server and in a dedicated track hub.}, number = {1}, urldate = {2018-12-10}, journal = {Genome Biology}, author = {Zerbino, Daniel R. and Wilder, Steven P. and Johnson, Nathan and Juettemann, Thomas and Flicek, Paul R.}, month = mar, year = {2015}, pages = {56}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/PUUXY9Q3/Zerbino et al. - 2015 - The Ensembl Regulatory Build.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/3HYDPEH5/s13059-015-0621-5.html:text/html} } @article{cao_joint_2018, title = {Joint profiling of chromatin accessibility and gene expression in thousands of single cells}, volume = {361}, copyright = {Copyright © 2018 The Authors, some rights reserved; exclusive licensee American Association for the Advancement of Science. No claim to original U.S. Government Works. http://www.sciencemag.org/about/science-licenses-journal-article-reuseThis is an article distributed under the terms of the Science Journals Default License.}, issn = {0036-8075, 1095-9203}, url = {http://science.sciencemag.org/content/361/6409/1380}, doi = {10.1126/science.aau0730}, abstract = {Single-cell chromatin and RNA analysis Single-cell analyses have begun to provide insight into the differences among and within the individual cells that make up a tissue or organism. However, technological barriers owing to the small amount of material present in each single cell have prevented parallel analyses. Cao et al. present sci-CAR, a pooled barcode method that jointly analyzes both the RNA transcripts and chromatin profiles of single cells. By applying sci-CAR to lung adenocarcinoma cells and mouse kidney tissue, the authors demonstrate precision in assessing expression and genome accessibility at a genome-wide scale. The approach provides an improvement over bulk analysis, which can be confounded by differing cellular subgroups. Science, this issue p. 1380 Although we can increasingly measure transcription, chromatin, methylation, and other aspects of molecular biology at single-cell resolution, most assays survey only one aspect of cellular biology. Here we describe sci-CAR, a combinatorial indexing–based coassay that jointly profiles chromatin accessibility and mRNA (CAR) in each of thousands of single cells. As a proof of concept, we apply sci-CAR to 4825 cells, including a time series of dexamethasone treatment, as well as to 11,296 cells from the adult mouse kidney. With the resulting data, we compare the pseudotemporal dynamics of chromatin accessibility and gene expression, reconstruct the chromatin accessibility profiles of cell types defined by RNA profiles, and link cis-regulatory sites to their target genes on the basis of the covariance of chromatin accessibility and transcription across large numbers of single cells. A technique termed sci-CAR can assess both chromatin accessibility and RNA transcription at the single-cell level. A technique termed sci-CAR can assess both chromatin accessibility and RNA transcription at the single-cell level.}, language = {en}, number = {6409}, urldate = {2018-12-17}, journal = {Science}, author = {Cao, Junyue and Cusanovich, Darren A. and Ramani, Vijay and Aghamirzaie, Delasa and Pliner, Hannah A. and Hill, Andrew J. and Daza, Riza M. and McFaline-Figueroa, Jose L. and Packer, Jonathan S. and Christiansen, Lena and Steemers, Frank J. and Adey, Andrew C. and Trapnell, Cole and Shendure, Jay}, month = sep, year = {2018}, pmid = {30166440}, pages = {1380--1385}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/SHE8MKCM/Cao et al. - 2018 - Joint profiling of chromatin accessibility and gen.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9JBD4YCU/1380.html:text/html} } @article{kolodziejczyk_technology_2015, title = {The {Technology} and {Biology} of {Single}-{Cell} {RNA} {Sequencing}}, volume = {58}, issn = {1097-2765}, url = {http://www.sciencedirect.com/science/article/pii/S1097276515002610}, doi = {10.1016/j.molcel.2015.04.005}, abstract = {The differences between individual cells can have profound functional consequences, in both unicellular and multicellular organisms. Recently developed single-cell mRNA-sequencing methods enable unbiased, high-throughput, and high-resolution transcriptomic analysis of individual cells. This provides an additional dimension to transcriptomic information relative to traditional methods that profile bulk populations of cells. Already, single-cell RNA-sequencing methods have revealed new biology in terms of the composition of tissues, the dynamics of transcription, and the regulatory relationships between genes. Rapid technological developments at the level of cell capture, phenotyping, molecular biology, and bioinformatics promise an exciting future with numerous biological and medical applications.}, number = {4}, urldate = {2019-01-14}, journal = {Molecular Cell}, author = {Kolodziejczyk, Aleksandra A. and Kim, Jong Kyoung and Svensson, Valentine and Marioni, John C. and Teichmann, Sarah A.}, month = may, year = {2015}, pages = {610--620}, file = {ScienceDirect Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/KH6KQ2M6/Kolodziejczyk et al. - 2015 - The Technology and Biology of Single-Cell RNA Sequ.pdf:application/pdf;ScienceDirect Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/3FC8TUDQ/S1097276515002610.html:text/html} } @article{islam_quantitative_2014, title = {Quantitative single-cell {RNA}-seq with unique molecular identifiers}, volume = {11}, copyright = {2013 Nature Publishing Group}, issn = {1548-7105}, url = {https://www.nature.com/articles/nmeth.2772}, doi = {10.1038/nmeth.2772}, abstract = {Single-cell RNA sequencing (RNA-seq) is a powerful tool to reveal cellular heterogeneity, discover new cell types and characterize tumor microevolution. However, losses in cDNA synthesis and bias in cDNA amplification lead to severe quantitative errors. We show that molecular labels—random sequences that label individual molecules—can nearly eliminate amplification noise, and that microfluidic sample preparation and optimized reagents produce a fivefold improvement in mRNA capture efficiency.}, language = {en}, number = {2}, urldate = {2019-01-14}, journal = {Nature Methods}, author = {Islam, Saiful and Zeisel, Amit and Joost, Simon and La Manno, Gioele and Zajac, Pawel and Kasper, Maria and Lönnerberg, Peter and Linnarsson, Sten}, month = feb, year = {2014}, pages = {163--166}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/UCF3T8UV/Islam et al. - 2014 - Quantitative single-cell RNA-seq with unique molec.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/2YGPMH8E/nmeth.html:text/html} } @article{vallejos_normalizing_2017, title = {Normalizing single-cell {RNA} sequencing data: challenges and opportunities}, volume = {14}, copyright = {2017 Nature Publishing Group}, issn = {1548-7105}, shorttitle = {Normalizing single-cell {RNA} sequencing data}, url = {https://www.nature.com/articles/nmeth.4292}, doi = {10.1038/nmeth.4292}, abstract = {Single-cell transcriptomics is becoming an important component of the molecular biologist's toolkit. A critical step when analyzing data generated using this technology is normalization. However, normalization is typically performed using methods developed for bulk RNA sequencing or even microarray data, and the suitability of these methods for single-cell transcriptomics has not been assessed. We here discuss commonly used normalization approaches and illustrate how these can produce misleading results. Finally, we present alternative approaches and provide recommendations for single-cell RNA sequencing users.}, language = {en}, number = {6}, urldate = {2019-01-17}, journal = {Nature Methods}, author = {Vallejos, Catalina A. and Risso, Davide and Scialdone, Antonio and Dudoit, Sandrine and Marioni, John C.}, month = jun, year = {2017}, pages = {565--571}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/IDFSTNYM/Vallejos et al. - 2017 - Normalizing single-cell RNA sequencing data chall.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/9PV8R8CQ/nmeth.html:text/html} } -@article{aibar_scenic:_2017-1, - title = {{SCENIC}: single-cell regulatory network inference and clustering}, - volume = {14}, - copyright = {2017 Nature Publishing Group}, - issn = {1548-7105}, - shorttitle = {{SCENIC}}, - url = {https://www.nature.com/articles/nmeth.4463}, - doi = {10.1038/nmeth.4463}, - abstract = {We present SCENIC, a computational method for simultaneous gene regulatory network reconstruction and cell-state identification from single-cell RNA-seq data (http://scenic.aertslab.org). On a compendium of single-cell data from tumors and brain, we demonstrate that cis-regulatory analysis can be exploited to guide the identification of transcription factors and cell states. SCENIC provides critical biological insights into the mechanisms driving cellular heterogeneity.}, - language = {en}, - number = {11}, - urldate = {2019-01-21}, - journal = {Nature Methods}, - author = {Aibar, Sara and González-Blas, Carmen Bravo and Moerman, Thomas and Huynh-Thu, Vân Anh and Imrichova, Hana and Hulselmans, Gert and Rambow, Florian and Marine, Jean-Christophe and Geurts, Pierre and Aerts, Jan and van den Oord, Joost and Atak, Zeynep Kalender and Wouters, Jasper and Aerts, Stein}, - month = nov, - year = {2017}, - pages = {1083--1086}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/EPI2PAIJ/Aibar et al. - 2017 - SCENIC single-cell regulatory network inference a.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/5EWIIHC9/nmeth.html:text/html} -} - -@article{satija_spatial_2015-1, - title = {Spatial reconstruction of single-cell gene expression data}, - volume = {33}, - copyright = {2015 Nature Publishing Group}, - issn = {1546-1696}, - url = {https://www.nature.com/articles/nbt.3192}, - doi = {10.1038/nbt.3192}, - abstract = {Spatial localization is a key determinant of cellular fate and behavior, but methods for spatially resolved, transcriptome-wide gene expression profiling across complex tissues are lacking. RNA staining methods assay only a small number of transcripts, whereas single-cell RNA-seq, which measures global gene expression, separates cells from their native spatial context. Here we present Seurat, a computational strategy to infer cellular localization by integrating single-cell RNA-seq data with in situ RNA patterns. We applied Seurat to spatially map 851 single cells from dissociated zebrafish (Danio rerio) embryos and generated a transcriptome-wide map of spatial patterning. We confirmed Seurat's accuracy using several experimental approaches, then used the strategy to identify a set of archetypal expression patterns and spatial markers. Seurat correctly localizes rare subpopulations, accurately mapping both spatially restricted and scattered groups. Seurat will be applicable to mapping cellular localization within complex patterned tissues in diverse systems.}, - language = {en}, - number = {5}, - urldate = {2019-01-21}, - journal = {Nature Biotechnology}, - author = {Satija, Rahul and Farrell, Jeffrey A. and Gennert, David and Schier, Alexander F. and Regev, Aviv}, - month = may, - year = {2015}, - pages = {495--502}, - file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/IL7MIU2T/Satija et al. - 2015 - Spatial reconstruction of single-cell gene express.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/WNYFPAYC/nbt.html:text/html} -} - @article{wang_gene_2018, title = {Gene expression distribution deconvolution in single-cell {RNA} sequencing}, volume = {115}, copyright = {Copyright © 2018 the Author(s). Published by PNAS.. This open access article is distributed under Creative Commons Attribution-NonCommercial-NoDerivatives License 4.0 (CC BY-NC-ND).}, issn = {0027-8424, 1091-6490}, url = {https://www.pnas.org/content/115/28/E6437}, doi = {10.1073/pnas.1721085115}, abstract = {Single-cell RNA sequencing (scRNA-seq) enables the quantification of each gene’s expression distribution across cells, thus allowing the assessment of the dispersion, nonzero fraction, and other aspects of its distribution beyond the mean. These statistical characterizations of the gene expression distribution are critical for understanding expression variation and for selecting marker genes for population heterogeneity. However, scRNA-seq data are noisy, with each cell typically sequenced at low coverage, thus making it difficult to infer properties of the gene expression distribution from raw counts. Based on a reexamination of nine public datasets, we propose a simple technical noise model for scRNA-seq data with unique molecular identifiers (UMI). We develop deconvolution of single-cell expression distribution (DESCEND), a method that deconvolves the true cross-cell gene expression distribution from observed scRNA-seq counts, leading to improved estimates of properties of the distribution such as dispersion and nonzero fraction. DESCEND can adjust for cell-level covariates such as cell size, cell cycle, and batch effects. DESCEND’s noise model and estimation accuracy are further evaluated through comparisons to RNA FISH data, through data splitting and simulations and through its effectiveness in removing known batch effects. We demonstrate how DESCEND can clarify and improve downstream analyses such as finding differentially expressed genes, identifying cell types, and selecting differentiation markers.}, language = {en}, number = {28}, urldate = {2019-01-24}, journal = {Proceedings of the National Academy of Sciences}, author = {Wang, Jingshu and Huang, Mo and Torre, Eduardo and Dueck, Hannah and Shaffer, Sydney and Murray, John and Raj, Arjun and Li, Mingyao and Zhang, Nancy R.}, month = jul, year = {2018}, pmid = {29946020}, keywords = {differential expression, Gini coefficient, highly variable genes, RNA sequencing, single-cell transcriptomics}, pages = {E6437--E6446}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/57DNLDK4/Wang et al. - 2018 - Gene expression distribution deconvolution in sing.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/YUYL4KY2/E6437.html:text/html} } @article{kiselev_challenges_2019, title = {Challenges in unsupervised clustering of single-cell {RNA}-seq data}, copyright = {2018 Springer Nature Limited}, issn = {1471-0064}, url = {https://www.nature.com/articles/s41576-018-0088-9}, doi = {10.1038/s41576-018-0088-9}, abstract = {Single-cell RNA sequencing (scRNA-seq) enables transcriptome-based characterization of the constituent cell types within a heterogeneous sample. However, reliable analysis and biological interpretation typically require optimal use of clustering algorithms. This Review discusses the multiple algorithmic options for clustering scRNA-seq data, including various technical, biological and computational considerations.}, language = {En}, urldate = {2019-01-31}, journal = {Nature Reviews Genetics}, author = {Kiselev, Vladimir Yu and Andrews, Tallulah S. and Hemberg, Martin}, month = jan, year = {2019}, pages = {1}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/YIHZU3GQ/Kiselev et al. - 2019 - Challenges in unsupervised clustering of single-ce.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/BQ9FYZH6/s41576-018-0088-9.html:text/html} } @article{ji_tscan:_2016, title = {{TSCAN}: {Pseudo}-time reconstruction and evaluation in single-cell {RNA}-seq analysis}, volume = {44}, issn = {0305-1048}, shorttitle = {{TSCAN}}, url = {https://academic.oup.com/nar/article/44/13/e117/2457590}, doi = {10.1093/nar/gkw430}, abstract = {Abstract. When analyzing single-cell RNA-seq data, constructing a pseudo-temporal path to order cells based on the gradual transition of their transcriptomes i}, language = {en}, number = {13}, urldate = {2019-02-04}, journal = {Nucleic Acids Research}, author = {Ji, Zhicheng and Ji, Hongkai}, month = jul, year = {2016}, pages = {e117--e117}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/F4AMNTIU/Ji and Ji - 2016 - TSCAN Pseudo-time reconstruction and evaluation i.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/QURDXBZ3/2457590.html:text/html} } @article{kumasaka_high-resolution_2019, title = {High-resolution genetic mapping of putative causal interactions between regions of open chromatin}, volume = {51}, copyright = {2018 The Author(s), under exclusive licence to Springer Nature America, Inc.}, issn = {1546-1718}, url = {https://www.nature.com/articles/s41588-018-0278-6}, doi = {10.1038/s41588-018-0278-6}, abstract = {A Bayesian hierarchical approach identifies over 15,000 causal regulatory interactions in the human genome using ATAC-seq data from 100 individuals. The majority of detected interactions were over distances of \<20 kb, a range where 3C methods perform poorly.}, language = {En}, number = {1}, urldate = {2019-03-14}, journal = {Nature Genetics}, author = {Kumasaka, Natsuhiko and Knights, Andrew J. and Gaffney, Daniel J.}, month = jan, year = {2019}, pages = {128}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/CS8XIVYF/Kumasaka et al. - 2019 - High-resolution genetic mapping of putative causal.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/TIPW979S/s41588-018-0278-6.html:text/html} } @article{grossman_positional_2018, title = {Positional specificity of different transcription factor classes within enhancers}, volume = {115}, copyright = {Copyright © 2018 the Author(s). Published by PNAS.. This open access article is distributed under Creative Commons Attribution-NonCommercial-NoDerivatives License 4.0 (CC BY-NC-ND).}, issn = {0027-8424, 1091-6490}, url = {https://www.pnas.org/content/115/30/E7222}, doi = {10.1073/pnas.1804663115}, abstract = {Gene expression is controlled by sequence-specific transcription factors (TFs), which bind to regulatory sequences in DNA. TF binding occurs in nucleosome-depleted regions of DNA (NDRs), which generally encompass regions with lengths similar to those protected by nucleosomes. However, less is known about where within these regions specific TFs tend to be found. Here, we characterize the positional bias of inferred binding sites for 103 TFs within ∼500,000 NDRs across 47 cell types. We find that distinct classes of TFs display different binding preferences: Some tend to have binding sites toward the edges, some toward the center, and some at other positions within the NDR. These patterns are highly consistent across cell types, suggesting that they may reflect TF-specific intrinsic structural or functional characteristics. In particular, TF classes with binding sites at NDR edges are enriched for those known to interact with histones and chromatin remodelers, whereas TFs with central enrichment interact with other TFs and cofactors such as p300. Our results suggest distinct regiospecific binding patterns and functions of TF classes within enhancers.}, language = {en}, number = {30}, urldate = {2019-04-01}, journal = {Proceedings of the National Academy of Sciences}, author = {Grossman, Sharon R. and Engreitz, Jesse and Ray, John P. and Nguyen, Tung H. and Hacohen, Nir and Lander, Eric S.}, month = jul, year = {2018}, pmid = {29987030}, - keywords = {chromatin structure, gene regulation, genomics, transcription factor binding}, + keywords = {genomics, chromatin structure, gene regulation, transcription factor binding}, pages = {E7222--E7230}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/KFUGBD65/Grossman et al. - 2018 - Positional specificity of different transcription .pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/SJD8DKDS/E7222.html:text/html} } @article{berest_quantification_2018, title = {Quantification of differential transcription factor activity and multiomics-based classification into activators and repressors: {diffTF}}, shorttitle = {Quantification of differential transcription factor activity and multiomics-based classification into activators and repressors}, url = {http://biorxiv.org/lookup/doi/10.1101/368498}, doi = {10.1101/368498}, abstract = {Transcription factor (TF) activity is an important read-out of cellular signalling pathways and thus to assess regulatory differences across conditions. However, current technologies lack the ability to simultaneously assess activity changes for multiple TFs and in particular to determine whether a specific TF acts globally as transcriptional repressor or activator. To this end, we introduce a widely applicable genome-wide method diffTF to assess differential TF activity and to classify TFs as activator or repressor (available at https://git.embl.de/grp-zaugg/diffTF). This is done by integrating any type of genome-wide chromatin accessibility data with RNA-Seq data and in-silico predicted TF binding sites. We corroborated the classification of TFs into repressors and activators by three independent analyses based on enrichments of active/repressive chromatin states, correlation of TF activity with gene expression, and activator- and repressor-specific chromatin footprints. To show the power of diffTF, we present two case studies: First, we applied diffTF in to a large ATAC-Seq/RNA-Seq dataset comparing mutated and unmutated chronic lymphocytic leukemia samples, where we identified dozens of known (40\%) and potentially novel (60\%) TFs that are differentially active. We were also able to classify almost half of them as either repressor and activator. Second, we applied diffTF to a small ATAC-Seq/RNA-Seq data set comparing two cell types along the hematopoietic differentiation trajectory (multipotent progenitors - MPP - versus granulocyte-macrophage progenitors - GMP). Here we identified the known drivers of differentiation and found that the majority of the differentially active TFs are transcriptional activators. Overall, diffTF was able to recover the known TFs in both case studies, additionally identified TFs that have been less well characterized in the given condition, and provides a classification of the TFs into transcriptional activators and repressors.}, language = {en}, urldate = {2019-04-01}, journal = {bioRxiv}, author = {Berest, Ivan and Arnold, Christian and Reyes-Palomares, Armando and Palla, Giovanni and Rasmussen, Kasper Dindler and Helin, Kristian and Zaugg, Judith}, month = dec, year = {2018}, file = {Berest et al. - 2018 - Quantification of differential transcription facto.pdf:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/T89PUHUV/Berest et al. - 2018 - Quantification of differential transcription facto.pdf:application/pdf} } @article{gonzalez-blas_cistopic:_2019, title = {{cisTopic}: cis-regulatory topic modeling on single-cell {ATAC}-seq data}, volume = {16}, copyright = {2019 The Author(s), under exclusive licence to Springer Nature America, Inc.}, issn = {1548-7105}, shorttitle = {{cisTopic}}, url = {https://www.nature.com/articles/s41592-019-0367-1}, doi = {10.1038/s41592-019-0367-1}, abstract = {As an unsupervised Bayesian framework, cisTopic classifies regions in scATAC-seq data into regulatory topics, which are used for clustering.}, language = {En}, number = {5}, urldate = {2019-05-07}, journal = {Nature Methods}, author = {González-Blas, Carmen Bravo and Minnoye, Liesbeth and Papasokrati, Dafni and Aibar, Sara and Hulselmans, Gert and Christiaens, Valerie and Davie, Kristofer and Wouters, Jasper and Aerts, Stein}, month = may, year = {2019}, pages = {397}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/CILUNPYF/González-Blas et al. - 2019 - cisTopic cis-regulatory topic modeling on single-.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/RXHF5XRB/s41592-019-0367-1.html:text/html} } @article{fang_fast_2019, title = {Fast and {Accurate} {Clustering} of {Single} {Cell} {Epigenomes} {Reveals} {Cis}-{Regulatory} {Elements} in {Rare} {Cell} {Types}}, copyright = {© 2019, Posted by Cold Spring Harbor Laboratory. The copyright holder for this pre-print is the author. All rights reserved. The material may not be redistributed, re-used or adapted without the author's permission.}, url = {https://www.biorxiv.org/content/10.1101/615179v1}, doi = {10.1101/615179}, abstract = {{\textless}p{\textgreater}Mammalian tissues are composed of highly specialized cell types defined by distinct gene expression patterns. Identification of cis-regulatory elements responsible for cell-type specific gene expression is essential for understanding the origin of the cellular diversity. Conventional assays to map cis-elements via open chromatin analysis of primary tissues fail to resolve their cell type specificity and lack the sensitivity to identify cis-elements in rare cell types. Single nucleus analysis of transposase-accessible chromatin (ATAC-seq) can overcome this limitation, but current analysis methods begin with pre-defined genomic regions of accessibility and are therefore biased toward the dominant population of a tissue. Here we report a method, Single Nucleus Analysis Pipeline for ATAC-seq (SnapATAC), that can efficiently dissect cellular heterogeneity in an unbiased manner using single nucleus ATAC-seq datasets and identify candidate regulatory sequences in constituent cell types. We demonstrate that SnapATAC outperforms existing methods in both accuracy and scalability. We further analyze 64,795 single cell chromatin profiles from the secondary motor cortex of mouse brain, creating a chromatin landscape atlas with unprecedent resolution, including over 300,000 candidate cis-regulatory elements in nearly 50 distinct cell populations. These results demonstrate a systematic approach for comprehensive analysis of cis-regulatory sequences in the mammalian genomes.{\textless}/p{\textgreater}}, language = {en}, urldate = {2019-05-07}, journal = {bioRxiv}, author = {Fang, Rongxin and Preissl, Sebastian and Hou, Xiaomeng and Lucero, Jacinta and Wang, Xinxin and Motamedi, Amir and Shiau, Andrew K. and Mukamel, Eran A. and Zhang, Yanxiao and Behrens, M. Margarita and Ecker, Joseph and Ren, Bing}, month = apr, year = {2019}, pages = {615179}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/T6VU8VIB/Fang et al. - 2019 - Fast and Accurate Clustering of Single Cell Epigen.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/JKLJNT7V/615179v1.html:text/html} } @article{li_identification_2019, title = {Identification of transcription factor binding sites using {ATAC}-seq}, volume = {20}, issn = {1474-760X}, url = {https://doi.org/10.1186/s13059-019-1642-2}, doi = {10.1186/s13059-019-1642-2}, abstract = {Transposase-Accessible Chromatin followed by sequencing (ATAC-seq) is a simple protocol for detection of open chromatin. Computational footprinting, the search for regions with depletion of cleavage events due to transcription factor binding, is poorly understood for ATAC-seq. We propose the first footprinting method considering ATAC-seq protocol artifacts. HINT-ATAC uses a position dependency model to learn the cleavage preferences of the transposase. We observe strand-specific cleavage patterns around transcription factor binding sites, which are determined by local nucleosome architecture. By incorporating all these biases, HINT-ATAC is able to significantly outperform competing methods in the prediction of transcription factor binding sites with footprints.}, number = {1}, urldate = {2019-05-21}, journal = {Genome Biology}, author = {Li, Zhijian and Schulz, Marcel H. and Look, Thomas and Begemann, Matthias and Zenke, Martin and Costa, Ivan G.}, month = feb, year = {2019}, pages = {45}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/KFNKU6ZM/Li et al. - 2019 - Identification of transcription factor binding sit.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/VISSH4XB/s13059-019-1642-2.html:text/html} } @article{vierstra_genomic_2016, title = {Genomic footprinting}, volume = {13}, copyright = {2016 Nature Publishing Group}, issn = {1548-7105}, url = {https://www.nature.com/articles/nmeth.3768}, doi = {10.1038/nmeth.3768}, abstract = {The advent of DNA footprinting with DNase I more than 35 years ago enabled the systematic analysis of protein-DNA interactions, and the technique has been instrumental in the decoding of cis-regulatory elements and the identification and characterization of transcription factors and other DNA-binding proteins. The ability to analyze millions of individual genomic cleavage events via massively parallel sequencing has enabled in vivo DNase I footprinting on a genomic scale, offering the potential for global analysis of transcription factor occupancy in a single experiment. Genomic footprinting has opened unique vistas on the organization, function and evolution of regulatory DNA; however, the technology is still nascent. Here we discuss both prospects and challenges of genomic footprinting, as well as considerations for its application to complex genomes.}, language = {en}, number = {3}, urldate = {2019-09-30}, journal = {Nature Methods}, author = {Vierstra, Jeff and Stamatoyannopoulos, John A.}, month = mar, year = {2016}, pages = {213--221}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/GTRVMWIS/Vierstra and Stamatoyannopoulos - 2016 - Genomic footprinting.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/F4K3L8EJ/nmeth.html:text/html} } @article{barozzi_co-regulation_2014, title = {Co-regulation of transcription factor binding and nucleosome occupancy through {DNA} features of mammalian enhancers}, volume = {54}, issn = {1097-2765}, url = {https://www.ncbi.nlm.nih.gov/pmc/articles/PMC4048654/}, doi = {10.1016/j.molcel.2014.04.006}, abstract = {Transcription factors (TFs) preferentially bind sites contained in regions of computationally predicted high nucleosomal occupancy, suggesting that nucleosomes are gatekeepers of TF binding sites. However, because of their complexity mammalian genomes contain millions of randomly occurring, unbound TF consensus binding sites. We hypothesized that the information controlling nucleosome assembly may coincide with the information that enables TFs to bind cis-regulatory elements while ignoring randomly occurring sites. Hence, nucleosome would selectively mask genomic sites contacted by TFs and thus potentially functional. The hematopoietic TF Pu.1 maintained nucleosome depletion at macrophage-specific enhancers that displayed a broad range of nucleosome occupancy in other cell types and in reconstituted chromatin. We identified a minimal set of DNA sequence and shape features that accurately predicted both Pu.1 binding and nucleosome occupancy genome-wide. These data reveal a basic organizational principle of mammalian cis-regulatory elements whereby TF recruitment and nucleosome deposition are controlled by overlapping DNA sequence features.}, number = {5}, urldate = {2019-09-30}, journal = {Molecular cell}, author = {Barozzi, Iros and Simonatto, Marta and Bonifacio, Silvia and Yang, Lin and Rohs, Remo and Ghisletti, Serena and Natoli, Gioacchino}, month = jun, year = {2014}, pmid = {24813947}, pmcid = {PMC4048654}, pages = {844--857}, file = {PubMed Central Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/6RTT9G5R/Barozzi et al. - 2014 - Co-regulation of transcription factor binding and .pdf:application/pdf} } @article{adey_rapid_2010, title = {Rapid, low-input, low-bias construction of shotgun fragment libraries by high-density in vitro transposition}, volume = {11}, issn = {1474-760X}, url = {https://doi.org/10.1186/gb-2010-11-12-r119}, doi = {10.1186/gb-2010-11-12-r119}, abstract = {We characterize and extend a highly efficient method for constructing shotgun fragment libraries in which transposase catalyzes in vitro DNA fragmentation and adaptor incorporation simultaneously. We apply this method to sequencing a human genome and find that coverage biases are comparable to those of conventional protocols. We also extend its capabilities by developing protocols for sub-nanogram library construction, exome capture from 50 ng of input DNA, PCR-free and colony PCR library construction, and 96-plex sample indexing.}, number = {12}, urldate = {2019-09-30}, journal = {Genome Biology}, author = {Adey, Andrew and Morrison, Hilary G. and {Asan} and Xun, Xu and Kitzman, Jacob O. and Turner, Emily H. and Stackhouse, Bethany and MacKenzie, Alexandra P. and Caruccio, Nicholas C. and Zhang, Xiuqing and Shendure, Jay}, month = dec, year = {2010}, pages = {R119}, file = {Full Text:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/XYZCW65D/Adey et al. - 2010 - Rapid, low-input, low-bias construction of shotgun.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/ZGDVGS7E/gb-2010-11-12-r119.html:text/html} } @article{berest_quantification_2018-1, title = {Quantification of differential transcription factor activity and multiomics-based classification into activators and repressors: {diffTF}}, copyright = {© 2018, Posted by Cold Spring Harbor Laboratory. This pre-print is available under a Creative Commons License (Attribution-NonCommercial-NoDerivs 4.0 International), CC BY-NC-ND 4.0, as described at http://creativecommons.org/licenses/by-nc-nd/4.0/}, shorttitle = {Quantification of differential transcription factor activity and multiomics-based classification into activators and repressors}, url = {https://www.biorxiv.org/content/10.1101/368498v2}, doi = {10.1101/368498}, abstract = {{\textless}p{\textgreater}Transcription factor (TF) activity is an important read-out of cellular signalling pathways and thus to assess regulatory differences across conditions. However, current technologies lack the ability to simultaneously assess activity changes for multiple TFs and in particular to determine whether a specific TF acts globally as transcriptional repressor or activator. To this end, we introduce a widely applicable genome-wide method \textit{diffTF} to assess differential TF activity and to classify TFs as activator or repressor (available at https://git.embl.de/grp-zaugg/diffTF). This is done by integrating any type of genome-wide chromatin accessibility data with RNA-Seq data and in-silico predicted TF binding sites. We corroborated the classification of TFs into repressors and activators by three independent analyses based on enrichments of active/repressive chromatin states, correlation of TF activity with gene expression, and activator-and repressor-specific chromatin footprints. To show the power of \textit{diffTF}, we present two case studies: First, we applied \textit{diffTF} in to a large ATAC-Seq/RNA-Seq dataset comparing mutated and unmutated chronic lymphocytic leukemia samples, where we identified dozens of known (40\%) and potentially novel (60\%) TFs that are differentially active. We were also able to classify almost half of them as either repressor and activator. Second, we applied \textit{diffTF} to a small ATAC-Seq/RNA-Seq data set comparing two cell types along the hematopoietic differentiation trajectory (multipotent progenitors – MPP – versus granulocyte-macrophage progenitors – GMP). Here we identified the known drivers of differentiation and found that the majority of the differentially active TFs are transcriptional activators. Overall, \textit{diffTF} was able to recover the known TFs in both case studies, additionally identified TFs that have been less well characterized in the given condition, and provides a classification of the TFs into transcriptional activators and repressors.{\textless}/p{\textgreater}}, language = {en}, urldate = {2019-10-01}, journal = {bioRxiv}, author = {Berest, Ivan and Arnold, Christian and Reyes-Palomares, Armando and Palla, Giovanni and Rasmussen, Kasper Dindler and Helin, Kristian and Zaugg, Judith B.}, month = dec, year = {2018}, pages = {368498}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/59JR3A39/Berest et al. - 2018 - Quantification of differential transcription facto.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/EPXLXEGN/368498v2.html:text/html} } @article{klemm_chromatin_2019, title = {Chromatin accessibility and the regulatory epigenome}, volume = {20}, copyright = {2018 Springer Nature Limited}, issn = {1471-0064}, url = {https://www.nature.com/articles/s41576-018-0089-8}, doi = {10.1038/s41576-018-0089-8}, abstract = {Chromatin accessibility comprises the positions, compaction and dynamics of nucleosomes, as well as the occupancy of DNA by other proteins such as transcription factors. In this Review, the authors discuss diverse methods for characterizing chromatin accessibility, how accessibility is determined and remodelled in cells and the regulatory roles of accessibility in gene expression and development.}, language = {en}, number = {4}, urldate = {2019-10-01}, journal = {Nature Reviews Genetics}, author = {Klemm, Sandy L. and Shipony, Zohar and Greenleaf, William J.}, month = apr, year = {2019}, pages = {207--220}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/7M52REY6/Klemm et al. - 2019 - Chromatin accessibility and the regulatory epigeno.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/4Q5BBBWP/s41576-018-0089-8.html:text/html} } @article{groux_spar-k:_2019, title = {{SPar}-{K}: a method to partition {NGS} signal data}, shorttitle = {{SPar}-{K}}, url = {https://academic.oup.com/bioinformatics/advance-article/doi/10.1093/bioinformatics/btz416/5497248}, doi = {10.1093/bioinformatics/btz416}, abstract = {AbstractSummary. We present SPar-K (Signal Partitioning with K-means), a method to search for archetypical chromatin architectures by partitioning a set of gen}, language = {en}, urldate = {2019-10-01}, journal = {Bioinformatics}, author = {Groux, Romain and Bucher, Philipp}, month = may, year = {2019}, file = {Full Text PDF:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/MB4BIGBN/Groux and Bucher - SPar-K a method to partition NGS signal data.pdf:application/pdf;Snapshot:/home/groux/.zotero/zotero/mgp9vo2c.default/zotero/storage/5FDIJ676/5497248.html:text/html} } \ No newline at end of file diff --git a/phd_thesis.pdf b/phd_thesis.pdf index 4e35ae8..681fbb7 100644 Binary files a/phd_thesis.pdf and b/phd_thesis.pdf differ diff --git a/phd_thesis.tex b/phd_thesis.tex index d239fdd..a855078 100755 --- a/phd_thesis.tex +++ b/phd_thesis.tex @@ -1,247 +1,380 @@ \documentclass[12pt]{report} \usepackage{graphicx} \usepackage[round]{natbib} \usepackage[utf8]{inputenc} \usepackage[labelfont=bf]{caption} \usepackage[margin={2.5cm,2.5cm}]{geometry} \usepackage[titletoc,title]{appendix} +\usepackage{amsmath} % for equations with braces and text inside equations +\usepackage{hyperref} % for url \setlength{\columnsep}{20pt} \renewcommand{\familydefault}{\sfdefault} % document \begin{document} \title{Bioinformatic analysis of transcription factor binding sites} \author{Romain Groux} \date{\today} \maketitle \chapter{Plan} \begin{enumerate} \item in vitro data study \begin{itemize} \item the analysis of SMiLE-seq data \end{itemize} \item in vivo data study \begin{itemize} \item SPar-K method \item Chromatin architecture around TFBS \item Motif co-occurence \item Using single-cell ATAC-seq data to create a lexicon of chromatin architectures \end{itemize} \end{enumerate} \chapter{Introduction} TODO \citep{alipanahi_predicting_2015}. \chapter{A study of chromatin accessibility in human blood monocytes} Digital genomic footprinting (DGF) methods are a power powerful mean to reveal protein occupancy, genome-wide, at once \citep{vierstra_genomic_2016}. These methods allow to identify open chromatin regions within a genome and to list its active regulatory sites. These technologies are based on a targeted degradation of the open regions of the genome, either by DNaseI \citep{neph_expansive_2012} or by a transposon-based system \citep{adey_rapid_2010,buenrostro_transposition_2013}. DGF techologies encounter a yet ever-growing popularity because of the wealth of data produced in a single experiment. Indeed, instead of running thousands of chromatin immonuprecitpitation followed by sequencing (ChIP-seq) \citep{barski_high-resolution_2007}, one per transcription factor (TF), to know where each TF is binding, it is sufficient to run a single chromatin accessibility assay. The price to pay for this gain of simplicity, compared to ChIP-seq, is a loss of information. Indeed, chromatin accessibility assays allow to list any active regulatory region within a sample, at once but do not give any information about which TF or complex is bound at a given location The transposon-based method - named assay for transposase-accessible chromatin with high-throughput sequencing (ATAC-seq) - is currently gaining a rapid popularity due to its technical affordability and cheap labor costs compared to DNaseI-based methods. \section{ATAC-seq} \begin{figure}[!htbp] \begin{center} \includegraphics[scale=0.5]{scATAC-seq/figures/ATAC-seq2.png} \captionof{figure}{\textbf{ATAC-seq principle :} ATAC-seq uses a hyperactive Tn5 transposase to simultaneously cleave genomic DNA at accessible loci and ligate adaptors to accessible DNA. These adaptors can serve as sequencing barcodes. A subsequent step of ligation allows to add sequencing adaptors. The released fragments are subjected to massively parallel sequencing of fragment ends (transposition sites) to generate a digital readout of per-nucleotide insertion genome-wide. A footprint is present at the level of the protected nucleotides. Taken and adapted from \citep{vierstra_genomic_2016}.} \label{atac_seq_atac_seq} \end{center} \end{figure} ATAC-seq assays uses a modified Tn5 transposase enzyme to selectively fragment the accessible regions of the genome \citep{adey_rapid_2010,buenrostro_transposition_2013}. The enzyme inserts small double stranded barcodes inside the DNA wherever it is accessible resulting a the creation of double strand breaks (shown in Figure \ref{atac_seq_atac_seq}). This process, known as tagmentation, allows to i) fragment the genome and ii) inserts sequencing primers at once. It should be noted that the Tn5 acts as an homodimer and thus inserts two copy of the same adaptors separated from each other by 9bp \citep{adey_rapid_2010}. For a given genomic locus, the number of insertions depends on several parameters. First, the Tn5 transposition rate itself depends on the enzyme and substrate concentrations. Second, it has been demonstrated that the Tn5 posses a slight sequence preference \citep{adey_rapid_2010}. Finally, the most important parameter is steric hindrance. Stretches of DNA occupied by other proteins, such a transcription factors (TF) binding sites (BS) are protected from degradation. This usually leads to the creation of a characteristic signal at the level of the BS. If we represent the density of transposition events along a given region of the genome, the density usually show a decrease at the level of the BS. This decrease is named “footprint”. The experimental readout of ATAC-seq is produced by sequencing the DNA fragment edges – the transposition sites - by using the inserted tags as sequencing primers. Mapping these sequences against the genome allows to retrieve the insertion sites. If the sequencing is pair-ended, it is possible to know the size of each fragment. \section{Monitoring TF binding} As discusses above, DGF assays are able to highlight active regulatory elements from an entire genome, at once. However, this come with the price of an information loss. First, even if we can identify active loci likely to be bound, we have no direct idea about the identities of the bound TFs. Second, we have no idea about the function of those regions. The function of a region – for instance transcriptional activation or repression - is ultimately bared by the TF and other complexes bound there. Thus delineating a region function necessitate to identify the TF and complexes bound here. Retrieving the identify of the TFs/complexes bound require to implement dedicated strategies. First, it is possible to collect evidences about the identity of TF likely to bind at a given location through a motif analysis. TFs can bind DNA directly through their own DNA binding domain or indirectly, through an interaction with at least on other partner TF which binds DNA directly \citep{neph_expansive_2012}. For a given TF, direct binding events can be detected by monitoring the presence of a binding motif if a specificity model is available. Thus a footprint baring a motif is likely to reflect a direct binding event. However, this method has two important limitations : related TF often share a common DNA specificity. For indirect binding, however, nothing can be done to detect such events. Also, evidences about the presence of biggest complexes can be collected by studying the size of the footprint. Large complexes should leave large footprints. This approach, even if limited is able to pinpoint a handful of candidate TFs. Second, deciphering the functions of the regulatory elements can be undertaken by looking at the footprint produced by a given factor. Indeed, previous studies have showed that activator and repressor TFs tend to produce different types of footprints \citep{berest_quantification_2018}. Also, the spatial positioning of TF motif within the footprint seemed to be linked with the factor functions \citep{grossman_positional_2018}. For instance, factors associated with the regulation of transcription tend to have a motif in the middle of the footprint whereas factors known to interact with chromatin remodeling factors tend to have a footprint at the edge of the footprint, in contact with the surrounding nucleosomes. \section{The advent of single cell DGF} Recently, the advent of single-cell (sc) sequencing technologies have been a real game changer in the field of life science. These technological advances allowed to measure gene expression and chromatin accessibility (scATAC-seq) at a yet unprecedented resolution. As bulk sequencing was providing an average overview of what was going on, single-cell sequencing allows to monitor what is happening in each cell of a population. This advance had a profound impact on genomics for two reasons. First, for the really first time, the heterogeneity of a cell population became accessible and could be studied at the chromatin, transcriptional and protein levels. Second, the possibility of collecting high dimensionality data from tenth of thousands of individuals allows genomics to fully enter in the modern big data era, making commonly used machine learning methods usable as the number of parameters to estimate in the models became smaller than the number of individuals in the data \citep{angerer_single_2017}. \section{A quick overview of scATAC-seq data analysis} So far, most of the single cell technologies are targeted at measuring gene expression through scRNA-seq. Naturally, dedicated algorithms and computational methods have been developed to analyze these data. Currently, the most common types of analyses made are i) data projections and dimensionality reduction such as principal component analysis (PCA), t-stochastic distributed neighbours embedding (t-SNE) or uniform manifold approximation and projection (UMAP) and ii) cell population detection by clustering the cells based on the expression of genes \citep{fan_characterizing_2016, kiselev_sc3:_2017}, by reconstructing gene regulation network \citep{aibar_scenic:_2017} or by identifying cellular states based on the accessible region motif content \citep{gonzalez-blas_cistopic:_2019}. In all cases, the use of scATAC-seq data is to determined whether a region is accessible or not. The downstream analyses characterizes the accessible region using i) the number of reads mapping in these regions as a measure of the accessibility or ii) the sequence content within these accessible regions to determine regulatory topics. \section{Open questions} \begin{figure}[!htbp] \begin{center} \includegraphics[scale=0.5]{scATAC-seq/figures/pipeline.png} \captionof{figure}{\textbf{framework to identify chromatin organization and use them to annotate cellular state :} the scATAC-seq data available in each individual cell are aggregated and used a if it was a bulk sequencing experiment. Regions of interest are listed using peak calling on the the bulk data. The read densities in these regions (center of the peaks +/- a given offset) are measured. The regions are then clustered based on their signal shape to identify different chromatin architectures and create a catalog. These chromatin signatures can then be used to annotate each region of interest in each cell, based on the signal resemblance. The information can be stored as a matrix (M) that can be used for downstream analyses, such as sub-population identification.} \label{atac_seq_pipeline} \end{center} \end{figure} All these methods have shown good performances to identify know and new cell populations [REFERENCES]. However, some issues remains open. First, none of these methods uses DGF data to identify different types of footprints or chromatin architecture, in terms of signal shape, at the single cell level. Second, ATAC-seq measures chromatin accessibility but also provides information about the nucleosome occupancy at accessible genomic regions \citep{buenrostro_transposition_2013}. Thus counting the number of reads mapping at a given loci is, indeed, an indication of accessibility but it does use only a small fraction of the available information. Finally, to date, no study has tried to determine whether what is observed at the bulk level can also be seen at the individual cell level and whether this can be used to infer the molecular state of the cells. -With this project, I design and develop the basements of a computational framework to construct a catalog of prototypical chromatin architectures from single-cell data that can later on be used to annotate individual regions, in single cell. Such a method can be useful to determine cellular molecular state and to group cells accordingly. The entire pipeline is illustrate in Figure \ref{atac_seq_pipeline}. +In this project, I designed and developed the basements of a computational framework to construct a catalog of prototypical chromatin architectures from single-cell data that can later on be used to annotate individual regions, in single cell. Such a method can be useful to determine cellular molecular state and to group cells accordingly. The entire pipeline is illustrate in Figure \ref{atac_seq_pipeline}. + +\section{Data} + +To this end, I choose to work with a publicly available single-cell ATAC-seq dataset from 5'000 human blood monocytes from a healthy donor. These data have been produced by 10xGenomics and are available as part of the advertisement for their single-cell library preparation and data analysis solutions. + +For this reason, several data pre-processing steps have already been performed. Thus working with these data require minimum handling in order to be used. Cell demultiplexing has already been performed. Sequencing adapters sequences have been trimmed. Quality control checks have been performed and show good values. Mapping has been performed on the hg19 genome, peaks have been called and many more downstream analyses results and intermediate data are available. + +Because of these reasons, this dataset offers all the conditions to be used as a standard to develop and benchmark new analyses methods. + +The reads were downloaded in bam format from \url{http://s3-us-west-2.amazonaws.com/10x.files/samples/cell-atac/1.1.0/atac_v1_pbmc_5k/atac_v1_pbmc_5k_possorted_bam.bam} and the peaks called on the aggregated data were downloaded in bed format from \url{http://cf.10xgenomics.com/samples/cell-atac/1.1.0/atac_v1_pbmc_5k/atac_v1_pbmc_5k_peaks.bed}. \section{Identification of catalog of chromatin architectures} The study of signal shape (distribution) has been a quite active field for bulk sequencing experiments during the last decade. Dedicated algorithms \citep{hon_chromasig:_2008} \citep{nielsen_catchprofiles:_2012} \citep{kundaje_ubiquitous_2012} \citep{nair_probabilistic_2014} \citep{groux_spar-k:_2019} have been developed to cluster genomic regions based on their distribution of reads, which reflects their function. The major issue faced where i) to assess whether two regions had the same signal, they had to be properly aligned, ii) even if the regions were properly aligned, they had to be properly oriented and iii) the signal may be sparse due to an sub-optimal sequencing depth. -\subsection{Algorithm to identify over-represented chromatin architecture} +\subsection{EMRead : an algorithm to identify over-represented chromatin architecture} \begin{figure}[!htbp] \begin{center} \includegraphics[scale=0.15]{scATAC-seq/figures/em.png} - \captionof{figure}{\textbf{Expectation-maximization algorithms :} illustration of the algorithms procedure. \textbf{A} Algorithm dedicated to the discovery of over-represented chromatin (EMRead) patterns, as described in \citep{nair_probabilistic_2014}. \textbf{B} Adaptation of the algorithm to discover over-represented DNA motifs (EMSequence). The overall design is the same. Both algorithms model the data has having being sampled from a distribution and perform a maximum-likelihood estimation of the distribution parameters from the data through an iterative procedure.} + \captionof{figure}{\textbf{Expectation-maximization algorithms :} illustration of the algorithms procedure. \textbf{A} illustration of EMRead, an algorithm dedicated to the discovery of over-represented chromatin patterns, as described in \citep{nair_probabilistic_2014}. \textbf{B} illustration of EMSequence, an algorithm to discover over-represented DNA motifs. The overall design is the same. Both algorithms model the data has having being sampled from a distribution and perform a maximum-likelihood estimation of the distribution parameters from the data through an iterative procedure.\\ +EMJoint algorithm is the combination of both EMRead and EMSequence at the same time.} \label{atac_seq_em} \end{center} \end{figure} -Most of the above mentioned algorithms and softwares deal with some of these issues. The probabilistic algorithm developed in \citep{nair_probabilistic_2014} is really interesting. It is a probabilistic partitioning method that softly clusters a sets of genomic regions represented as a vector of counts corresponding to the number of reads (ChIP-seq, DNase-seq) along them. The regions clustered based on their signal shape resemblance. To ensure proper comparisons between the regions, the algorithm allows to offset one region compare to the other to retrieve a similar signal at different offsets and to flip the signal orientation. Finally, it has been demonstrated to be really robust to sparse data. +Most of the above mentioned algorithms and softwares deal with some of these issues. However, the probabilistic algorithm developed by \citep{nair_probabilistic_2014} is really interesting. For the sake of simplicity, let us call it EMRead. EMRead is a probabilistic partitioning method that softly clusters a sets of genomic regions represented as a vector of counts corresponding to the number of reads (ChIP-seq, DNase-seq) along them. The regions clustered based on their signal shape resemblance. To ensure proper comparisons between the regions, the algorithm allows to offset one region compare to the other to retrieve a similar signal at different offsets and to flip the signal orientation. Finally, it has been demonstrated to be really robust to sparse data. This algorithm explicitly models the data has having being generated by sampling from $K$ distinct signal models that corresponds to $K$ different signal classes. Each class is represented by a vector of $L$ values that represented the aggregated signal for that class. This algorithm models the data has having being generated, using a Poisson distribution, from $K$ signal models of lengths $L$. Each class is represented by a vector of $L$ values that represent the mean signal for that class. These values are then the mean parameters of the Poisson distributions This algorithm models the signal over a region of length $L$ has having being sampled from a signal model, using $L$ independent Poisson distributions. The number of reads sequenced over this region is then the result of this sampling procedure. The entire set of regions is assumed to have been generated from $K$ different signal models (classes). Each class is represented by a vector of $L' \le L$ values that represent the expected number of reads at each position for that class. These values are thus the Poisson distribution parameters. In order to discover the $K$ different chromatin signatures in the data, the algorithm proceed to a maximum likelihood estimation of the parameters using an expectation-maximization (EM) framework. Given a set of $K$ models, the likelihoods of each region given each class is computed. A posterior probability of each class given each region can, in turn, be computed. These probabilities can be understood as a soft clustering. The parameters of the classes are updated using a weighted aggregation of the signal. Since each region is computed a probability to belong to each class, it participates to the update of all the classes, with different weights. If the length of the chromatin signature searched $L'