<?xml version='1.0' encoding='utf-8'?>
<eprints xmlns='http://eprints.org/ep2/data/2.0'>
  <eprint id='https://datacompass.lshtm.ac.uk/id/eprint/193'>
    <eprintid>193</eprintid>
    <rev_number>23</rev_number>
    <documents>
      <document id='https://datacompass.lshtm.ac.uk/id/document/1836'>
        <docid>1836</docid>
        <rev_number>2</rev_number>
        <files>
          <file id='https://datacompass.lshtm.ac.uk/id/file/6298'>
            <fileid>6298</fileid>
            <datasetid>document</datasetid>
            <objectid>1836</objectid>
            <filename>AdditionalFile1-TableS1.docx</filename>
            <mime_type>application/vnd.openxmlformats-officedocument.wordprocessingml.document</mime_type>
            <hash>799fab1b2e878ea1fe856bdf67cbbea401def12ec61c6553ed37a1d1e8dd5ace</hash>
            <hash_type>SHA256</hash_type>
            <filesize>57287</filesize>
            <mtime>2016-04-11 09:56:16</mtime>
            <url>https://datacompass.lshtm.ac.uk/id/eprint/193/1/AdditionalFile1-TableS1.docx</url>
          </file>
        </files>
        <eprintid>193</eprintid>
        <pos>1</pos>
        <placement>1</placement>
        <mime_type>application/vnd.openxmlformats-officedocument.wordprocessingml.document</mime_type>
        <format>Dataset</format>
        <language>en</language>
        <security>public</security>
        <license>cc_by</license>
        <main>AdditionalFile1-TableS1.docx</main>
        <content>data</content>
        <retention_period>indefinite</retention_period>
        <formatdesc>The isolates according to geographic location and phenotypic drug resistance</formatdesc>
      </document>
      <document id='https://datacompass.lshtm.ac.uk/id/document/1837'>
        <docid>1837</docid>
        <rev_number>1</rev_number>
        <files>
          <file id='https://datacompass.lshtm.ac.uk/id/file/6304'>
            <fileid>6304</fileid>
            <datasetid>document</datasetid>
            <objectid>1837</objectid>
            <filename>indexcodes.txt</filename>
            <mime_type>text/x-c</mime_type>
            <hash>1f671bd5e6a0de21b03be19dba62bb6bf761a7a9606fd97991fa3c5ebf441361</hash>
            <hash_type>SHA256</hash_type>
            <filesize>3378</filesize>
            <mtime>2016-04-11 10:06:19</mtime>
            <url>https://datacompass.lshtm.ac.uk/id/eprint/193/2/indexcodes.txt</url>
          </file>
        </files>
        <eprintid>193</eprintid>
        <pos>2</pos>
        <placement>2</placement>
        <mime_type>text/x-c</mime_type>
        <format>other</format>
        <language>en</language>
        <security>public</security>
        <main>indexcodes.txt</main>
        <relation>
          <item>
            <type>http://eprints.org/relation/isVersionOf</type>
            <uri>https://datacompass.lshtm.ac.uk/id/document/1836</uri>
          </item>
          <item>
            <type>http://eprints.org/relation/isVolatileVersionOf</type>
            <uri>https://datacompass.lshtm.ac.uk/id/document/1836</uri>
          </item>
          <item>
            <type>http://eprints.org/relation/isIndexCodesVersionOf</type>
            <uri>https://datacompass.lshtm.ac.uk/id/document/1836</uri>
          </item>
        </relation>
        <retention_period>indefinite</retention_period>
        <formatdesc>Generate index codes conversion from Dataset to indexcodes</formatdesc>
      </document>
    </documents>
    <eprint_status>archive</eprint_status>
    <userid>3</userid>
    <dir>disk0/00/00/01/93</dir>
    <datestamp>2016-04-11 09:57:37</datestamp>
    <lastmod>2025-06-17 10:40:11</lastmod>
    <status_changed>2016-04-11 09:57:37</status_changed>
    <type>data_collection</type>
    <metadata_visibility>show</metadata_visibility>
    <creators>
      <item>
        <name>
          <family>Phelan</family>
          <given>Jody</given>
        </name>
        <orcid>0000-0001-8323-7019</orcid>
        <lshtm_flag>TRUE</lshtm_flag>
        <staffid>5192f0191f2538d0166106c24634f7ca</staffid>
      </item>
      <item>
        <name>
          <family>Coll</family>
          <given>Francesc</given>
        </name>
        <orcid>0000-0002-7882-2325</orcid>
        <lshtm_flag>TRUE</lshtm_flag>
        <staffid>6c2b7e9afcb260630b636d81fd3bfaf0</staffid>
      </item>
      <item>
        <name>
          <family>Mcnerney</family>
          <given>Ruth</given>
        </name>
        <lshtm_flag>TRUE</lshtm_flag>
        <staffid>742e523ff9b133b222c41fb882843cdb</staffid>
      </item>
      <item>
        <name>
          <family>Ascher</family>
          <given>David B.</given>
        </name>
        <lshtm_flag>FALSE</lshtm_flag>
      </item>
      <item>
        <name>
          <family>Pires</family>
          <given>Douglas E. V.</given>
        </name>
        <lshtm_flag>FALSE</lshtm_flag>
      </item>
      <item>
        <name>
          <family>Furnham</family>
          <given>Nick</given>
        </name>
        <orcid>0000-0002-7532-1269</orcid>
        <lshtm_flag>TRUE</lshtm_flag>
        <staffid>0fe896f7be3f2c7db6f8b28e68870c57</staffid>
      </item>
      <item>
        <name>
          <family>Coeck</family>
          <given>Nele</given>
        </name>
        <lshtm_flag>FALSE</lshtm_flag>
      </item>
      <item>
        <name>
          <family>Hill-Cawthorne</family>
          <given>Grant A.</given>
        </name>
        <lshtm_flag>FALSE</lshtm_flag>
      </item>
      <item>
        <name>
          <family>Nair</family>
          <given>Mridul B.</given>
        </name>
        <lshtm_flag>FALSE</lshtm_flag>
      </item>
      <item>
        <name>
          <family>Mallard</family>
          <given>Kim</given>
        </name>
        <lshtm_flag>FALSE</lshtm_flag>
      </item>
      <item>
        <name>
          <family>Ramsay</family>
          <given>Andrew</given>
        </name>
        <lshtm_flag>FALSE</lshtm_flag>
      </item>
      <item>
        <name>
          <family>Campino</family>
          <given>Susana</given>
        </name>
        <orcid>0000-0003-1403-6138</orcid>
        <lshtm_flag>TRUE</lshtm_flag>
        <staffid>b440f47b7ee6c1f6c5e11fc34edf059e</staffid>
      </item>
      <item>
        <name>
          <family>Hibberd</family>
          <given>Martin</given>
        </name>
        <orcid>0000-0001-8587-1849</orcid>
        <lshtm_flag>TRUE</lshtm_flag>
        <staffid>1f995f1c7e03c1b91784efdf5c246e39</staffid>
      </item>
      <item>
        <name>
          <family>Pain</family>
          <given>Arnab</given>
        </name>
        <lshtm_flag>FALSE</lshtm_flag>
      </item>
      <item>
        <name>
          <family>Rigouts</family>
          <given>Leen</given>
        </name>
        <lshtm_flag>FALSE</lshtm_flag>
      </item>
      <item>
        <name>
          <family>Clark</family>
          <given>Taane</given>
        </name>
        <orcid>0000-0001-8985-9265</orcid>
        <lshtm_flag>TRUE</lshtm_flag>
        <staffid>d6c0a9ae313d576cb0129f8b148489e7</staffid>
      </item>
    </creators>
    <corp_creators>
      <item>Study consortium</item>
    </corp_creators>
    <title>Whole genome sequences for M.tuberculosis isolates from the TDR strain bank</title>
    <divisions>
      <item>EPID</item>
      <item>ITPM</item>
    </divisions>
    <keywords>
      <item>Tuberculosis</item>
      <item>Drug resistance</item>
      <item>Genomics</item>
      <item>Protein structural modelling</item>
      <item>Association study</item>
      <item>Convergent evolution</item>
    </keywords>
    <abstract>Combating the spread of drug resistant tuberculosis is a global health priority. Whole genome association studies are being applied to identify genetic determinants of resistance to anti-tuberculosis drugs. Protein structure and interaction modelling are used to understand the functional effects of putative mutations and provide insight into the molecular mechanisms leading to resistance. To investigate the potential utility of these approaches, we analysed the genomes of 144 Mycobacterium tuberculosis clinical isolates from The Special Programme for Research and Training in Tropical Diseases (TDR) collection sourced from 20 countries in four continents. A genome-wide approach was applied to 127 isolates to identify polymorphisms associated with minimum inhibitory concentrations for first-line anti-tuberculosis drugs. In addition, the effect of identified candidate mutations on protein stability and interactions was assessed quantitatively with well-established computational methods. The analysis revealed that mutations in the genes rpoB (rifampicin), katG (isoniazid), inhA-promoter (isoniazid), rpsL (streptomycin) and embB (ethambutol) were responsible for the majority of resistance observed. A subset of the mutations identified in rpoB and katG were predicted to affect protein stability. Further, a strong direct correlation was observed between the minimum inhibitory concentration values and the distance of the mutated residues in the three-dimensional structures of rpoB and katG to their respective drugs binding sites.</abstract>
    <date>2015-11-04</date>
    <date_type>published</date_type>
    <publisher>European Nucleotide Archive</publisher>
    <data_type>Dataset</data_type>
    <copyright_holders>
      <item>Study consortium</item>
    </copyright_holders>
    <collection_mode>
      <item>Experiment</item>
    </collection_mode>
    <full_text_status>public</full_text_status>
    <funders>
      <item>Biotechnology and Biological Sciences Research Council</item>
      <item>National Health and Medical Research Council</item>
      <item>René Rachou Research Center</item>
      <item>Medical Research Council</item>
      <item>Fundação de Amparo à Pesquisa do Estado de Minas Gerais</item>
    </funders>
    <resourcetype>
      <resourcetypegeneral>Dataset</resourcetypegeneral>
      <resourcetype>Quantitative</resourcetype>
    </resourcetype>
    <collection_method>All DNA samples underwent Illumina sequencing on the HiSeq 2000 platform at the KAUST genomic facility, generating paired-end reads of 150 bp (Additional file 1: Table S1, pathogenseq.lshtm.ac.uk/tdr, Additional file 1: Table S2). All raw sequence data can be downloaded from the ENA short read archive (accession number PRJEB11653). For the raw sequence data, trimmomatic (v0.33) software [42] (parameters: LEADING:3 TRAILING:3 SLIDINGWINDOW:4:20 MINLEN:36) was used to remove or truncate reads of low quality. High quality reads were then mapped to the H37Rv reference genome (Genbank accession: AL123456.3) using the BWA-mem (v0.7.12) algorithm [43] (parameters: -c 100 -M -T 50). From the resulting alignments, SAMtools (v1.3) [44] and GATK (v3.5) [45] software (default parameter settings) were used to call SNPs and small indels, and the interaction of variants between the methods retained. Mappability values were calculated along the reference genome using GEM-Mappability software with a k-mer length of 50 bp and a 0.04 % substitution threshold [46]. Non-unique SNP sites (mappability values greater than one) were removed. Sample genotypes were called using the majority allele (minimum frequency 75 %) in positions supported by at least 20-fold total genome coverage, otherwise they were classified as missing. Isolates or SNPs with in excess of 10 % missing genotype calls were excluded. The final dataset included 144 isolates and 17,952 genome-wide SNPs.</collection_method>
    <language>
      <item>en</item>
    </language>
    <related_resources>
      <item>
        <title>European Nucleotide Archive</title>
        <url>http://www.ebi.ac.uk/ena/data/view/PRJEB11653</url>
        <type>dataresource</type>
      </item>
      <item>
        <title>TDR TB Strain Bank</title>
        <url>http://pathogenseq.lshtm.ac.uk/tdr/</url>
        <type>project</type>
      </item>
    </related_resources>
    <repo_link>
      <item>
        <title>Mycobacterium tuberculosis whole genome sequencing and protein structure modelling provides insights into anti-tuberculosis drug resistance.</title>
        <link>http://researchonline.lshtm.ac.uk/id/eprint/2535998</link>
      </item>
    </repo_link>
    <funders_info>
      <item>
        <funder_name>Biotechnology and Biological Sciences Research Council</funder_name>
        <funder_id>http://dx.doi.org/10.13039/501100000268</funder_id>
      </item>
      <item>
        <funder_name>National Health and Medical Research Council</funder_name>
        <funder_id>http://dx.doi.org/10.13039/501100000925</funder_id>
      </item>
      <item>
        <funder_name>René Rachou Research Center</funder_name>
      </item>
      <item>
        <funder_name>Medical Research Council</funder_name>
        <funder_id>http://dx.doi.org/10.13039/501100000265</funder_id>
      </item>
      <item>
        <funder_name>Fundação de Amparo à Pesquisa do Estado de Minas Gerais</funder_name>
        <funder_id>https://doi.org/10.13039/501100004901</funder_id>
      </item>
    </funders_info>
    <ukri_date_sub>2015-11-04</ukri_date_sub>
  </eprint>
</eprints>
