<codeBook xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:xsd="http://www.w3.org/2001/XMLSchema" xsi:schemaLocation="ddi:codebook:2_5 http://www.ddialliance.org/Specification/DDI-Codebook/2.5/XMLSchema/codebook.xsd" xmlns="ddi:codebook:2_5">
  <!-- Document description: citation block carried by the docDscr section of this codebook. -->
  <docDscr>
    <citation>
      <titlStmt>
        <!-- NOTE(review): the Swedish title is empty; only the English parallel
             title below carries text. Confirm with the data provider whether a
             Swedish title exists. -->
        <titl xml:lang="sv"/>
        <parTitl xml:lang="en">NrdJm phylogeny</parTitl>
        <!-- Two identifiers: one under agency "SND", one under agency "DOI" (resolver URL). -->
        <IDNo agency="SND">doi-10-17045-sthlmuni-7117430-0</IDNo>
        <IDNo agency="DOI">https://doi.org/10.17045/STHLMUNI.7117430</IDNo>
      </titlStmt>
      <!-- Producer name given once per language (en, sv), same abbreviation. -->
      <prodStmt>
        <producer abbr="SND" xml:lang="en">Swedish National Data Service</producer>
        <producer abbr="SND" xml:lang="sv">Svensk nationell datatjänst</producer>
      </prodStmt>
      <!-- The holdings URI is the same DOI URL as the IDNo with agency "DOI". -->
      <holdings URI="https://doi.org/10.17045/STHLMUNI.7117430">Landing page</holdings>
    </citation>
  </docDscr>
  <stdyDscr>
    <!-- Study-level citation: titles, identifiers, distributor, version and holdings. -->
    <citation>
      <titlStmt>
        <!-- NOTE(review): the Swedish title is empty; only the English parallel
             title is populated. Confirm whether a Swedish title should be supplied. -->
        <titl xml:lang="sv"/>
        <parTitl xml:lang="en">NrdJm phylogeny</parTitl>
        <IDNo agency="SND">doi-10-17045-sthlmuni-7117430-0</IDNo>
        <IDNo agency="DOI">https://doi.org/10.17045/STHLMUNI.7117430</IDNo>
      </titlStmt>
      <!-- Responsibility and production statements are present but carry no content. -->
      <rspStmt/>
      <prodStmt/>
      <distStmt>
        <!-- Distributor name given once per language (en, sv); same abbreviation and URI. -->
        <distrbtr abbr="SND"
                  URI="https://snd.se"
                  xml:lang="en">Swedish National Data Service</distrbtr>
        <distrbtr abbr="SND"
                  URI="https://snd.se"
                  xml:lang="sv">Svensk nationell datatjänst</distrbtr>
        <!-- The date is carried only in the attribute; the element has no text content. -->
        <distDate date="2018-09-21" xml:lang="en"/>
      </distStmt>
      <verStmt>
        <!-- elementVersionDate equals the distDate value above. -->
        <version elementVersion="0" elementVersionDate="2018-09-21"/>
      </verStmt>
      <holdings URI="https://doi.org/10.17045/STHLMUNI.7117430">Landing page</holdings>
    </citation>
    <!-- Study information: an English abstract plus two empty placeholder
         elements (subject, sumDscr). -->
    <stdyInfo>
      <!-- Empty: no keywords or topic classifications are recorded here. -->
      <subject />
      <!-- The abstract is text content, so its line breaks and blank lines are
           delivered to consumers as data. Do not re-indent or re-wrap it. -->
      <abstract xml:lang="en" contentType="abstract">All NrdJm sequences from NCBI’s RefSeq database were downloaded from RNRdb (http://rnrdb.pfitmap.org) and clustered with USEARCH (Edgar 2010) at 90% sequence identity to reduce redundancy. Non full-length sequences and sequences of dubious quality were manually removed, before aligning all 363 sequences with ProbCons (Do et al. 2005). Trustworthy alignment positions were selected with the BMGE algorithm (Criscuolo and Gribaldo 2010) using the BLOSUM30 substitution matrix, ending up with 363 well-aligned positions forming 350 distinct alignment patterns. RAxML version 8.2.4 (Stamatakis 2014) was used to estimate a phylogeny, using the PROTGAMMAAUTO model, rapid bootstrapping with the autoMRE bootstopping followed by a full maximum likelihood tree search.


The file is viewable with Dendroscope (Huson et al. 2007).
v2: Addition of Lactobacillus leichmannii sequence.</abstract>
      <!-- Empty: no summary description (coverage, dates, universe, ...) is recorded. -->
      <sumDscr />
    </stdyInfo>
    <!-- Methodology: the data-collection container is present but empty. -->
    <method>
      <dataColl/>
    </method>
    <!-- Data access: one use restriction, stated in English and in Swedish.
         The trailing space inside each restrctn is part of the original text
         and is kept as-is. -->
    <dataAccs>
      <useStmt>
        <restrctn xml:lang="en">Access to data through an external actor. </restrctn>
        <restrctn xml:lang="sv">Åtkomst till data via extern aktör. </restrctn>
      </useStmt>
    </dataAccs>
    <!-- Other study-related materials: present but empty. -->
    <othrStdyMat/>
  </stdyDscr>
</codeBook>