<codeBook xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:xsd="http://www.w3.org/2001/XMLSchema" xsi:schemaLocation="ddi:codebook:2_5 http://www.ddialliance.org/Specification/DDI-Codebook/2.5/XMLSchema/codebook.xsd" xmlns="ddi:codebook:2_5">
  <docDscr>
    <citation>
      <titlStmt>
        <titl xml:lang="sv">SUPPLEMENTARY MATERIAL: Machine learning-based analysis of glioma grades reveals co-enrichment</titl>
        <parTitl xml:lang="en">SUPPLEMENTARY MATERIAL: Machine learning-based analysis of glioma grades reveals co-enrichment</parTitl>
        <IDNo agency="SND">2024-339-1</IDNo>
        <IDNo agency="DOI">https://doi.org/10.57804/6fa3-6v37</IDNo>
      </titlStmt>
      <prodStmt>
        <producer xml:lang="en" abbr="SND">Swedish National Data Service</producer>
        <producer xml:lang="sv" abbr="SND">Svensk nationell datatjänst</producer>
      </prodStmt>
      <holdings URI="https://doi.org/10.57804/6fa3-6v37">Landing page</holdings>
    </citation>
  </docDscr>
  <stdyDscr>
    <citation>
      <titlStmt>
        <titl xml:lang="sv">SUPPLEMENTARY MATERIAL: Machine learning-based analysis of glioma grades reveals co-enrichment</titl>
        <parTitl xml:lang="en">SUPPLEMENTARY MATERIAL: Machine learning-based analysis of glioma grades reveals co-enrichment</parTitl>
        <IDNo agency="SND">2024-339-1</IDNo>
        <IDNo agency="DOI">https://doi.org/10.57804/6fa3-6v37</IDNo>
        <IDNo agency="URN">urn:nbn:se:uu:diva-455177</IDNo>
      </titlStmt>
      <rspStmt>
        <AuthEnty xml:lang="en" affiliation="Uppsala University">Garbulowski, Mateusz</AuthEnty>
        <AuthEnty xml:lang="sv" affiliation="Uppsala universitet">Garbulowski, Mateusz</AuthEnty>
      </rspStmt>
      <prodStmt />
      <distStmt>
        <distrbtr xml:lang="en" abbr="SND" URI="https://snd.se">Swedish National Data Service</distrbtr>
        <distrbtr xml:lang="sv" abbr="SND" URI="https://snd.se">Svensk nationell datatjänst</distrbtr>
        <distDate xml:lang="en" date="2021-10-05" />
      </distStmt>
      <verStmt>
        <version elementVersion="1" elementVersionDate="2021-10-05" />
      </verStmt>
      <holdings URI="https://doi.org/10.57804/6fa3-6v37">Landing page</holdings>
    </citation>
    <stdyInfo>
      <subject>
        <keyword xml:lang="en" vocab="YSO" vocabURI="http://www.yso.fi/onto/yso/p9788">gliomas</keyword>
        <keyword xml:lang="sv" vocab="YSO" vocabURI="http://www.yso.fi/onto/yso/p9788">gliom</keyword>
        <keyword xml:lang="en" vocab="YSO" vocabURI="http://www.yso.fi/onto/yso/p21846">machine learning</keyword>
        <keyword xml:lang="sv" vocab="YSO" vocabURI="http://www.yso.fi/onto/yso/p21846">maskininlärning</keyword>
      </subject>
      <abstract xml:lang="en" contentType="abstract">Examining glioma grading processes is valuable for improving therapeutic challenges. One of the most extensive repositories storing transcriptomics data for gliomas is The Cancer Genome Atlas (TCGA). However, such big cohorts should be processed with caution and evaluated thoroughly as they can contain batch and other effects. Furthermore, biological mechanisms of cancer contain interactions among biomarkers. Thus, we applied an interpretable machine learning approach to discover such relationships. This type of transparent learning provides not only good predictability, but also reveals co-predictive mechanisms among features. In this study, we corrected the strong and confounded batch effect in the TCGA glioma data. We further used the corrected datasets to perform comprehensive machine learning analysis applied on single-sample gene set enrichment scores using collections from the Molecular Signature Database. Furthermore, using rule-based classifiers, we displayed networks of co-enrichment related to glioma grades. Moreover, we validated our results using the external glioma cohorts.

The dataset was originally published in DiVA and moved to SND in 2024.</abstract>
      <abstract xml:lang="sv" contentType="abstract">Se engelsk version av beskrivningen för information. 
Datasetet har ursprungligen publicerats i DiVA och flyttades över till SND 2024.</abstract>
      <sumDscr>
        <dataKind xml:lang="en">Numeric</dataKind>
        <dataKind xml:lang="en">Text</dataKind>
        <dataKind xml:lang="en">Still image</dataKind>
      </sumDscr>
    </stdyInfo>
    <method>
      <dataColl />
    </method>
    <dataAccs>
      <useStmt>
        <restrctn xml:lang="en">Access to data through SND. Data are freely accessible.</restrctn>
        <restrctn xml:lang="sv">Åtkomst till data via SND. Data är fritt tillgängliga.</restrctn>
        <conditions elementVersion="info:eu-repo-Access-Terms vocabulary">openAccess</conditions>
      </useStmt>
    </dataAccs>
    <othrStdyMat>
      <relPubl />
    </othrStdyMat>
  </stdyDscr>
</codeBook>