<?xml version="1.0" encoding="UTF-8"?>
<!-- DDI Codebook 2.5 metadata record. The default namespace applies to all
     unprefixed elements below; xsi:schemaLocation is a validation hint only. -->
<codeBook xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
          xmlns:xsd="http://www.w3.org/2001/XMLSchema"
          xsi:schemaLocation="ddi:codebook:2_5 http://www.ddialliance.org/Specification/DDI-Codebook/2.5/XMLSchema/codebook.xsd"
          xmlns="ddi:codebook:2_5">
  <!-- Document description: citation for this metadata document
       (title, SND and DOI identifiers, producing organisation, landing page). -->
  <docDscr>
    <citation>
      <titlStmt>
        <!-- NOTE(review): titl is tagged xml:lang="sv" but carries the same English
             text as the parallel title below; confirm that no Swedish title exists. -->
        <titl xml:lang="sv">Web-scraped EMA guidelines and European Public Assessment Reports</titl>
        <parTitl xml:lang="en">Web-scraped EMA guidelines and European Public Assessment Reports</parTitl>
        <!-- Two identifiers for the same record: the SND catalogue number and the DOI (given as a full URL). -->
        <IDNo agency="SND">2023-254-1</IDNo>
        <IDNo agency="DOI">https://doi.org/10.57804/wa37-j878</IDNo>
      </titlStmt>
      <prodStmt>
        <!-- Producer name in English and Swedish; both share the abbreviation SND. -->
        <producer xml:lang="en" abbr="SND">Swedish National Data Service</producer>
        <producer xml:lang="sv" abbr="SND">Svensk nationell datatjänst</producer>
      </prodStmt>
      <!-- The holdings URI is the same DOI URL as the IDNo above. -->
      <holdings URI="https://doi.org/10.57804/wa37-j878">Landing page</holdings>
    </citation>
  </docDscr>
  <stdyDscr>
    <!-- Study-level citation: title and identifiers, author, distributor,
         distribution date, version and landing page. -->
    <citation>
      <titlStmt>
        <!-- NOTE(review): as in docDscr, the xml:lang="sv" title holds English text; confirm intended. -->
        <titl xml:lang="sv">Web-scraped EMA guidelines and European Public Assessment Reports</titl>
        <parTitl xml:lang="en">Web-scraped EMA guidelines and European Public Assessment Reports</parTitl>
        <IDNo agency="SND">2023-254-1</IDNo>
        <IDNo agency="DOI">https://doi.org/10.57804/wa37-j878</IDNo>
      </titlStmt>
      <rspStmt>
        <!-- Same author listed once per language; only the affiliation text differs. -->
        <AuthEnty xml:lang="en" affiliation="Department of Medical Sciences, Uppsala University">Westman, Gabriel</AuthEnty>
        <AuthEnty xml:lang="sv" affiliation="Institutionen för medicinska vetenskaper, Uppsala universitet">Westman, Gabriel</AuthEnty>
      </rspStmt>
      <!-- Empty production statement: no producer is recorded at study level. -->
      <prodStmt />
      <distStmt>
        <distrbtr xml:lang="en" abbr="SND" URI="https://snd.se">Swedish National Data Service</distrbtr>
        <distrbtr xml:lang="sv" abbr="SND" URI="https://snd.se">Svensk nationell datatjänst</distrbtr>
        <!-- The distribution date is carried only in the date attribute; the element has no text. -->
        <distDate xml:lang="en" date="2023-11-27" />
      </distStmt>
      <verStmt>
        <!-- Version number and date are carried in attributes; the element has no text content. -->
        <version elementVersion="1" elementVersionDate="2023-11-27" />
      </verStmt>
      <holdings URI="https://doi.org/10.57804/wa37-j878">Landing page</holdings>
    </citation>
    <!-- Study scope: subject keywords, English and Swedish abstracts, and a summary
         description (analysis unit, universe, kind of data). -->
    <stdyInfo>
      <subject>
        <!-- Each keyword appears once per language; both language variants of a term share one vocabURI. -->
        <keyword xml:lang="en" vocab="ELSST" vocabURI="https://elsst.cessda.eu/id/6/482e42ce-7ce5-4a31-b7dd-632d6fdc7df8">DRUG THERAPY</keyword>
        <keyword xml:lang="sv" vocab="ELSST" vocabURI="https://elsst.cessda.eu/id/6/482e42ce-7ce5-4a31-b7dd-632d6fdc7df8">LÄKEMEDELSTERAPI</keyword>
        <keyword xml:lang="en" vocab="YSO" vocabURI="http://www.yso.fi/onto/yso/p6069">computational linguistics</keyword>
        <keyword xml:lang="sv" vocab="YSO" vocabURI="http://www.yso.fi/onto/yso/p6069">datalingvistik</keyword>
      </subject>
      <!-- The abstracts are multi-line text; their internal line breaks are part of the content, so do not re-indent them. -->
      <abstract xml:lang="en" contentType="abstract">This submission consists of the data and python code that supports the original research article "A full-document analysis of the semantic relation between European Public Assessment Reports and EMA guidelines using a BERT language model" (Bergman et al, PLOS ONE 2023).

The database contains metadata and fulltext from 669 EMA Scientific guidelines and 1024 EMA European Public Assessment Reports.</abstract>
      <abstract xml:lang="sv" contentType="abstract">Detta datapaket innehåller data och python-kod som ligger till grund för publikationen "A full-document analysis of the semantic relation between European Public Assessment Reports and EMA guidelines using a BERT language model" (Bergman et al, PLOS ONE 2023).

Databasen innehåller metadata och fulltext från 669 st EMA Scientific guidelines och 1024 EMA European Public Assessment Reports.</abstract>
      <sumDscr>
        <!-- The analysis unit label is repeated three times per language: the unit attribute,
             the element text, and a nested concept pointing at the CESSDA vocabulary version. -->
        <anlyUnit xml:lang="en" unit="Media unit: Text">Media unit: Text<concept vocab="DDI Analysis Unit" vocabURI="https://vocabularies.cessda.eu/v2/vocabularies/AnalysisUnit/2.1.3?languageVersion=en-2.1.3">Media unit: Text</concept></anlyUnit>
        <anlyUnit xml:lang="sv" unit="Mediaenhet: Text">Mediaenhet: Text<concept vocab="DDI Analysis Unit" vocabURI="https://vocabularies.cessda.eu/v2/vocabularies/AnalysisUnit/2.1.3?languageVersion=sv-2.1.3">Mediaenhet: Text</concept></anlyUnit>
        <universe xml:lang="en">Open regulatory data on medicinal products</universe>
        <universe xml:lang="sv">Öppna regulatoriska data rörande läkemedelsprodukter</universe>
        <!-- NOTE(review): dataKind is given in English only, unlike the en/sv pairs above; confirm whether Swedish entries are expected. -->
        <dataKind xml:lang="en">Text</dataKind>
        <dataKind xml:lang="en">Software</dataKind>
      </sumDscr>
    </stdyInfo>
    <!-- Data collection method: two sampling procedure entries, each in English and Swedish.
         The first pair is a free-text description, the second a sampling procedure term. -->
    <method>
      <dataColl>
        <!-- NOTE(review): in this first en/sv pair the nested concept is attributed to the
             DDI Sampling Procedure vocabulary but wraps the free-text sentence rather than
             a vocabulary term; presumably an exporter convention, confirm before relying on it. -->
        <sampProc xml:lang="en">All EMA guidelines and European Public Assessment Reports (EPARs) from the time period specified.<concept vocab="DDI Sampling Procedure" vocabURI="https://vocabularies.cessda.eu/v2/vocabularies/SamplingProcedure/2.0.1?languageVersion=en-2.0.1">All EMA guidelines and European Public Assessment Reports (EPARs) from the time period specified.</concept></sampProc>
        <sampProc xml:lang="sv">Alla EMA guidelines och European Public Assessment Reports (EPARs) från den beskrivna tidsperioden.<concept vocab="DDI Sampling Procedure" vocabURI="https://vocabularies.cessda.eu/v2/vocabularies/SamplingProcedure/2.0.1?languageVersion=sv-2.0.1">Alla EMA guidelines och European Public Assessment Reports (EPARs) från den beskrivna tidsperioden.</concept></sampProc>
        <!-- Sampling procedure term; the element text and the nested concept text are identical. -->
        <sampProc xml:lang="en">Total universe/Complete enumeration<concept vocab="DDI Sampling Procedure" vocabURI="https://vocabularies.cessda.eu/v2/vocabularies/SamplingProcedure/2.0.1?languageVersion=en-2.0.1">Total universe/Complete enumeration</concept></sampProc>
        <sampProc xml:lang="sv">Hela populationen/total räkning<concept vocab="DDI Sampling Procedure" vocabURI="https://vocabularies.cessda.eu/v2/vocabularies/SamplingProcedure/2.0.1?languageVersion=sv-2.0.1">Hela populationen/total räkning</concept></sampProc>
      </dataColl>
    </method>
    <!-- Data access: human-readable access statements in English and Swedish,
         followed by a single coded access level. -->
    <dataAccs>
      <useStmt>
        <restrctn xml:lang="en">Access to data through SND. Data are freely accessible.</restrctn>
        <restrctn xml:lang="sv">Åtkomst till data via SND. Data är fritt tillgängliga.</restrctn>
        <!-- NOTE(review): the name of the access-terms vocabulary is stored in the elementVersion
             attribute rather than a version value; presumably an exporter convention, confirm
             before parsing elementVersion as a version here. -->
        <conditions elementVersion="info:eu-repo-Access-Terms vocabulary">openAccess</conditions>
      </useStmt>
    </dataAccs>
    <!-- Empty element: no other study-related materials are listed in this record. -->
    <othrStdyMat />
  </stdyDscr>
</codeBook>