<codeBook xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:xsd="http://www.w3.org/2001/XMLSchema" xsi:schemaLocation="ddi:codebook:2_5 http://www.ddialliance.org/Specification/DDI-Codebook/2.5/XMLSchema/codebook.xsd" xmlns="ddi:codebook:2_5">
  <docDscr>
    <citation>
      <titlStmt>
        <titl xml:lang="sv">PGV-PII</titl>
        <parTitl xml:lang="en">PGV-PII</parTitl>
        <IDNo agency="SND">doi-10-23695-qcqg-3613-0</IDNo>
        <IDNo agency="DOI">https://doi.org/10.23695/QCQG-3613</IDNo>
      </titlStmt>
      <prodStmt>
        <producer xml:lang="en" abbr="SND">Swedish National Data Service</producer>
        <producer xml:lang="sv" abbr="SND">Svensk nationell datatjänst</producer>
      </prodStmt>
      <holdings URI="https://doi.org/10.23695/QCQG-3613">Landing page</holdings>
    </citation>
  </docDscr>
  <stdyDscr>
    <citation>
      <titlStmt>
        <titl xml:lang="sv">PGV-PII</titl>
        <parTitl xml:lang="en">PGV-PII</parTitl>
        <IDNo agency="SND">doi-10-23695-qcqg-3613-0</IDNo>
        <IDNo agency="DOI">https://doi.org/10.23695/QCQG-3613</IDNo>
      </titlStmt>
      <rspStmt />
      <prodStmt />
      <distStmt>
        <distrbtr xml:lang="en" abbr="SND" URI="https://snd.se">Swedish National Data Service</distrbtr>
        <distrbtr xml:lang="sv" abbr="SND" URI="https://snd.se">Svensk nationell datatjänst</distrbtr>
        <distDate xml:lang="en" date="2025-10-07" />
      </distStmt>
      <verStmt>
        <version elementVersion="0" elementVersionDate="2025-10-07" />
      </verStmt>
      <holdings URI="https://doi.org/10.23695/QCQG-3613">Landing page</holdings>
    </citation>
    <stdyInfo>
      <subject />
      <abstract xml:lang="en" contentType="abstract">This is a small corpus of 10 pairs of texts in Swedish and English annotated with personal information categories. The annotation largely follows that of the TAB corpus (https://aclanthology.org/2022.cl-4.19/). The twenty texts in total were sourced from the Parallel Global Voices corpus (https://nlp.ilsp.gr/pgv/, CC BY 4.0) and manually annotated. That corpus, in turn, had collected the texts from the Global Voices websites (https://globalvoices.org/, CC BY 3.0).</abstract>
      <abstract xml:lang="sv" contentType="abstract">Det här är en liten korpus som består av 10 par texter på svenska och engelska, annoterade med kategorier av personliga uppgifter. Annoteringen följer till stor del den i TAB-korpusen (https://aclanthology.org/2022.cl-4.19/). De tjugo texterna har sitt ursprung i Parallel Global Voices-korpusen (https://nlp.ilsp.gr/pgv/, CC BY 4.0) och annoterades för hand. Den korpusen har i sin tur hämtat texterna från Global Voices-webbsidorna (https://globalvoices.org/, CC BY 3.0).</abstract>
      <sumDscr />
    </stdyInfo>
    <method>
      <dataColl />
    </method>
    <dataAccs>
      <useStmt>
        <restrctn xml:lang="en">Access to data through an external actor. </restrctn>
        <restrctn xml:lang="sv">Åtkomst till data via extern aktör. </restrctn>
      </useStmt>
    </dataAccs>
    <othrStdyMat />
  </stdyDscr>
</codeBook>