<codeBook xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:xsd="http://www.w3.org/2001/XMLSchema" xsi:schemaLocation="ddi:codebook:2_5 http://www.ddialliance.org/Specification/DDI-Codebook/2.5/XMLSchema/codebook.xsd" xmlns="ddi:codebook:2_5">
  <docDscr>
    <citation>
      <titlStmt>
        <titl xml:lang="sv">Dataset med annoteringar av tekniskt språk från fyra års tillståndsövervakning av pappersmaskinsindustri i norra Sverige</titl>
        <parTitl xml:lang="en">Dataset with four years of condition monitoring technical language annotations from paper machine industries in northern Sweden</parTitl>
        <IDNo agency="SND">2023-257-1</IDNo>
        <IDNo agency="ltu.se">2019-02533</IDNo>
        <IDNo agency="DOI">https://doi.org/10.5878/hafd-ms27</IDNo>
      </titlStmt>
      <prodStmt>
        <producer xml:lang="en" abbr="SND">Swedish National Data Service</producer>
        <producer xml:lang="sv" abbr="SND">Svensk nationell datatjänst</producer>
      </prodStmt>
      <holdings URI="https://doi.org/10.5878/hafd-ms27">Landing page</holdings>
    </citation>
  </docDscr>
  <stdyDscr>
    <citation>
      <titlStmt>
        <titl xml:lang="sv">Dataset med annoteringar av tekniskt språk från fyra års tillståndsövervakning av pappersmaskinsindustri i norra Sverige</titl>
        <parTitl xml:lang="en">Dataset with four years of condition monitoring technical language annotations from paper machine industries in northern Sweden</parTitl>
        <IDNo agency="SND">2023-257-1</IDNo>
        <IDNo agency="ltu.se">2019-02533</IDNo>
        <IDNo agency="DOI">https://doi.org/10.5878/hafd-ms27</IDNo>
        <IDNo agency="SwePub">oai:DiVA.org:ltu-95407</IDNo>
        <IDNo agency="DOI">10.36001/phme.2022.v7i1.3356</IDNo>
        <IDNo agency="URN">urn:nbn:se:ltu:diva-95407</IDNo>
      </titlStmt>
      <rspStmt>
        <AuthEnty xml:lang="en" affiliation="Department of Computer Science, Electrical and Space Engineering, Luleå University of Technology">Löwenmark, Karl</AuthEnty>
        <AuthEnty xml:lang="sv" affiliation="Institutionen för system- och rymdteknik, Luleå tekniska universitet">Löwenmark, Karl</AuthEnty>
        <AuthEnty xml:lang="en" affiliation="Department of Computer Science, Electrical and Space Engineering, Luleå University of Technology">Sandin, Fredrik</AuthEnty>
        <AuthEnty xml:lang="sv" affiliation="Institutionen för system- och rymdteknik, Luleå tekniska universitet">Sandin, Fredrik</AuthEnty>
        <AuthEnty xml:lang="en" affiliation="Department of Computer Science, Electrical and Space Engineering, Luleå University of Technology">Liwicki, Marcus</AuthEnty>
        <AuthEnty xml:lang="sv" affiliation="Institutionen för system- och rymdteknik, Luleå tekniska universitet">Liwicki, Marcus</AuthEnty>
        <AuthEnty xml:lang="en" affiliation="SKF (Sweden)">Schnabel, Stephan</AuthEnty>
        <AuthEnty xml:lang="sv" affiliation="Svenska Kullagerfabriken">Schnabel, Stephan</AuthEnty>
      </rspStmt>
      <prodStmt>
        <grantNo xml:lang="en" agency="VINNOVA">2019-02533</grantNo>
        <grantNo xml:lang="sv" agency="Verket för innovationssystem">2019-02533</grantNo>
      </prodStmt>
      <distStmt>
        <distrbtr xml:lang="en" abbr="SND" URI="https://snd.se">Swedish National Data Service</distrbtr>
        <distrbtr xml:lang="sv" abbr="SND" URI="https://snd.se">Svensk nationell datatjänst</distrbtr>
        <distDate xml:lang="en" date="2023-12-21" />
      </distStmt>
      <verStmt>
        <version elementVersion="1" elementVersionDate="2023-12-21" />
      </verStmt>
      <holdings URI="https://doi.org/10.5878/hafd-ms27">Landing page</holdings>
    </citation>
    <stdyInfo>
      <subject>
        <keyword xml:lang="en" vocab="YSO" vocabURI="http://www.yso.fi/onto/yso/p10598">paper machines</keyword>
        <keyword xml:lang="sv" vocab="YSO" vocabURI="http://www.yso.fi/onto/yso/p10598">pappersmaskiner</keyword>
        <keyword xml:lang="en" vocab="YSO" vocabURI="http://www.yso.fi/onto/yso/p15423">condition monitoring</keyword>
        <keyword xml:lang="sv" vocab="YSO" vocabURI="http://www.yso.fi/onto/yso/p15423">övervakning av skick</keyword>
        <keyword xml:lang="en" vocab="YSO" vocabURI="http://www.yso.fi/onto/yso/p6071">language technology</keyword>
        <keyword xml:lang="sv" vocab="YSO" vocabURI="http://www.yso.fi/onto/yso/p6071">språkteknologi</keyword>
        <keyword xml:lang="en" vocab="YSO" vocabURI="http://www.yso.fi/onto/yso/p12266">signal processing</keyword>
        <keyword xml:lang="sv" vocab="YSO" vocabURI="http://www.yso.fi/onto/yso/p12266">signalbehandling</keyword>
        <keyword xml:lang="en" vocab="YSO" vocabURI="http://www.yso.fi/onto/yso/p10706">paper industry</keyword>
        <keyword xml:lang="sv" vocab="YSO" vocabURI="http://www.yso.fi/onto/yso/p10706">pappersindustri</keyword>
      </subject>
      <abstract xml:lang="en" contentType="abstract">This dataset consists of four years of technical language annotations from two paper machines in northern Sweden, structured as a Pandas dataframe. The same data is also available as a semicolon-separated .csv file. The data consists of two columns, where the first column corresponds to annotation note contents, and the second column corresponds to annotation titles. The annotations are in Swedish, and processed so that all mentions of personal information are replaced with the string ‘egennamn’, meaning “personal name” in Swedish. Each row corresponds to one annotation with the corresponding title.

Data can be accessed in Python with:
import pandas as pd
annotations_df = pd.read_pickle("Technical_Language_Annotations.pkl")
annotation_contents = annotations_df['noteComment']
annotation_titles = annotations_df['title']</abstract>
      <abstract xml:lang="sv" contentType="abstract">Detta dataset består av tekniskt-språk-annoteringar från fyra års insamling från två pappersmaskiner i norra Sverige, strukturerat som en Pandas dataframe. Samma data finns också tillgänglig som en semikolonseparerad .csv-fil. Datan består av två kolumner, där den första kolumnen motsvarar annoteringens textinnehåll, och den andra titeln. Annoteringarna är skrivna på svenska, och processade så att alla egennamn ersatts av textsträngen ’egennamn’. Varje rad motsvarar en annotering med titel.

Data behandlas i Python med:
import pandas as pd
annotations_df = pd.read_pickle("Technical_Language_Annotations.pkl")
annotation_contents = annotations_df['noteComment']
annotation_titles = annotations_df['title']</abstract>
      <sumDscr>
        <nation xml:lang="en" abbr="SE">Sweden</nation>
        <nation xml:lang="sv" abbr="SE">Sverige</nation>
        <dataKind xml:lang="en">Text</dataKind>
        <dataKind xml:lang="en">Other</dataKind>
      </sumDscr>
    </stdyInfo>
    <method>
      <dataColl />
    </method>
    <dataAccs>
      <useStmt>
        <restrctn xml:lang="en">Access to data through SND. Access to data is restricted.</restrctn>
        <restrctn xml:lang="sv">Åtkomst till data via SND. Tillgång till data är begränsad.</restrctn>
        <conditions elementVersion="info:eu-repo-Access-Terms vocabulary">restrictedAccess</conditions>
      </useStmt>
    </dataAccs>
    <othrStdyMat>
      <relPubl>
        <citation>
          <titlStmt>
            <titl xml:lang="en">Löwenmark, K., Taal, C., Nivre, J., Liwicki, M., &amp; Sandin, F. (2022). Processing of Condition Monitoring Annotations with BERT and Technical Language Substitution: A Case Study. In Proceedings of the 7th European Conference of the Prognostics and Health Management Society 2022 (pp. 306–314).</titl>
            <parTitl xml:lang="en">Löwenmark, K., Taal, C., Nivre, J., Liwicki, M., &amp; Sandin, F. (2022). Processing of Condition Monitoring Annotations with BERT and Technical Language Substitution: A Case Study. In Proceedings of the 7th European Conference of the Prognostics and Health Management Society 2022 (pp. 306–314).</parTitl>
            <IDNo agency="DOI">10.36001/phme.2022.v7i1.3356</IDNo>
            <IDNo agency="URN">urn:nbn:se:ltu:diva-95407</IDNo>
            <IDNo agency="SwePub">oai:DiVA.org:ltu-95407</IDNo>
          </titlStmt>
          <distStmt>
            <distDate date="2022">2022</distDate>
          </distStmt>
          <any xml:lang="en" xmlns="http://purl.org/dc/elements/1.1/">oai:DiVA.org:ltu-95407</any>
        </citation>
      </relPubl>
    </othrStdyMat>
  </stdyDscr>
</codeBook>