<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type='text/xsl' href='/oai/static/oai2.xsl' ?><OAI-PMH xmlns="http://www.openarchives.org/OAI/2.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/ http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd">
  <responseDate>2026-05-25T09:51:35Z</responseDate>
  <request identifier="0643e7c0a1f2dd7f42d44235b3dd4d0f65a4a9481e1ab90ca9bbce3a2146bdcc" metadataPrefix="oai_ddi25" verb="GetRecord">https://datacatalogue.cessda.eu/oai-pmh/v0/oai</request>
  <GetRecord>
    <record>
    <header>
      <identifier>0643e7c0a1f2dd7f42d44235b3dd4d0f65a4a9481e1ab90ca9bbce3a2146bdcc</identifier>
      <datestamp>2026-02-09T03:09:27Z</datestamp>
      <setSpec>language:en</setSpec><setSpec>openaire_data</setSpec>
    </header>
      <metadata>
        <codeBook xmlns="ddi:codebook:2_5" version="2.5" xsi:schemaLocation="ddi:codebook:2_5 http://www.ddialliance.org/Specification/DDI-Codebook/2.5/XMLSchema/codebook.xsd">
    <docDscr>
      <citation>
        <titlStmt>
          <titl xml:lang="en">DDI study level documentation for study 10.7802/2990 Web Survey: Data Annotation Bottleneck and Active Learning for Natural Language Processing in the Era of Large Language Models</titl>
        </titlStmt>
        <prodStmt>
        </prodStmt>
        <holdings xml:lang="en" URI="https://search.gesis.org/research_data/SDN-10.7802-2990?lang=en"/><holdings xml:lang="de" URI="https://search.gesis.org/research_data/SDN-10.7802-2990?lang=de"/>
      </citation>
    </docDscr>
  <stdyDscr>
    <citation>
      <titlStmt>
        <titl xml:lang="en">Web Survey: Data Annotation Bottleneck and Active Learning for Natural Language Processing in the Era of Large Language Models</titl>
        <parTitl xml:lang="de">Web Survey: Data Annotation Bottleneck and Active Learning for Natural Language Processing in the Era of Large Language Models</parTitl>
        <IDNo xml:lang="en" agency="GESIS">10.7802/2990</IDNo><IDNo xml:lang="de" agency="GESIS">10.7802/2990</IDNo><IDNo xml:lang="en" agency="DOI">10.7802/2990</IDNo><IDNo xml:lang="de" agency="DOI">10.7802/2990</IDNo>
      </titlStmt>
      <rspStmt>
        <AuthEnty affiliation="GESIS - Leibniz Institut für Sozialwissenschaften" xml:lang="en">Romberg, Julia
        </AuthEnty><AuthEnty affiliation="GESIS - Leibniz Institut für Sozialwissenschaften" xml:lang="de">Romberg, Julia
        </AuthEnty><AuthEnty affiliation="Institute for Applied Informatics at Leipzig University (InfAI), Center for Scalable Data Analytics and Artificial Intelligence (ScaDS.AI) Dresden/Leipzig, Leipzig University" xml:lang="en">Schröder, Christopher
        </AuthEnty><AuthEnty affiliation="Institute for Applied Informatics at Leipzig University (InfAI), Center for Scalable Data Analytics and Artificial Intelligence (ScaDS.AI) Dresden/Leipzig, Leipzig University" xml:lang="de">Schröder, Christopher
        </AuthEnty><AuthEnty affiliation="Dresden University of Technology" xml:lang="en">Gonsior, Julius
        </AuthEnty><AuthEnty affiliation="Dresden University of Technology" xml:lang="de">Gonsior, Julius
        </AuthEnty>
      </rspStmt>
      <prodStmt>
        <prodDate xml:lang="en"/>
      </prodStmt>
      <distStmt>
        <distrbtr abbr="GESIS" URI="http://www.gesis.org/" xml:lang="en">GESIS Data Archive for the Social Sciences</distrbtr><distrbtr abbr="GESIS" URI="http://www.gesis.org/" xml:lang="de">GESIS Datenarchiv für Sozialwissenschaften</distrbtr>
        <distDate xml:lang="en" date="2026"/><distDate xml:lang="de" date="2026"/>
      </distStmt>
      <verStmt>
        <version date="2026" xml:lang="en"/><version date="2026" xml:lang="de"/>
      </verStmt>
      <holdings xml:lang="en" URI="https://search.gesis.org/research_data/SDN-10.7802-2990?lang=en"/><holdings xml:lang="de" URI="https://search.gesis.org/research_data/SDN-10.7802-2990?lang=de"/>
    </citation>
    <stdyInfo>
      <subject>
        <keyword xml:lang="en">large language models</keyword><keyword xml:lang="en">supervised learning</keyword><keyword xml:lang="en">data annotation</keyword><keyword xml:lang="en">active learning</keyword><keyword xml:lang="en">practical application</keyword><keyword xml:lang="de">large language models</keyword><keyword xml:lang="de">supervised learning</keyword><keyword xml:lang="de">data annotation</keyword><keyword xml:lang="de">active learning</keyword><keyword xml:lang="de">practical application</keyword>
      </subject>
      <abstract xml:lang="en">We publish a dataset of 144 community perspectives on the need for annotated training data in the field of Natural Language Processing (NLP). The dataset documents how large language models (LLMs) have impacted the persistent issue of the lack of annotated data. Additionally, we inquire about the current state of the "active learning" annotation method. Our target group consists of experts from academia, industry, and government institutions.  The data was collected with a web survey that was open online to voluntary participants for 6 weeks, from December 15th, 2024, to January 26th, 2025.  keywords: large language models, supervised learning, data annotation, active learning, practical application</abstract><abstract xml:lang="de">We publish a dataset of 144 community perspectives on the need for annotated training data in the field of Natural Language Processing (NLP). The dataset documents how large language models (LLMs) have impacted the persistent issue of the lack of annotated data. Additionally, we inquire about the current state of the "active learning" annotation method. Our target group consists of experts from academia, industry, and government institutions.  The data was collected with a web survey that was open online to voluntary participants for 6 weeks, from December 15th, 2024, to January 26th, 2025.  keywords: large language models, supervised learning, data annotation, active learning, practical application</abstract>
      <sumDscr>
        <universe xml:lang="en" clusion="I">Experts in Natural Language Processing</universe>
      </sumDscr>
    </stdyInfo>
    <method>
      <dataColl>
        <collMode xml:lang="en">Selbstausfüller:CAWI(Computerunterstütztes Web-Interview)<concept/></collMode><collMode xml:lang="de">Selbstausfüller:CAWI(Computerunterstütztes Web-Interview)<concept/></collMode>
      </dataColl>
    </method>
    <dataAccs>
      <useStmt>
        <restrctn xml:lang="en">Free access (with registration) - The research data can be downloaded by registered users.
CC BY-NC-SA 4.0: Namensnennung - Nicht kommerziell – Weitergabe unter gleichen Bedingungen  (https://creativecommons.org/licenses/by-nc-sa/4.0/deed.de)</restrctn><restrctn xml:lang="de">Freier Zugang (mit Registrierung) - Die Forschungsdaten können von allen registrierten Nutzerinnen und Nutzern heruntergeladen werden.
CC BY-NC-SA 4.0: Namensnennung - Nicht kommerziell – Weitergabe unter gleichen Bedingungen  (https://creativecommons.org/licenses/by-nc-sa/4.0/deed.de)</restrctn>
      </useStmt>
    </dataAccs>
    <othrStdyMat>
    </othrStdyMat>
  </stdyDscr>
  <fileDscr>
  </fileDscr>
</codeBook>
      </metadata>
      <about>
        <provenance xmlns="http://www.openarchives.org/OAI/2.0/provenance" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/provenance http://www.openarchives.org/OAI/2.0/provenance.xsd">
    <originDescription harvestDate="2026-02-09T03:09:26Z" altered="true">
      <baseURL>http://dbkapps.gesis.org/dbkoai/oai.asp</baseURL>
      <identifier>oai:dbk.gesis.org:SDN/10.7802_2990</identifier>
      <datestamp>2026-01-31</datestamp>
      <metadataNamespace>ddi:codebook:2_5</metadataNamespace>
    </originDescription>
</provenance>
      </about>
    </record>
  </GetRecord>
</OAI-PMH>