<?xml version='1.0' encoding='UTF-8'?><codeBook xmlns="ddi:codebook:2_5" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="ddi:codebook:2_5 https://ddialliance.org/Specification/DDI-Codebook/2.5/XMLSchema/codebook.xsd" version="2.5"><docDscr><citation><titlStmt><titl>A dataset of 1500-word stories generated by gpt-4o-mini for 236 nationalities</titl><IDNo agency="DOI">doi:10.18710/VM2K4O</IDNo></titlStmt><distStmt><distrbtr source="archive">DataverseNO</distrbtr><distDate>2025-05-28</distDate></distStmt><verStmt source="archive"><version date="2025-05-28" type="RELEASED">1</version></verStmt><biblCit>Rettberg, Jill Walker; Wigers, Hermann, 2025, "A dataset of 1500-word stories generated by gpt-4o-mini for 236 nationalities", https://doi.org/10.18710/VM2K4O, DataverseNO, V1</biblCit></citation></docDscr><stdyDscr><citation><titlStmt><titl>A dataset of 1500-word stories generated by gpt-4o-mini for 236 nationalities</titl><IDNo agency="DOI">doi:10.18710/VM2K4O</IDNo><IDNo agency="Zenodo">10.5281/zenodo.14947238</IDNo><IDNo agency="GitHub">https://github.com/AI-STORIES-ERC/GPT_stories</IDNo></titlStmt><rspStmt><AuthEnty affiliation="University of Bergen">Rettberg, Jill Walker</AuthEnty><AuthEnty affiliation="University of Bergen">Wigers, Hermann</AuthEnty><othId role="Project Leader">Rettberg, Jill Walker</othId><othId role="Hosting Institution">University of Bergen</othId><othId role="Research Group">Center for Digital Culture</othId><othId role="Researcher">Wigers, Hermann</othId><othId role="Data Manager">Wigers, Hermann</othId><othId role="Project Member">Robinson, Colin</othId></rspStmt><prodStmt><producer affiliation="Center for Digital Narrative, University of Bergen" abbr="AI STORIES">AI STORIES</producer><prodPlac>Bergen, Norway</prodPlac><software version="3.11">Python</software><software version="gpt-4o-mini">OpenAI API</software><software version="not specified">distilbert-base-uncased-emotion</software><software 
version="0.19.0">TextBlob</software><grantNo agency="European Research Council">101142306</grantNo><grantNo agency="Research Council of Norway">332643</grantNo></prodStmt><distStmt><distrbtr source="archive">DataverseNO</distrbtr><distrbtr affiliation="Center for Digital Narrative" abbr="UiB" URI="https://dataverse.no/dataverse/uib">University of Bergen</distrbtr><contact affiliation="University of Bergen" email="Jill.walker.rettberg@uib.no">Rettberg, Jill Walker</contact><depositr>Rettberg, Jill Walker</depositr><depDate>2025-02-17</depDate></distStmt><holdings URI="https://doi.org/10.18710/VM2K4O"/></citation><stdyInfo><subject><keyword xml:lang="en">Arts and Humanities</keyword><keyword xml:lang="en">Computer and Information Science</keyword><keyword vocab="DH Thesaurus" vocabURI="https://vocabularyserver.com/dhthesaurus/">digital humanities</keyword><keyword vocab="Wikidata" vocabURI="https://www.wikidata.org/">digital humanities</keyword><keyword vocab="Wikidata" vocabURI="https://www.wikidata.org/">generative AI</keyword><keyword vocab="Wikidata" vocabURI="https://www.wikidata.org">gpt-4o-mini</keyword><keyword vocab="Wikidata" vocabURI="https://www.wikidata.org/">narration</keyword><keyword vocab="Wikidata" vocabURI="https://www.wikidata.org/">generative artificial intelligence</keyword><keyword vocab="Wikidata" vocabURI="https://www.wikidata.org">large language model</keyword><keyword vocab="Wikidata" vocabURI="https://www.wikidata.org/">synthetic data</keyword></subject><abstract date="2025-02-17">We created a dataset of stories generated by OpenAI’s gpt-4o-mini by using a Python script to construct prompts that were sent to the OpenAI API. We used Statistics Norway’s list of 252 countries, added demonyms for each country, for example Norwegian for Norway, and removed countries without demonyms, leaving us with 236 countries. Our base prompt was “Write a 1500 word potential {demonym} story”, and we generated 50 stories for each country.

The scripts used to generate the data, and additional scripts for analysis, are available at the GitHub repository https://github.com/MachineVisionUiB/GPT_stories</abstract><sumDscr><collDate cycle="P1" event="start" date="2025-01-13">2025-01-13</collDate><collDate cycle="P1" event="end" date="2025-01-19">2025-01-19</collDate><universe>AI-generated stories for each of the 236 nationalities with a demonym, drawn from the 252 countries listed in Statistics Norway's dataset of countries.</universe><dataKind>AI-generated text</dataKind></sumDscr></stdyInfo><method><dataColl><sources><dataSrc>https://github.com/MachineVisionUiB/GPT_stories</dataSrc></sources></dataColl><anlyInfo/></method><dataAccs><setAvail/><useStmt/><notes type="DVN:TOU" level="dv">&lt;a href="http://creativecommons.org/publicdomain/zero/1.0">CC0 1.0&lt;/a></notes></dataAccs><othrStdyMat><relPubl><citation><titlStmt><titl>Rettberg, Jill Walker and Hermann Wigers, forthcoming 2025, "AI-generated stories favour stability over change: homogeneity and cultural stereotyping in narratives generated by gpt-4o-mini" (submitted for review May 2025).</titl></titlStmt><biblCit>Rettberg, Jill Walker and Hermann Wigers, forthcoming 2025, "AI-generated stories favour stability over change: homogeneity and cultural stereotyping in narratives generated by gpt-4o-mini" (submitted for review May 2025).</biblCit></citation></relPubl></othrStdyMat></stdyDscr><otherMat ID="f249181" URI="https://dataverse.no/api/access/datafile/249181" level="datafile"><labl>00_README.txt</labl><txt>Description of the dataset.</txt><notes level="file" type="DATAVERSE:CONTENTTYPE" subject="Content/MIME Type">text/plain</notes></otherMat><otherMat ID="f249169" URI="https://dataverse.no/api/access/datafile/249169" level="datafile"><labl>country_data.csv</labl><txt>List of the countries we generated stories for, with country names and demonyms, alpha-2 and alpha-3 country codes, emoji flags, regions, sub-regions and 2023 population numbers. 
The list of 252 countries is from Statistics Norway. See 00_README.txt for details of where the other data is taken from. We only generated stories for the 236 countries with demonyms.</txt><notes level="file" type="DATAVERSE:CONTENTTYPE" subject="Content/MIME Type">text/comma-separated-values</notes></otherMat><otherMat ID="f249180" URI="https://dataverse.no/api/access/datafile/249180" level="datafile"><labl>gpt-stories.zip</labl><txt>Zip file containing generated stories, summaries, word frequencies, sentiments and protagonist names for 236 countries, generated by gpt-4o-mini in January and February 2025.</txt><notes level="file" type="DATAVERSE:CONTENTTYPE" subject="Content/MIME Type">application/zip</notes></otherMat></codeBook>