<?xml version="1.0" encoding="utf-8"?>
<codeBook xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns="ddi:codebook:2_5" version="2.5" xsi:schemaLocation="ddi:codebook:2_5 http://www.ddialliance.org/Specification/DDI-Codebook/2.5/XMLSchema/codebook.xsd" xml:lang="en">
  <docDscr>
    <citation>
      <titlStmt>
        <titl>DDI description: PsyCoLaGe: Psychological Data for the CoLaGe Corpus from Mexico and Spain 2022-2023</titl>
        <parTitl xml:lang="fi">DDI-kuvailu: PsyCoLaGe: CoLaGe-korpuksen psykologinen aineisto Meksikosta ja Espanjasta 2022-2023</parTitl>
        <IDNo agency="FSD">4041</IDNo>
      </titlStmt>
      <prodStmt>
        <producer abbr="FSD">Finnish Social Science Data Archive</producer>
        <copyright>Finnish Social Science Data Archive</copyright>
        <prodPlac>Finnish Social Science Data Archive</prodPlac>
      </prodStmt>
      <verStmt>
        <version date="2026-03-10" type="mef_eng">1.0.0</version>
      </verStmt>
      <biblCit>PsyCoLaGe: Psychological Data for the CoLaGe Corpus from Mexico and Spain 2022-2023 [metadata]. Metadata version 1.0.0 (2026-03-10). Finnish Social Science Data Archive [producer and distributor]. DOI: https://doi.org/10.60686/t-fsd4041; URN: https://urn.fi/urn:nbn:fi:fsd:T-FSD4041</biblCit>
      <holdings location="Finnish Social Science Data Archive FSD" URI="https://urn.fi/urn:nbn:fi:fsd:T-FSD4041" />
    </citation>
    <notes xml:lang="fi">FSD:n aineistokuvailut (FSD metadata records), joiden tekijä on Suomen yhteiskuntatieteellinen tietoarkisto (Finnish Social Science Data Archive), on lisensoitu Creative Commons 1.0 Yleismaailmallinen (CC0 1.0) -lisenssillä.
      <ExtLink URI="https://creativecommons.org/publicdomain/zero/1.0/deed.fi" />
    </notes>
    <notes xml:lang="en">FSD:n aineistokuvailut (FSD metadata records) by Suomen yhteiskuntatieteellinen tietoarkisto (Finnish Social Science Data Archive) are licensed under a Creative Commons 1.0 Universal (CC0 1.0) license.
      <ExtLink URI="https://creativecommons.org/publicdomain/zero/1.0/deed.en" />
    </notes>
    <notes xml:lang="sv">FSD:n aineistokuvailut (FSD metadata records) av Finlands samhällsvetenskapliga dataarkiv (Finnish Social Science Data Archive) är licensierade under en Creative Commons 1.0 Universiell (CC0 1.0) licens.
      <ExtLink URI="https://creativecommons.org/publicdomain/zero/1.0/deed.sv" />
    </notes>
  </docDscr>
  <stdyDscr>
    <citation>
      <titlStmt>
        <titl>PsyCoLaGe: Psychological Data for the CoLaGe Corpus from Mexico and Spain 2022-2023</titl>
        <parTitl xml:lang="fi">PsyCoLaGe: CoLaGe-korpuksen psykologinen aineisto Meksikosta ja Espanjasta 2022-2023</parTitl>
        <IDNo agency="FSD">4041</IDNo>
        <IDNo agency="URN">urn:nbn:fi:fsd:T-FSD4041</IDNo>
        <IDNo agency="DOI">10.60686/t-fsd4041</IDNo>
      </titlStmt>
      <rspStmt>
        <AuthEnty affiliation="University of Helsinki">Kachel, Sven
          <ExtLink URI="https://orcid.org/0000-0002-4641-946X" role="PID" title="ORCID">0000-0002-4641-946X</ExtLink>
        </AuthEnty>
        <AuthEnty affiliation="University of Helsinki">Posio, Pekka
          <ExtLink URI="https://orcid.org/0000-0003-0563-2755" role="PID" title="ORCID">0000-0003-0563-2755</ExtLink>
        </AuthEnty>
      </rspStmt>
      <prodStmt>
        <copyright>In accordance with the agreement between FSD and the depositor.</copyright>
        <grantNo agency="Kone Foundation">202007066</grantNo>
      </prodStmt>
      <distStmt>
        <distrbtr abbr="FSD" URI="https://www.fsd.tuni.fi/">Finnish Social Science Data Archive</distrbtr>
        <distDate date="2026-04-22" />
      </distStmt>
      <serStmt ID="S8" URI="https://services.fsd.tuni.fi/catalogue/series/8?lang=en">
        <serName>Individual datasets</serName>
        <serInfo>
          <p>Individual datasets that do not belong to any series.</p>
        </serInfo>
      </serStmt>
      <verStmt>
        <version date="2026-02-24" type="main_data">1.0</version>
      </verStmt>
      <biblCit>Kachel, Sven (University of Helsinki) &amp; Posio, Pekka (University of Helsinki): PsyCoLaGe: Psychological Data for the CoLaGe Corpus from Mexico and Spain 2022-2023 [dataset]. Data version 1.0 (2026-02-24). Finnish Social Science Data Archive [distributor]. DOI: https://doi.org/10.60686/t-fsd4041; URN: https://urn.fi/urn:nbn:fi:fsd:T-FSD4041</biblCit>
      <holdings location="Finnish Social Science Data Archive FSD" URI="https://urn.fi/urn:nbn:fi:fsd:T-FSD4041" />
    </citation>
    <stdyInfo>
      <subject>
        <keyword vocab="ELSST" vocabURI="https://elsst.cessda.eu/id">gender expression</keyword>
        <keyword vocab="ELSST" vocabURI="https://elsst.cessda.eu/id">femininity</keyword>
        <keyword vocab="ELSST" vocabURI="https://elsst.cessda.eu/id">masculinity</keyword>
        <keyword vocab="ELSST" vocabURI="https://elsst.cessda.eu/id">gender role</keyword>
        <keyword vocab="ELSST" vocabURI="https://elsst.cessda.eu/id">sex</keyword>
        <keyword vocab="ELSST" vocabURI="https://elsst.cessda.eu/id">homosexuality</keyword>
        <keyword vocab="ELSST" vocabURI="https://elsst.cessda.eu/id">personality</keyword>
        <keyword vocab="ELSST" vocabURI="https://elsst.cessda.eu/id">speech</keyword>
        <keyword vocab="ELSST" vocabURI="https://elsst.cessda.eu/id">attitudes</keyword>
        <topcClas vocab="OKM" vocabURI="http://www.yso.fi/onto/okm-tieteenala/conceptscheme">Social sciences</topcClas>
        <topcClas vocab="OKM" vocabURI="http://www.yso.fi/onto/okm-tieteenala/conceptscheme">Humanities</topcClas>
        <topcClas vocab="CESSDA Topic Classification" vocabURI="https://vocabularies.cessda.eu/urn/urn:ddi:int.cessda.cv:TopicClassification:4.2.3">Gender and gender roles</topcClas>
        <topcClas vocab="CESSDA Topic Classification" vocabURI="https://vocabularies.cessda.eu/urn/urn:ddi:int.cessda.cv:TopicClassification:4.2.3">Social behaviour and attitudes</topcClas>
      </subject>
      <abstract>
        <p>The PsyCoLaGe data collected in Spain and Mexico is part of the research project 'Gender, Society and Language Use: Evidence from Mexico and Spain' and contains the project's psychological data. The project also collected the CoLaGe corpus, which has been archived in the Language Bank of Finland (for further information, see 'Other Material'). The PsyCoLaGe data can be used to examine, for example, various research questions related to gender, gender roles and gender stereotypes, and it can additionally be used together with the corpus.</p>
        <p>The data were used to examine respondents' attitudes and perceptions primarily regarding gender and partly sexuality. This was carried out using various instruments measuring psychological characteristics, which assessed, for example, respondents' views on gender role ideologies, attitudes towards gay men, behaviour-based gender role self-concept, and perceptions of the relationship between voice characteristics and gender. The modes of measurement varied. Respondents were asked, for example, to evaluate whether the sentences presented in the questionnaire were uttered by women or men, whether certain voice or personality traits were typical of women, men or both genders, and whether they agreed or disagreed with statements concerning gender.</p>
        <p>The variable labels in the archived dataset include information on which instrument measuring psychological characteristics each variable belongs to. Some value labels of the variables include annotations indicating whether the voice features, sentences, and descriptions of everyday tasks presented to respondents are female‑typical or male‑typical, and whether the presented statement is egalitarian or traditional. These annotations are based on the instruments used to measure psychological characteristics.</p>
        <p>The full questions, question preambles, and response options can be found in the questionnaire (quF4041_mul.pdf). The questions were presented to respondents either in Peninsular Spanish or Mexican Spanish depending on their nationality, not in English.</p>
        <p>The background variables of the dataset are nationality, gender, sexual orientation and a dichotomous age group.</p>
      </abstract>
      <sumDscr>
        <timePrd event="start" date="2022" />
        <timePrd event="end" date="2023" />
        <collDate event="start" date="2022-02" />
        <collDate event="end" date="2023-06" />
        <nation abbr="ES">Spain</nation>
        <nation abbr="MX">Mexico</nation>
        <geogCover>Valencia</geogCover>
        <geogCover>Guadalajara</geogCover>
        <anlyUnit>Individual
          <concept vocab="DDI Analysis Unit" vocabURI="https://vocabularies.cessda.eu/urn/urn:ddi:int.ddi.cv:AnalysisUnit:2.1.3">Individual</concept>
        </anlyUnit>
        <universe clusion="I">The adult population of Valencia and Guadalajara</universe>
        <dataKind>Quantitative</dataKind>
      </sumDscr>
    </stdyInfo>
    <method>
      <dataColl>
        <timeMeth>Cross-section
          <concept vocab="DDI Time Method" vocabURI="https://vocabularies.cessda.eu/urn/urn:ddi:int.ddi.cv:TimeMethod:1.2.3">CrossSection</concept>
        </timeMeth>
        <dataCollector affiliation="University of Helsinki">Kachel, Sven</dataCollector>
        <dataCollector affiliation="University of Helsinki">Posio, Pekka</dataCollector>
        <dataCollector affiliation="University of Helsinki">Uclés Ramada, Gloria</dataCollector>
        <dataCollector affiliation="University of Guadalajara">González Guzmán, Grecia</dataCollector>
        <sampProc>Non-probability: Availability
          <concept vocab="DDI Sampling Procedure" vocabURI="https://vocabularies.cessda.eu/urn/urn:ddi:int.ddi.cv:SamplingProcedure:2.0.2">Nonprobability.Availability</concept>
        </sampProc>
        <sampProc>Non-probability: Respondent-assisted
          <concept vocab="DDI Sampling Procedure" vocabURI="https://vocabularies.cessda.eu/urn/urn:ddi:int.ddi.cv:SamplingProcedure:2.0.2">Nonprobability.RespondentAssisted</concept>
        </sampProc>
        <sampProc>Non-probability: Purposive
          <concept vocab="DDI Sampling Procedure" vocabURI="https://vocabularies.cessda.eu/urn/urn:ddi:int.ddi.cv:SamplingProcedure:2.0.2">Nonprobability.Purposive</concept>
        </sampProc>
        <sampProc>
          <p>Respondents were initially recruited through social media. To achieve a sufficiently large sample size, additional respondents were recruited through the researchers' personal contacts (excluding friends and relatives). In addition, respondents who had already been reached recruited further participants (i.e. snowball sampling).</p>
        </sampProc>
        <collMode>Self-administered questionnaire: Web-based (CAWI)
          <concept vocab="DDI Mode of Collection" vocabURI="https://vocabularies.cessda.eu/urn/urn:ddi:int.ddi.cv:ModeOfCollection:5.0.1">SelfAdministeredQuestionnaire.CAWI</concept>
        </collMode>
        <collMode>Psychological measurements and tests
          <concept vocab="DDI Mode of Collection" vocabURI="https://vocabularies.cessda.eu/urn/urn:ddi:int.ddi.cv:ModeOfCollection:5.0.1">MeasurementsAndTests.Psychological</concept>
        </collMode>
        <resInstru>Structured questionnaire
          <concept vocab="DDI Type of Instrument" vocabURI="https://vocabularies.cessda.eu/urn/urn:ddi:int.ddi.cv:TypeOfInstrument:1.1.2">Questionnaire.Structured</concept>
        </resInstru>
        <weight>There are no weight variables in the data.</weight>
      </dataColl>
      <stdyClas type="B">Study description in Finnish and English. The data files are generally not processed and are retained in the form they were delivered in by the researcher. If necessary, the archive anonymises the data.</stdyClas>
    </method>
    <dataAccs>
      <setAvail>
        <accsPlac URI="https://www.fsd.tuni.fi/">Finnish Social Science Data Archive</accsPlac>
        <complete>The dataset does not include the original date variable, as it did not function as intended across all file formats. Two new variables, Recording_time_year and Recording_time_month, have been created in the archived dataset based on the original variable. Together, these variables contain the same information as the original variable.</complete>
      </setAvail>
      <useStmt>
        <specPerm ID="eng_unique_specPerm_2519-FSD4041">The research group collected both linguistic and psychological survey data. The linguistic corpus data are archived at the Language Bank of Finland and the psychological survey data with FSD. The research group exclusively holds a master key document linking informant codes across the two datasets; this document is available only from the authors of the dataset upon reasonable request.</specPerm>
        <restrctn>The dataset is (D) available only by permission from the data depositor/creator.</restrctn>
        <citReq>The data and its creators shall be cited in all publications and presentations for which the data have been used. The bibliographic citation may be in the form suggested by the archive or in the form required by the publication.</citReq>
        <deposReq>Notify FSD of all publications where you have used the data by sending the citation information to user-services.fsd@tuni.fi.</deposReq>
        <disclaimer>The original data creators and the archive bear no responsibility for any results or interpretations arising from the reuse of the data.</disclaimer>
      </useStmt>
      <notes>For confidentiality reasons, the researchers anonymised the data by removing variables describing the respondent's level of education, main activity, marital status, number of children, childhood region, size of childhood region, and the country of residence at the time of data collection. For the same reason, variables indicating the respondent's age and sexual orientation were recoded into broader categories. In addition, the responses of four participants were removed from the archived dataset to ensure their anonymity.</notes>
      <notes>Additional items that are not part of the original scale have been added to the BSRI scale in this dataset.</notes>
      <notes>The last six characters of the variable Informant_ID, consisting of four letters and two digits, were generated randomly and form the respondent ID. The other characters in the variable indicate the respondent's corpus, gender, and age group.</notes>
    </dataAccs>
    <othrStdyMat>
      <relMat>PsyCoLaGe: Data and Measurement Description. Included as an appendix to the dataset.</relMat>
      <relPubl xml:lang="en">Posio, P., *Kachel, S., &amp; Uclés Ramada, G. (2024). Morphosyntactic stereotypes of speakers with different genders and sexual orientations: An experimental investigation. Linguistics, online first. https://doi.org/10.1515/ling-2022-0143
        <citation>
          <titlStmt>
            <titl>Morphosyntactic stereotypes of speakers with different genders and sexual orientations: An experimental investigation</titl>
            <IDNo agency="DOI">10.1515/ling-2022-0143</IDNo>
          </titlStmt>
          <distStmt>
            <distDate date="2024" />
          </distStmt>
          <holdings URI="https://doi.org/10.1515/ling-2022-0143" />
        </citation>
      </relPubl>
      <relPubl xml:lang="en">Posio, P., Kachel, S., &amp; Uclés Ramada, G. (2025). Sociolinguistic and functional variation in the use of direct reported speech in Spanish in the corpus CoLaGe-Valencia. Spanish in Context, online first. https://doi.org/10.1075/sic.24023.pos
        <citation>
          <titlStmt>
            <titl>Sociolinguistic and functional variation in the use of direct reported speech in Spanish in the corpus CoLaGe-Valencia</titl>
            <IDNo agency="DOI">10.1075/sic.24023.pos</IDNo>
          </titlStmt>
          <distStmt>
            <distDate date="2025" />
          </distStmt>
          <holdings URI="https://doi.org/10.1075/sic.24023.pos" />
        </citation>
      </relPubl>
      <relPubl xml:lang="en">Uclés Ramada, G., Kachel, S., &amp; Posio, P. J. (2025). Conflict, gender, and amount of talk: Gender differences in Spanish role play data. Pragmatics and Society. https://doi.org/10.1075/ps.23144.ucl
        <citation>
          <titlStmt>
            <titl>Conflict, gender, and amount of talk: Gender differences in Spanish role play data</titl>
            <IDNo agency="DOI">10.1075/ps.23144.ucl</IDNo>
          </titlStmt>
          <distStmt>
            <distDate date="2026" />
          </distStmt>
          <holdings URI="https://doi.org/10.1075/ps.23144.ucl" />
        </citation>
      </relPubl>
    </othrStdyMat>
  </stdyDscr>
  <otherMat level="study" URI="https://urn.fi/urn:nbn:fi:lb-2024030608">
    <labl>A speech and text corpus archived in the Language Bank of Finland for research on language and gender in Mexico and Spain</labl>
    <txt>The corpus was collected from the same respondents who participated in the FSD4041 dataset archived at the Finnish Social Science Data Archive: PsyCoLaGe: Psychological Data for the CoLaGe Corpus from Mexico and Spain 2022-2023.</txt>
  </otherMat>
</codeBook>
