<?xml version="1.0" encoding="UTF-8" ?>
<!-- module name : ethmigsurveydataDDIPrototype.xml -->
<!-- module in-charge : alexandre.mairot@sciencespo.fr (CDSP) -->
<!-- module title : PROTOTYPE DDI2 ETHMIGSURVEYDATA -->
<!-- module program : XML DDI -->
<!-- module version date : 2019-06-21 -->
<codeBook xmlns="ddi:codebook:2_5" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:dcterms="http://purl.org/dc/terms/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" ID="FIN031" xml:lang="en" version="2.5" xsi:schemaLocation="ddi:codebook:2_5 http://www.ddialliance.org/Specification/DDI-Codebook/2.5/XMLSchema/codebook.xsd">
  <docDscr>
    <citation>
      <titlStmt>
        <titl>Eurostudent V: Finland 2014</titl>
      </titlStmt>
      <dcterms:spatial>Finland</dcterms:spatial>
      <dc:identifier>4484</dc:identifier>
      <dc:contributor>Annina Claesson &lt;a target='_blank' href="https://orcid.org/0000-0002-4114-2406"&gt;&lt;img class="inline ml-1" src="https://i0.wp.com/info.orcid.org/wp-content/uploads/2021/12/orcid_16x16.gif?resize=16%2C16&amp;ssl=1" alt='' /&gt;&lt;/a&gt;</dc:contributor>
      <dcterms:modified>2021-12-02</dcterms:modified>
      <dcterms:temporal>2000-01-01</dcterms:temporal>
      <dc:coverage>All nation-wide surveys irrespective of sample size</dc:coverage>
      <dc:coverage>The topics of the survey are particularly well suited for the study of the integration of EMMs in Finland and the survey includes a sizeable number of EMM respondents (even if smaller than 400)</dc:coverage>
    </citation>
  </docDscr>
  <stdyDscr>
    <citation>
      <titlStmt>
        <titl>Opiskelijatutkimus 2014</titl>
        <parTitl xml:lang="en">Eurostudent V: Finland 2014</parTitl>
        <IDNo>FIN031</IDNo>
      </titlStmt>
      <prodStmt>
        <producer>Statistics Finland</producer>
        <copyright>Ministry of Education and Culture; Statistics Finland; Eurostudent consortium</copyright>
      </prodStmt>
      <distStmt>
        <distrbtr>Finnish Social Science Data Archive (FSD)</distrbtr>
      </distStmt>
      <serStmt>
        <serInfo>2000-05-01</serInfo>
      </serStmt>
      <biblCit>Ministry of Education and Culture &amp; Statistics Finland &amp; Eurostudent consortium: Eurostudent V: Finland 2014 [dataset]. Version 2.0 (2017-08-21). Finnish Social Science Data Archive [distributor]. http://urn.fi/urn:nbn:fi:fsd:T-FSD2978</biblCit>
    </citation>
    <stdyInfo>
      <subject>
        <keyword>Educational attainment/trajectory, human capital, skills</keyword>
        <keyword>Housing/housing access</keyword>
        <keyword>Financial situation and/or economic inequality</keyword>
        <keyword>Labour market integration and/or socioeconomic mobility</keyword>
        <keyword>Time use</keyword>
        <topcClas>Demography.Migration</topcClas>
        <topcClas>SocialStratificationAndGroupings.Minorities</topcClas>
        <topcClas>Economics.EconomicConditionsAndIndicators</topcClas>
        <topcClas>Economics.IncomePropertyAndInvestmentSaving</topcClas>
        <topcClas>LabourAndEmployment.Employment</topcClas>
        <topcClas>SocialStratificationAndGroupings.SocialAndOccupationalMobility</topcClas>
        <topcClas>SocietyAndCulture.TimeUse</topcClas>
        <topcClas>HousingAndLandUse.Housing</topcClas>
      </subject>
      <sumDscr>
        <collDate event="start">2013-03-25</collDate>
        <collDate event="end">2013-05-15</collDate>
        <collDate cycle="Opiskelijatutkimukset"></collDate>
        <nation abbr="FI">Finland</nation>
        <geogCover><![CDATA[
National
]]></geogCover>
        <universe clusion="I"><![CDATA[
Adult population (18+ or 15+) only
Both men and women
]]></universe>
      </sumDscr>
      <notes subject="inclusion in a large survey">
2.6: While the survey has been running since 2000, the 2014 wave was the only wave thus far for which a sufficient number of EMM respondents could be identified
</notes>
    </stdyInfo>
    <method>
      <dataColl>
        <timeMeth method="Repeated cross-section (multiple waves with different samples)"></timeMeth>
        <dataCollector>Statistics Finland</dataCollector>
        <frequenc>Irregular</frequenc>
        <sampProc><![CDATA[
Survey include subgroup of majority pop: Yes
Survey designed as a general population survey: Yes
Sampling strategy - closed: Random sampling/selection (i.e. probability sampling, of some kind)
Sampling strategy - open: Probability: Stratified and disproportional
]]></sampProc>
        <sampleFrame>
          <txt><![CDATA[
Representative of the population: Yes
Sample design - full information: The samples were drawn based on information on students attending educational institutions, Statistics Finland’s register data derived from the educational institution statistics, and the address information in the Finnish Population Information System (väestötietojärjestelmä). The sample was divided into five strata: Finnish university students, foreign university students, postgraduates, Finnish university of applied sciences (polytechnics) students, and foreign university of applied sciences students. In order to receive reliable data on foreign students and postgraduates, as their numbers were much smaller, oversampling was used for these two groups. Cluster sampling was not used
]]></txt>
          <universe clusion="I"><![CDATA[
EMM Target population: which minority group(s): Foreign students (including students in adult education) studying for ISCED 2011 5, 6 and 7 level degrees in Finnish universities, universities of applied sciences (polytechnics) and other higher education institutions during the academic year 2012-2013
Was the EMM target population…: A selection of residents of foreign/immigrant origin or ancestry in the city/region/country
Operationalization of target population: Information not available on definition of target population
Sampling frame(s): Statistics Finland’s register data on students; Student registers of educational institutions; List of addresses in the Finnish Population Information System (väestötietojärjestelmä)
]]></universe>
          <frameUnit ID="frameUnit_total">
            <unitType numberOfUnits="00000"><![CDATA[
Sampling units: Individuals
]]></unitType>
            <txt>[Total]</txt>
          </frameUnit>
          <frameUnit ID="frameUnit_sg1">
            <unitType></unitType>
            <txt>Finnish university students</txt>
          </frameUnit>
          <frameUnit ID="frameUnit_sg2">
            <unitType></unitType>
            <txt>Foreign university students</txt>
          </frameUnit>
        </sampleFrame>
        <targetSampleSize>
          <sampleSize ID="sampleSize_total">19809</sampleSize>
        </targetSampleSize>
        <targetSampleSize>
          <sampleSize ID="sampleSize_sg1">4740</sampleSize>
        </targetSampleSize>
        <targetSampleSize>
          <sampleSize ID="sampleSize_sg2">3909</sampleSize>
        </targetSampleSize>
        <collMode>
Web/email survey; Paper self-administered (postal)
</collMode>
        <sources>
          <srcDocu>http://urn.fi/urn:nbn:fi:fsd:T-FSD2978</srcDocu>
        </sources>
        <collSitu><![CDATA[
Questionnaire in migrant language: Yes
Language of questionnaire: English
Average duration/length of interview: 23
Number of questions: 86
]]></collSitu>
        <weight><![CDATA[
Are weights provided: Yes
Description: There are two weight variables in the data: sampling weight (paino1) and scaled weight (paino2). The weighting is based on calibration. Weights were separately calculated for each of the five strata. Base weights used in calibration for each stratum were calculated by dividing the frame population by the number of responses. Marginal distributions used in calibration were the frame population frequencies of fields of education, age groups, and gender distribution of students in each institution. Because the equivalent variables were available for the respondents, calibrating the weights was possible by using the CALMAR software developed by the National Institute of Statistics and Economic Studies (France). Some categories were combined. The results of the survey are weighted (institution, field of education, gender, age) to be representative of degree students in universities and universities of applied sciences. The values of weight variables are higher for groups that had above-average non-response. Foreign students were overrepresented in the sample and the values of weight variables are thus lower for them. For Finnish students, the average weight variable is 85 (meaning that one respondent represents this number of students), and variation between the weight variables is between 11 and 256. Average weight variable for foreign students is 18 and variation between the variables is 2-75
]]></weight>
      </dataColl>
      <notes subject="SG1 issues">Only gross sample reported</notes>
      <notes subject="SG2 issues">Only gross sample reported</notes>
      <anlyInfo>
        <respRate ID="respRate_total"><![CDATA[
Overall response rate: 33
Overall response rate calculated: By data producers with no mentioned formula
]]></respRate>
        <respRate ID="respRate_sg1"><![CDATA[
]]></respRate>
        <respRate ID="respRate_sg2"><![CDATA[
]]></respRate>
        <dataAppr ID="dataAppr_sg1">Only gross sample reported</dataAppr>
      </anlyInfo>
      <stdyClas>Survey in development/not yet completed: No</stdyClas>
    </method>
    <dataAccs>
      <setAvail>
        <accsPlac>Finnish Social Science Data Archive (FSD): https://services.fsd.tuni.fi/catalogue/FSD2978?tab=download&amp;study_language=fi</accsPlac>
        <avlStatus><![CDATA[
Availability of the survey dataset: Available by request
Access to complete dataset: Yes, micro-data available for download/direct access by researchers
Access to portions of dataset: Not applicable (full dataset accessible)
Access to aggregate data results: Yes
]]></avlStatus>
      </setAvail>
      <useStmt>
        <restrctn>The dataset is available for research, teaching and study only</restrctn>
      </useStmt>
      <notes>8.3, 8.12, 8.18: FSD uses the same ID for their dataset, technical documentation and questionnaire. This is because the ID is intended to cover all materials about the survey that have been deposited with FSD. 8.4, 8.13, 8.19: FSD does not use DOIs for their dataset, technical documentation or questionnaire. Instead, they use URN as the persistent identifier. For all these items, the same URN is used: http://urn.fi/urn:nbn:fi:fsd:T-FSD2978 . 8.5: Some variables have been removed/recoded in order to anonymise the data</notes>
    </dataAccs>
    <othrStdyMat>
      <relMat ID="relMat_technical">
        <citation>
          <titlStmt>
            <titl>Technical survey documentation</titl>
            <IDNo>FSD2978</IDNo>
          </titlStmt>
          <holdings location="Finnish Social Science Data Archive (FSD)" URI="https://services.fsd.tuni.fi/catalogue/FSD2978/PIP/cbF2978.pdf"></holdings>
          <dcterms:available>Yes, publicly available</dcterms:available>
          <dcterms:conformsTo>Data Documentation Initiative</dcterms:conformsTo>
          <dc:language>Finnish</dc:language>
          <dc:language>FIN</dc:language>
        </citation>
      </relMat>
      <relMat ID="relMat_questionnaire">
        <citation>
          <titlStmt>
            <titl>Questionnaire</titl>
            <IDNo>FSD2978</IDNo>
          </titlStmt>
          <verStmt>
            <version>Not applicable</version>
          </verStmt>
          <holdings location="Finnish Social Science Data Archive (FSD)" URI="https://services.fsd.tuni.fi/catalogue/FSD2978/PIP/quF2978_fin.pdf"></holdings>
          <dcterms:available>Publicly available</dcterms:available>
          <dc:language>Finnish</dc:language>
          <dc:language>FIN</dc:language>
        </citation>
      </relMat>
      <relStdy>
        <citation>
          <titlStmt>
            <titl>Opiskelijatutkimukset</titl>
            <parTitl xml:lang="en">Eurostudent V</parTitl>
            <IDNo>EVF2000</IDNo>
          </titlStmt>
        </citation>
      </relStdy>
      <relStdy>
        <citation>
          <titlStmt>
            <titl>No</titl>
          </titlStmt>
        </citation>
      </relStdy>
      <othRefs>
        <citation>
          <titlStmt>
            <titl>Any other publications</titl>
          </titlStmt>
        </citation>
      </othRefs>
    </othrStdyMat>
  </stdyDscr>
  <fileDscr>
    <fileTxt>
      <fileCitation>
        <titlStmt>
          <titl></titl>
          <IDNo>FSD2978</IDNo>
        </titlStmt>
      </fileCitation>
      <fileCont><![CDATA[
Migrant/minority related questions: Country of birth of respondent; Country of birth of parents; Mother tongue/language related question
Dataset language(s) available: Finnish; English; FIN; ENG
]]></fileCont>
    </fileTxt>
    <notes>3.3: Statistics Finland likely had information on a student’s country of birth and their native language based on the information registered in the Finnish Population Information System, but it is not directly mentioned which variable(s) they used in operationalising the EMM target population</notes>
  </fileDscr>
</codeBook>