<?xml version='1.0' encoding='UTF-8'?>
<codeBook version="1.2.2" ID="ZA011-EXMORTALITY-01" xml-lang="en" xmlns="http://www.icpsr.umich.edu/DDI" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.icpsr.umich.edu/DDI http://www.icpsr.umich.edu/DDI/Version1-2-2.xsd">
  <docDscr>
    <citation>
      <titlStmt>
        <titl>
          ZA011 Excess Mortality: Surveillance Episodes Datasets
        </titl>
        <IDNo>
          ZA011-EXMORTALITY-01
        </IDNo>
      </titlStmt>
      <rspStmt>
        <AuthEnty affiliation="Agincourt">
          Prof Steve Tollman
        </AuthEnty>
        <AuthEnty affiliation="Agincourt">
          Prof Kathleen Khan
        </AuthEnty>
        <AuthEnty affiliation="Agincourt">
          Dr Chodziwadziwa Kabudula
        </AuthEnty>
        <AuthEnty affiliation="SAPRIN">
          Dr Kobus Herbst
        </AuthEnty>
        <AuthEnty affiliation="Nyanja Health Research Institute">
          Dr Beth Tippett-Barr
        </AuthEnty>
      </rspStmt>
      <prodStmt>
        <producer/>
        <copyright>
          @2023
        </copyright>
        <software version="4.0.10" date="2018-05-02">
          Nesstar Publisher
        </software>
      </prodStmt>
    </citation>
  </docDscr>
  <stdyDscr>
    <citation>
      <titlStmt>
        <titl>
          ZA011 Excess Mortality: Surveillance Episodes Datasets
        </titl>
        <IDNo>
          ZA011-EXMORTALITY-01
        </IDNo>
      </titlStmt>
      <rspStmt>
        <AuthEnty affiliation="Agincourt">
          Prof Steve Tollman
        </AuthEnty>
        <AuthEnty affiliation="Agincourt">
          Prof Kathleen Khan
        </AuthEnty>
        <AuthEnty affiliation="SAPRIN">
          Dr Kobus Herbst
        </AuthEnty>
        <AuthEnty affiliation="Agincourt">
          Dr Chodziwadziwa Kabudula
        </AuthEnty>
        <AuthEnty affiliation="Nyanja Health Research Institute">
          Dr Beth Tippett-Barr
        </AuthEnty>
        <othId role="Data Review" affiliation="Agincourt">
          <p>
            SAMRC/Wits Agincourt Team
          </p>
        </othId>
        <othId role="Data Review And QA" affiliation="SAPRIN">
          <p>
            Kobus Herbst
          </p>
        </othId>
        <othId role="Reviews" affiliation="CHAMPS">
          <p>
            CHAMPS Team
          </p>
        </othId>
        
      </rspStmt>
      <prodStmt>
        <producer affiliation="Agincourt" role="Technical Assistance">
          Chodziwadziwa Kabudula
        </producer>
        <producer affiliation="SAPRIN" role="Technical Assistance">
          Kobus Herbst
        </producer>
        <producer affiliation="Agincourt" role="Technical Assistance">
          Daniel Ohene-Kwofie
        </producer>
        <producer affiliation="Agincourt" role="Technical Assistance">
          Jean Bashingwa
        </producer>
        <producer affiliation="Agincourt" role="Technical Assistance">
          Nkosinathi Masilela
        </producer>
        <producer affiliation="Agincourt" role="Technical Assistance">
          Rhulani Silaule
        </producer>
        <copyright>
          This dataset documentation is licensed under a Creative Commons Attribution-Non Commercial 4.0 International License. The dataset is shared in terms of the data-use agreement accepted at the time of data download.
        </copyright>
        <software version="4.0.10" date="2018-05-02">
          Nesstar Publisher
        </software>
        <fundAg abbr="BMGF" role="Current Funder">
          <![CDATA[Bill & Melinda Gates Foundation, Seattle, WA  ]]>
        </fundAg>
        <fundAg abbr="SAPRIN" role="Current Funder">
          South African Population Research Infrastructure Network, South Africa
        </fundAg>
        <fundAg abbr="Wellcome" role="Previous Funder">
          Wellcome Trust, UK
        </fundAg>
      </prodStmt>
      <distStmt>
        <contact affiliation="Agincourt" URI="http://data.agincourt.ac.za/" email="chodziwadziwa.kabudula@wits.ac.za">
          Chodziwadziwa Kabudula
        </contact>
      </distStmt>
      <serStmt>
        <serName>
          Demographic Surveillance
        </serName>
        <serInfo>
          <![CDATA[This dataset contains  demographic surveillance data covering the period from 1 Jan 2015 to 31 December 2021.]]>
        </serInfo>
      </serStmt>
      <verStmt>
        <version date="2023-06-01">
          v1: Dataset for public distribution.
        </version>
        <notes>
          <![CDATA[v1:  Dataset for public distribution.]]>
        </notes>
      </verStmt>
      <notes>
        
      </notes>
    </citation>
    <stdyInfo>
      <subject>
        <keyword>
          Episodes, Mortality, Migration
        </keyword>
        <topcClas>
          Episodes, Mortality, Migration
        </topcClas>
      </subject>
      <abstract>
        <![CDATA[Following the declaration of COVID-19 as a pandemic by the World Health Organization, there have been high levels of reported deaths, at least in countries with functioning civil registration and vital statistics (CRVS). These largely under-represent the true mortality due to COVID-19. A fundamental question, then, is what is the impact of COVID-19 on mortality and the scale of excess deaths, and the population sub-groups most affected, particularly in low- and middle-income settings? Constructing a true representation of COVID-19 deaths can be useful for social policies and future pandemic preparedness planning. The goal of this initiative is to characterise all-cause mortality rates and trends, by age and sex, across a range of rural and urban sub-Saharan African and South Asian settings under continuous health and demographic surveillance. 

This a multinational initiative bringing together 17 sites/centres from Africa and South Asia. This dataset represents a snapshot of the continually evolving data in the underlying longitudinal databases maintained by the nodes.]]>
      </abstract>
      <sumDscr>
        <timePrd date="2015-01-01" event="start" cycle="Agincourt"/>
        <timePrd date="2021-12-31" event="end" cycle="Agincourt"/>
        <collDate date="2015-01-01" event="start" cycle="Agincourt"/>
        <collDate date="2021-12-31" event="end" cycle="Agincourt"/>
        <nation abbr="RSA">
          South Africa
        </nation>
        <geogCover>
          The MRC/Wits University Agincourt HDSS in Bushbuckridge District, Mpumalanga, which has collected data since 1993. The nodal website is: http://www.agincourt.co.za. The Agincourt HDSS covers a surveillance area of approximately 420 square kilometres and is located in the Bushbuckridge District, Mpumalanga in the rural northeast of South Africa close to the Mozambique border. At baseline in 1992, 57 600 people were recorded in 8900 households in 20 villages; by 2006, the population had increased to about 70 000 people in 11 700 households. As of December 2017, there were 113 113 people under surveillance of whom 28% were not resident within the surveillance area, with a total of about 2m person years of observation. 33% of the population is under 15 years old. The population is almost exclusively Shangaan-speaking.The Agincourt HDSS has population density of over 200 persons per square kilometre. The Agincourt HDSS extends between latitudes 24° 50´ and 24° 56´S and longitudes 31°08´ and 31°´ 25´ E. The altitude is about 400-600m above sea level.
        </geogCover>
        <anlyUnit>
          Exposure Episodes
        </anlyUnit>
        <universe>
          Households resident in dwellings within the study area will be eligible for inclusion in the surveillance. All individuals identified by the household proxy informant as a member of the household will be enumerated. A resident household member is an individual that intends to sleep the majority of time at the dwelling occupied by the household over a four-month period. Households will include resident and non-resident members. An individual is a non-resident member if they have close ties to the household, but do not physically reside with the household most of the time. They can also be called temporary migrants and they are enumerated within the household list. Because household membership is not tied to physical residency, an individual may be a member of more than one household.
        </universe>
        <dataKind>
          Event history data
        </dataKind>
      </sumDscr>
      <notes>
        <![CDATA[Each record in the dataset represents a period of observation for an individual during which all the recorded characteristics of the individual stay constant. For example, on the birthday of the individual a new episode will start,  because the age of the individual has changed. An out-migration will result in a new episode, because the location or residential status has changed. Any change in one of the status values, such as education or marital status, will likewise result in a new episode on the date of the change.]]>
      </notes>
    </stdyInfo>
    <method>
      <dataColl>
        <timeMeth>
          2015-2021
        </timeMeth>
        <sampProc>
          This dataset is not based on a sample but contains information from the complete demographic surveillance areas.
        </sampProc>
        <resInstru>
          The data on this Repository is not the result of a single questionnaire but is a result of harmonised data from three different sites longitudinally collected over more than twenty years using different questionnaires that varied over time and site.
        </resInstru>
        <sources/>
        <collSitu>
          <![CDATA[In all the HDSS nodes, data are collected from a household proxy respondent, preferably the head of household or any next available senior adult resident household member, after informed consent was obtained by trained fieldworkers. Respondents are informed of the purpose and confidentiality of the interview, their right to refuse participation or withdraw from the study, and that scientists would be given access to anonymised data to analyse and publish information. Informed consent was verbal in all HDSS nodes until 2016. Written informed consent started in 2017 in AHRI, and 2018 in DIMAMO and 2019 in Agincourt. Until 2016 for Agincourt and AHRI, and 2017 for DIMAMO, data collection was field-based 'paper and pen' personal interviews (PAPI), before changing to field-based computer-assisted personal interviews (CAPI). Since 2019, all SAPRIN HDSS nodes collect data in 3 annual rounds over a 45-week data collection schedule; one field-based CAPI round, sandwiched on either side by a Call-Centre-based computer assisted telephonic interview (CATI), to create 3 data points at an interval of approximately 4 months in each calendar year.  In the past HDSS nodes had different data collection frequencies. AHRI data collection was 2 PAPI rounds per year from inception to 2011, changing to 3 PAPI rounds per year between 2012 and 2016, before becoming 1 PAPI round and 2 CATI rounds from 2017. Agincourt and DIMAMO have been collecting data once annually in a census-type format, over 4-5-month period until 2018.]]>
        </collSitu>
        <cleanOps>
          <![CDATA[The first step in the data preparation process is quality assurance. The SAPRIN Management hub team assess the data submitted to ensure it is in the correct format and falls within expected value ranges. Other potential issues checked include: missing data, incorrect data types, unexpected duplicate or orphan records. The SAPRIN Management hub assess this conversion by running both original operational database and the SAPRIN database created from the operational database through the iSHARE data quality assessment and indicator process. The data quality checking process is conducted using Pentaho Data Integration (PDI). PDI provides the Extract, Transform, and Load (ETL) capabilities that facilitates the process of capturing, cleansing, and storing data using a uniform and consistent format that is accessible and relevant to end users. The principle of the data quality checks is that if the data conversion conducted by the nodes was complete and accurate, there should be little or no difference in the data quality and demographic indicators between the base and SAPRIN versions of the nodal data. If the data submitted by the nodes meets the criteria for inclusion into the consolidated dataset the data moves to the second step of the data production process. However, if the data fail the inclusion checks, this could then lead to another iteration of data submission and quality control checks until SAPRIN Management hub is satisfied that they have high quality data.To produce this final standard dataset, the  data is processed using PDI  on the Centre for High Performance Computing cluster .]]>
        </cleanOps>
      </dataColl>
      <anlyInfo>
        <EstSmpErr>
          Not Applicable
        </EstSmpErr>
      </anlyInfo>
    </method>
    <dataAccs>
      <setAvail>
        <accsPlac/>
      </setAvail>
      <useStmt>
        <contact affiliation="Agincourt" URI="http://data.agincourt.ac.za/" email="datamanager@agincourt.co.za">
          Data Manager
        </contact>
        <citReq>
          
        </citReq>
        <conditions>
          <![CDATA[This data is made available for access under the following conditions:
1)The data and other materials provided will not be redistributed or sold to other individuals, institutions, or organizations without the written agreement of nodes.
2)The data will be used for statistical and scientific research purposes only. They will be used solely for reporting of aggregated information, and not for investigation of specific individuals or organisations. The Data User will neither use nor permit    others to use the data in any way other than listed in the original application (Analysis Plan) for access to the dataset.
3)No attempt will be made to re-identify respondents, and no use will be made of the identity of any person or establishment discovered inadvertently. Any such discovery should immediately be reported to respective nodes.
4)No attempt will be made to produce links among datasets provided, or among data from nodes and other datasets that could identify individuals or organizations.
5)The Data User will ensure that the data are kept in a secured environment and that only authorized users have access to the data.
6)Any books, articles, conference papers, theses, dissertations, reports, or other publications that employ this data will cite the source of data in accordance with the Citation Requirement provided with each dataset.
7)An electronic copy of all reports and publications based on the requested data will be sent to nodes.
8)The original collector of the data, and relevant funding agencies bear no responsibility for use of the data or for interpretations or inferences based upon such uses.
9) Once the data set has served its indicated purpose it must be destroyed. If the dataset needs to be lodged for publication purposes, a reference (a digital object identifier will be maintained for this purpose) to the original dataset on the Agincourt/other nodal data repository should be used. Derived or aggregated datasets produced from the original dataset do not fall within this provision and may be lodged as publication datasets. If the same dataset is needed for a different purpose, the dataset should be re-requested and the new purposes indicated.]]>
        </conditions>
        <disclaimer>
          The user of the data acknowledges that the original collector of the data and the relevant funding agencies bear no responsibility for the data's use or interpretation or inferences based upon it.
        </disclaimer>
      </useStmt>
    </dataAccs>
  </stdyDscr>
  <fileDscr ID="F5" URI="ZA011_RawCensoredEpisode.Nesstar?Index=0&amp;Name=ZA011_RawCensoredEpisodes">
    <fileTxt>
      <fileName>
        ZA011_RawCensoredEpisodes.NSDstat
      </fileName>
      <dimensns>
        <caseQnty>
          172081
        </caseQnty>
        <varQnty>
          13
        </varQnty>
      </dimensns>
      <fileType>
        Nesstar 200801
      </fileType>
    </fileTxt>
  </fileDscr>
  <dataDscr>
    <var ID="V132" name="recnr" files="F5" dcml="0" intrvl="contin">
      <location width="12"/>
      <labl>
        RecNr
      </labl>
      <valrng>
        <range min="1" max="172081"/>
      </valrng>
      <sumStat type="vald">
        172081
      </sumStat>
      <sumStat type="invd">
        0
      </sumStat>
      <sumStat type="min">
        1
      </sumStat>
      <sumStat type="max">
        172081
      </sumStat>
      <sumStat type="mean">
        86041
      </sumStat>
      <sumStat type="stdev">
        49675.65
      </sumStat>
      <varFormat type="numeric" schema="other"/>
    </var>
    <var ID="V133" name="countryid" files="F5" dcml="0" intrvl="discrete">
      <location width="8"/>
      <labl>
        CountryId
      </labl>
      <valrng>
        <range min="710" max="710"/>
      </valrng>
      <sumStat type="vald">
        172081
      </sumStat>
      <sumStat type="invd">
        0
      </sumStat>
      <catgry>
        <catValu>
          710
        </catValu>
        <catStat type="freq">
          172081
        </catStat>
      </catgry>
      <varFormat type="numeric" schema="other"/>
    </var>
    <var ID="V134" name="centreid" files="F5" intrvl="discrete">
      <location width="5"/>
      <labl>
        CentreId
      </labl>
      <sumStat type="vald">
        172081
      </sumStat>
      <sumStat type="invd">
        0
      </sumStat>
      <catgry>
        <catValu>
          ZA011
        </catValu>
        <catStat type="freq">
          172081
        </catStat>
      </catgry>
      <varFormat type="character" schema="other"/>
    </var>
    <var ID="V135" name="individualid" files="F5" intrvl="discrete">
      <location width="5"/>
      <labl>
        IndividualId
      </labl>
      <sumStat type="vald">
        172081
      </sumStat>
      <sumStat type="invd">
        0
      </sumStat>
      <varFormat type="character" schema="other"/>
    </var>
    <var ID="V136" name="sex" files="F5" dcml="0" intrvl="discrete">
      <location width="8"/>
      <labl>
        Sex
      </labl>
      <valrng>
        <range min="1" max="3"/>
      </valrng>
      <sumStat type="vald">
        172081
      </sumStat>
      <sumStat type="invd">
        0
      </sumStat>
      <catgry>
        <catValu>
          1
        </catValu>
        <catStat type="freq">
          80093
        </catStat>
      </catgry>
      <catgry>
        <catValu>
          2
        </catValu>
        <catStat type="freq">
          91985
        </catStat>
      </catgry>
      <catgry>
        <catValu>
          3
        </catValu>
        <catStat type="freq">
          3
        </catStat>
      </catgry>
      <varFormat type="numeric" schema="other"/>
    </var>
    <var ID="V137" name="dob" files="F5" intrvl="discrete">
      <location width="11"/>
      <labl>
        DoB
      </labl>
      <sumStat type="vald">
        172081
      </sumStat>
      <sumStat type="min">
        1900-01-29
      </sumStat>
      <sumStat type="max">
        2023-01-14
      </sumStat>
      <varFormat type="character" formatname="Nesstar.date" schema="other" category="date"/>
    </var>
    <var ID="V138" name="episode" files="F5" dcml="0" intrvl="discrete">
      <location width="8"/>
      <labl>
        Episode
      </labl>
      <valrng>
        <range min="1" max="2"/>
      </valrng>
      <sumStat type="vald">
        172081
      </sumStat>
      <sumStat type="invd">
        0
      </sumStat>
      <catgry>
        <catValu>
          1
        </catValu>
        <catStat type="freq">
          172070
        </catStat>
      </catgry>
      <catgry>
        <catValu>
          2
        </catValu>
        <catStat type="freq">
          11
        </catStat>
      </catgry>
      <varFormat type="numeric" schema="other"/>
    </var>
    <var ID="V139" name="episodes" files="F5" dcml="0" intrvl="discrete">
      <location width="8"/>
      <labl>
        Episodes
      </labl>
      <valrng>
        <range min="1" max="2"/>
      </valrng>
      <sumStat type="vald">
        172081
      </sumStat>
      <sumStat type="invd">
        0
      </sumStat>
      <catgry>
        <catValu>
          1
        </catValu>
        <catStat type="freq">
          172059
        </catStat>
      </catgry>
      <catgry>
        <catValu>
          2
        </catValu>
        <catStat type="freq">
          22
        </catStat>
      </catgry>
      <varFormat type="numeric" schema="other"/>
    </var>
    <var ID="V140" name="startevent" files="F5" intrvl="discrete">
      <location width="3"/>
      <labl>
        StartEvent
      </labl>
      <sumStat type="vald">
        172081
      </sumStat>
      <sumStat type="invd">
        0
      </sumStat>
      <catgry>
        <catValu>
          BTH
        </catValu>
        <catStat type="freq">
          44080
        </catStat>
      </catgry>
      <catgry>
        <catValu>
          ENT
        </catValu>
        <catStat type="freq">
          61253
        </catStat>
      </catgry>
      <catgry>
        <catValu>
          ENU
        </catValu>
        <catStat type="freq">
          37004
        </catStat>
      </catgry>
      <catgry>
        <catValu>
          IMG
        </catValu>
        <catStat type="freq">
          29744
        </catStat>
      </catgry>
      <varFormat type="character" schema="other"/>
    </var>
    <var ID="V141" name="startdate" files="F5" intrvl="discrete">
      <location width="11"/>
      <labl>
        Start Date
      </labl>
      <sumStat type="vald">
        172081
      </sumStat>
      <sumStat type="min">
        2015-01-01
      </sumStat>
      <sumStat type="max">
        2022-12-31
      </sumStat>
      <varFormat type="character" formatname="Nesstar.date" schema="other" category="date"/>
    </var>
    <var ID="V142" name="endevent" files="F5" intrvl="discrete">
      <location width="3"/>
      <labl>
        EndEvent
      </labl>
      <sumStat type="vald">
        172081
      </sumStat>
      <sumStat type="invd">
        0
      </sumStat>
      <catgry>
        <catValu>
          BTH
        </catValu>
        <catStat type="freq">
          11
        </catStat>
      </catgry>
      <catgry>
        <catValu>
          DTH
        </catValu>
        <catStat type="freq">
          6548
        </catStat>
      </catgry>
      <catgry>
        <catValu>
          ENT
        </catValu>
        <catStat type="freq">
          1
        </catStat>
      </catgry>
      <catgry>
        <catValu>
          EXT
        </catValu>
        <catStat type="freq">
          25159
        </catStat>
      </catgry>
      <catgry>
        <catValu>
          IMG
        </catValu>
        <catStat type="freq">
          13
        </catStat>
      </catgry>
      <catgry>
        <catValu>
          OBS
        </catValu>
        <catStat type="freq">
          117686
        </catStat>
      </catgry>
      <catgry>
        <catValu>
          OMG
        </catValu>
        <catStat type="freq">
          22663
        </catStat>
      </catgry>
      <varFormat type="character" schema="other"/>
    </var>
    <var ID="V143" name="enddate" files="F5" intrvl="discrete">
      <location width="11"/>
      <labl>
        End Date
      </labl>
      <sumStat type="vald">
        172081
      </sumStat>
      <sumStat type="min">
        2015-01-01
      </sumStat>
      <sumStat type="max">
        2022-12-31
      </sumStat>
      <varFormat type="character" formatname="Nesstar.date" schema="other" category="date"/>
    </var>
    <var ID="V144" name="days" files="F5" dcml="0" intrvl="contin">
      <location width="8"/>
      <labl>
        Days
      </labl>
      <valrng>
        <range min="1" max="2922"/>
      </valrng>
      <sumStat type="vald">
        172081
      </sumStat>
      <sumStat type="invd">
        0
      </sumStat>
      <sumStat type="min">
        1
      </sumStat>
      <sumStat type="max">
        2922
      </sumStat>
      <sumStat type="mean">
        1961.128
      </sumStat>
      <sumStat type="stdev">
        1015.387
      </sumStat>
      <varFormat type="numeric" schema="other"/>
    </var>
  </dataDscr>
</codeBook>
