log using paradata.log, replace

/* ----------------------------------------------------------------------------
   The National Health Interview Survey (NHIS) 2021; Paradata data file

   This program loads the NHIS paradata ASCII data file downloaded from the
   NCHS website (https://www.cdc.gov/nchs/nhis/index.htm) into a Stata
   dataset. It reads the fixed-width columns with infix, attaches descriptive
   variable labels, defines value labels with meaningful category names,
   associates them with the numeric variables, and saves the result as
   paradata.dta.

   BEFORE RUNNING THIS PROGRAM, PLEASE:
     - Create a folder called C:\NHIS2021 (on a machine running Windows)
     - Download the paradata ASCII file (paradata21.dat) to the folder
       C:\NHIS2021 (on a machine running Windows)

   Running this program will replace the log file and the dataset, if present.

   NOTE: the log is opened BEFORE the cd command below, so paradata.log is
   written to whatever directory Stata is in when the program starts, while
   paradata.dta is written to c:\nhis2021.
---------------------------------------------------------------------------- */

cd c:\nhis2021

version 6.0

* The following command temporarily changes the command-ending
* delimiter from a carriage return to a semicolon
#delimit ;

clear;
set mem 200m;

* INPUT ALL VARIABLES;
* Column ranges are 1-based positions in each fixed-width record.
  Variables prefixed with str are read as strings and therefore
  receive no value labels further down;

infix
    /* FRT LOCATIONS */
    typeabc            1 -   1
    typea              2 -   2
    typebobs           3 -   3

    /* IDN LOCATIONS */
    rectype            4 -   5
    srvy_yr            6 -   9
    str hhx           10 -  16
    outcome1          17 -  19

    /* UCF LOCATIONS */
    region            20 -  20
    pstrat            21 -  23
    ppsu              24 -  26

    /* CHI LOCATIONS */
    totcount          27 -  28
    mode_p            29 -  30
    mode_t            31 -  32
    ctstat1           33 -  34
    ctstat2           35 -  36
    ctstat3           37 -  38
    unable1r          39 -  39
    unable2r          40 -  40
    unable3r          41 -  41
    unable4r          42 -  42
    unable5r          43 -  43
    unabl99r          44 -  44
    lang1r            45 -  45
    lang2r            46 -  46
    lang3r            47 -  47
    lang4r            48 -  48
    lang5r            49 -  49
    nctp01r           50 -  50
    nctpr03r          51 -  51
    nctpr04r          52 -  52
    nctp05r           53 -  53
    nctpr07r          54 -  54
    nctpr08r          55 -  55
    nctpr09r          56 -  56
    nctpr10r          57 -  57
    nctpr11r          58 -  58
    nctp12r           59 -  59
    nctpr99r          60 -  60
    nctl01r           61 -  61
    nctl02r           62 -  62
    nctel03r          63 -  63
    nctel04r          64 -  64
    nctel05r          65 -  65
    nctl06r           66 -  66
    nctl07r           67 -  67
    nctel99r          68 -  68
    relc01r           69 -  69
    reluc02r          70 -  70
    reluc03r          71 -  71
    reluc05r          72 -  72
    reluc06r          73 -  73
    reluc07r          74 -  74
    relc08r           75 -  75
    relc09r           76 -  76
    reluc11r          77 -  77
    reluc12r          78 -  78
    relc15r           79 -  79
    reluc98r          80 -  80
    reluc99r          81 -  81
    strat01r          82 -  82
    strat02r          83 -  83
    strat03r          84 -  84
    strat04r          85 -  85
    strat05r          86 -  86
    strat06r          87 -  87
    strt11r           88 -  88
    strat12r          89 -  89
    strat13r          90 -  90
    strt14r           91 -  91
    strat98r          92 -  92
    strat99r          93 -  93
    reassign          94 -  94
    sa_tod            95 -  95
    sastrpnt          96 -  96
    sc_tod            97 -  97
    scstrpnt          98 -  98

    /* FLG LOCATIONS */
    str onefam_flg    99 -  99
    quality_sa       100 - 100
    quality_sc       101 - 101
    str sarespsc_flg 102 - 102

    /* GEN LOCATIONS */
    intv_qrt         103 - 103
    intv_mon         104 - 105
    hh_pclass        106 - 106
    ad_pclass        107 - 107
    /* The weight is read as double: infix defaults to float, which keeps
       only about 7 significant digits and could round an 8-column weight.
       NOTE(review): assumes the field can carry more than 7 significant
       digits -- confirm against the paradata codebook. */
    double wtia_pd   108 - 115

    /* HHC LOCATIONS */
    endpnt           116 - 116
    strtpnt          117 - 117
    hhc_tod          118 - 118

    /* TEL LOCATIONS */
    telcurwrk_a      119 - 119
    telcel_a         120 - 120
    phonelive_a      121 - 121
    phoneuse_a       122 - 122

    /* LNK LOCATIONS */
    rlink_a          123 - 123

    /* TEL LOCATIONS */
    telcurwrk_c      124 - 124
    phonelive_c      125 - 125

    /* LNK LOCATIONS */
    rlink_c          126 - 126

    /* BCK LOCATIONS */
    intlangsa        127 - 127
    intrptsa         128 - 128
    otherssa         129 - 129
    intlangsc        130 - 130
    otherssc         131 - 131
    intmodesa        132 - 132
    intmodewhysa     133 - 134
    intmodesc        135 - 135
    intmodewhysc     136 - 137
    parwhy           138 - 138
    brkreason        139 - 140
    str brkhhc       141 - 141
    str brksa        142 - 142
    str brksc        143 - 143
    str ncomhhc      144 - 144
    str ncomsa       145 - 145
    str ncomsc       146 - 146
    location01       147 - 147
    location02       148 - 148
    location03       149 - 149
    location04       150 - 150
    location05       151 - 151
    location06       152 - 152
    location07       153 - 153
    location08       154 - 154
    location09       155 - 155

using paradata21.dat;

* DEFINE VARIABLE LABELS;

* FRT VARIABLE LABELS;
label variable typeabc "Type of noninterview";
label variable typea "Reason for Type A";
label variable typebobs "Type B by observation";

* IDN VARIABLE LABELS;
label variable rectype "Record type";
label variable srvy_yr "Year of the National Health Interview Survey";
label variable hhx "Randomly assigned household number unique to a household";
label variable outcome1 "Outcome code--restricted to 201, 203, Type A, select Type B codes";

* UCF VARIABLE LABELS;
label variable region "Household region";
label variable pstrat "Pseudo-stratum for public-use file variance estimation";
label variable ppsu "Pseudo-PSU for public-use file variance estimation";

* CHI VARIABLE LABELS;
label variable totcount "Total count of CHI records for this case";
label variable mode_p "Number of personal visit attempts for this case";
label variable mode_t "Number of telephone attempts for this case";
label variable ctstat1 "Number of contacts with sample unit members";
label variable ctstat2 "Number of contacts with non-sample unit members";
label variable ctstat3 "Number of noncontacts";
label variable unable1r "Number of times 'Eligible person not available' was entered";
label variable unable2r "Number of times 'Inconvenient time' was entered";
label variable unable3r "Number of times 'Respondent is reluctant' was entered";
label variable unable4r "Number of times 'Language problem--specify' was entered";
label variable unable5r "Number of times 'Health problem' was entered";
label variable unabl99r "Number of times 'Other--specify' was entered";
label variable lang1r "Number of times 'Specify language or dialect' was entered";
label variable lang2r "Number of times 'No household member able to translate' was entered";
label variable lang3r "Number of times 'Contact RO about language problem' was entered";
label variable lang4r "Number of times 'Unable to find translator' was entered";
label variable lang5r "Number of times 'No time left to find translator' was entered";
label variable nctp01r "Number of times 'No one home/No eligible person home' was entered";
label variable nctpr03r "Number of times 'No one home--previous note/letter taken' was entered";
label variable nctpr04r "Number of times 'Household does not answer door--someone is home' entered";
label variable nctp05r "Number of times 'Observed HH from vehicle' was entered";
label variable nctpr07r "Number of times 'Unable to reach/locked gate/buzzer entry' was entered";
label variable nctpr08r "Number of times 'Address does not exist/unable to locate' was entered";
label variable nctpr09r "Number of times 'On vacation, away from home/at second home' was entered";
label variable nctpr10r "Number of times 'Spoke with neighbor' was entered";
label variable nctpr11r "Number of times 'Building management/doorman contact' was entered";
label variable nctp12r "Number of times 'Completed case (Type B or C or Vacant interview)' entered";
label variable nctpr99r "Number of times 'Other--specify' was entered";
label variable nctl01r "Number of times 'Got answering machine' was entered";
label variable nctl02r "Number of times 'Ring, no answer' was entered";
label variable nctel03r "Number of times 'Busy signal' was entered";
label variable nctel04r "Number of times 'Disconnected' was entered";
label variable nctel05r "Number of times 'Wrong number' was entered";
label variable nctl06r "Number of times 'Spoke with ineligible person' was entered";
label variable nctl07r "Number of times 'Respondent left message' was entered";
label variable nctel99r "Number of times 'Other-specify' was entered";
label variable relc01r "Number of times 'Not interested' was entered";
label variable reluc02r "Number of times 'Too busy' was entered";
label variable reluc03r "Number of times 'Interview takes too much time' was entered";
label variable reluc05r "Number of times 'Scheduling difficulties' was entered";
label variable reluc06r "Number of times 'Survey is voluntary' was entered";
label variable reluc07r "Number of times 'Privacy concerns' was entered";
label variable relc08r "Number of times 'Local/State/Fed. Govt. concerns' was entered";
label variable relc09r "Number of times 'Asks questions about the survey' was entered";
label variable reluc11r "Number of times 'Hang-up/slams door on FR' was entered";
label variable reluc12r "Number of times 'Hostile or threatens FR' was entered";
label variable relc15r "Number of times 'Family Issues (death, illness, etc.)' entered";
label variable reluc98r "Number of times 'No concerns' was entered";
label variable reluc99r "Number of times 'Other-specify' was entered";
label variable strat01r "Number of times 'Advance letter given' was entered";
label variable strat02r "Number of times 'Scheduled appointment' was entered";
label variable strat03r "Number of times 'Left note/appointment card' was entered";
label variable strat04r "Number of times 'Left promotional packet/informational brochure' was entered";
label variable strat05r "Number of times 'Called household' was entered";
label variable strat06r "Number of times 'Left message on answering machine' was entered";
label variable strt11r "Number of times 'Waited for respondent' was entered";
label variable strat12r "Number of times 'Checked with neighbors' was entered";
label variable strat13r "Number of times 'Contacted other family members' was entered";
label variable strt14r "Number of times 'Contacted property manager/doorman' was entered";
label variable strat98r "Number of times 'No strategies' was entered";
label variable strat99r "Number of times 'Other--specify' was entered";
label variable reassign "Case reassignment to another interviewer (FR)";
label variable sa_tod "Time of day that the Sample Adult section was started";
label variable sastrpnt "Point in the interview period when the Sample Adult section was started";
label variable sc_tod "Time of day that the Sample Child section was started";
label variable scstrpnt "Point in the interview period when the Sample Child section was started";

* FLG VARIABLE LABELS;
label variable onefam_flg "All people in the household are in the same family";
label variable quality_sa "SA overall flag indicating the record is being removed for a quality reason";
label variable quality_sc "SC overall flag indicating the record is being removed for a quality reason";
label variable sarespsc_flg "Sample Adult is Sample Child respondent";

* GEN VARIABLE LABELS;
label variable intv_qrt "Interview quarter";
label variable intv_mon "Interview month";
label variable hh_pclass "Household phone classification";
label variable ad_pclass "Adult phone classification";
label variable wtia_pd "Paradata file weight";

* HHC VARIABLE LABELS;
label variable endpnt "Point in the interview period when the case was finished";
label variable strtpnt "Point in the interview period when the Household Composition section was started";
label variable hhc_tod "Time of day that the Household Composition section was started";

* TEL VARIABLE LABELS;
label variable telcurwrk_a "House has non-cell phone";
label variable telcel_a "Cell phone";
label variable phonelive_a "Cell phone in HH";
label variable phoneuse_a "Calls answered";

* LNK VARIABLE LABELS;
label variable rlink_a "Link without SSN/Medicare Numbers";

* TEL VARIABLE LABELS;
label variable telcurwrk_c "Landline phone";
label variable phonelive_c "Working cell phone";

* LNK VARIABLE LABELS;
label variable rlink_c "Link without SSN";

* BCK VARIABLE LABELS;
label variable intlangsa "Language of SA Interview";
label variable intrptsa "Interpreter used in Adult interview";
label variable otherssa "Other people present during Sample Adult interview";
label variable intlangsc "Language of SC Interview";
label variable otherssc "Other people present during Sample Child interview";
label variable intmodesa "Sample Adult section primarily conducted by phone";
label variable intmodewhysa "Main reason primarily conducted by phone";
label variable intmodesc "Sample Child section primarily conducted by phone";
label variable intmodewhysc "Main reason primarily conducted by phone";
label variable parwhy "Reason interview not complete";
label variable brkreason "Main reason respondent terminated interview";
label variable brkhhc "Break off in household section";
label variable brksa "Break off in Sample Adult section";
label variable brksc "Break off in Sample Child section";
label variable ncomhhc "Household section not complete";
label variable ncomsa "Sample Adult section not complete";
label variable ncomsc "Sample child section not complete";
label variable location01 "Location of interview - Inside respondent's home";
label variable location02 "Location of interview - Immediately outside respondent's home";
label variable location03 "Location of interview - Over the telephone";
label variable location04 "Location of interview - Inside interviewer's/respondent's car";
label variable location05 "Location of interview - At respondent's place of work";
label variable location06 "Location of interview - Common area of apartment";
label variable location07 "Location of interview - Public area";
label variable location08 "Location of interview - In a home of a neighbor, friend, or relative";
label variable location09 "Location of interview - Other location";

* DEFINE VALUE LABELS FOR REPORTS;

label define PD001X
    1 "Early"
    2 "Middle"
    3 "Late"
;

label define PD002X
    01 "January"
    02 "February"
    03 "March"
    04 "April"
    05 "May"
    06 "June"
    07 "July"
    08 "August"
    09 "September"
    10 "October"
    11 "November"
    12 "December"
;

label define PD003X
    1 "Quarter 1"
    2 "Quarter 2"
    3 "Quarter 3"
    4 "Quarter 4"
;

label define PD004X
    201 "Completed interview"
    203 "Sufficient partial interview, no follow-up"
    213 "Language problem"
    215 "Insufficient partial"
    216 "No one home, repeated calls"
    217 "Temporarily absent, no follow-up"
    218 "Refused"
    219 "Other Type A"
    299 "Occupied entirely by Armed Forces or persons residing elsewhere"
;

label define PD005X
    1 "Wireless only"
    2 "Wireless mostly"
    3 "Dual users"
    4 "Landline mostly"
    5 "Landline only"
    6 "Phoneless"
    7 "Unknown"
;

label define PD006X
    1 "Landline(LL) with cell phone(CP)"
    2 "LL without CP"
    3 "LL with unknown CP"
    4 "No LL with unknown CP"
    5 "CP only"
    6 "Phoneless"
    7 "Unknown LL with CP"
    8 "Unknown LL without CP"
;

label define PD007X
    0 "Case not reassigned"
    1 "Case reassigned"
;

label define PD008X
    10 "Sample Adult"
    20 "Sample Child"
    30 "Sample Adult Income"
    40 "Sample Child Income"
    50 "Paradata"
;

label define PD009X
    1 "Northeast"
    2 "Midwest"
    3 "South"
    4 "West"
;

label define PD010X
    1 "Morning"
    2 "Afternoon"
    3 "Evening"
;

label define PD011X
    0 "None"
    1 "One or more times"
;

label define PD012X
    0 "No"
    1 "Yes"
;

label define PD013X
    01 "Respondent does not want to participate"
    02 "Respondent not interested"
    03 "Respondent too busy"
    04 "Respondent has privacy concerns or anti-government"
    05 "Respondent or family member is physically or mentally ill"
    06 "Unable to reach respondent before closeout"
    07 "Case Duplication/reassignment/stopped by RO direction"
    08 "Respondent temporarily away or moved"
    09 "FR has safety concerns"
    10 "Language problems"
    11 "Technology issue (computer error, battery died, telephone lost signal)"
    12 "Respondent (including Proxy) did not know answers"
    13 "Other"
;

label define PD014X
    1 "English"
    2 "Spanish"
    3 "Both English and Spanish"
    4 "Other"
    8 "Not Ascertained"
;

label define PD015X
    1 "All"
    2 "Some"
    3 "None"
    8 "Not Ascertained"
;

label define PD016X
    01 "Best method for respondent to complete interview"
    02 "Respondent requested phone interview"
    03 "Respondent/FR called and respondent wanted to complete interview immediately"
    04 "Pets or small children or guests in home"
    05 "Respondent or family member is physically or mentally ill"
    06 "Inclement weather"
    07 "Near closeout"
    08 "Distance"
    09 "FR has safety concerns"
    10 "Other"
    88 "Not Ascertained"
;

label define PD017X
    1 "Mentioned"
    2 "Not mentioned"
    8 "Not Ascertained"
;

label define PD018X
    1 "Someone else present for full interview"
    2 "Someone else present for part of the interview"
    3 "No one else present for any of the interview"
;

label define PD019X
    1 "Interview stopped in progress/Break-off"
    2 "Completion before closeout not possible (Other than Break-off)"
    8 "Not Ascertained"
;

label define PD020X
    1 "All or almost all calls on cell phone"
    2 "Some on cell phone and some on home phone"
    3 "Very few or none on cell phone"
    7 "Refused"
    8 "Not Ascertained"
    9 "Don't Know"
;

label define PD021X
    1 "Refused"
    2 "No one home, repeated calls"
    3 "Temporarily absent"
    4 "Language problem"
    5 "Other"
    8 "Not Ascertained"
;

label define PD022X
    1 "Type A"
    2 "Type B"
    3 "Type C"
;

label define PD023X
    1 "Yes"
    2 "No"
    8 "Not Ascertained"
;

label define PD024X
    1 "Yes"
    2 "No"
    7 "Refused"
    8 "Not Ascertained"
    9 "Don't Know"
;

* ASSOCIATE VARIABLES WITH VALUE LABEL DEFINITIONS;

* FRT VALUE LABEL ASSOCIATIONS;
label values typeabc PD022X;
label values typea PD021X;
label values typebobs PD024X;

* IDN VALUE LABEL ASSOCIATIONS;
label values rectype PD008X;
label values outcome1 PD004X;

* UCF VALUE LABEL ASSOCIATIONS;
label values region PD009X;

* CHI VALUE LABEL ASSOCIATIONS;
label values unable1r PD011X;
label values unable2r PD011X;
label values unable3r PD011X;
label values unable4r PD011X;
label values unable5r PD011X;
label values unabl99r PD011X;
label values lang1r PD011X;
label values lang2r PD011X;
label values lang3r PD011X;
label values lang4r PD011X;
label values lang5r PD011X;
label values nctp01r PD011X;
label values nctpr03r PD011X;
label values nctpr04r PD011X;
label values nctp05r PD011X;
label values nctpr07r PD011X;
label values nctpr08r PD011X;
label values nctpr09r PD011X;
label values nctpr10r PD011X;
label values nctpr11r PD011X;
label values nctp12r PD011X;
label values nctpr99r PD011X;
label values nctl01r PD011X;
label values nctl02r PD011X;
label values nctel03r PD011X;
label values nctel04r PD011X;
label values nctel05r PD011X;
label values nctl06r PD011X;
label values nctl07r PD011X;
label values nctel99r PD011X;
label values relc01r PD011X;
label values reluc02r PD011X;
label values reluc03r PD011X;
label values reluc05r PD011X;
label values reluc06r PD011X;
label values reluc07r PD011X;
label values relc08r PD011X;
label values relc09r PD011X;
label values reluc11r PD011X;
label values reluc12r PD011X;
label values relc15r PD011X;
label values reluc98r PD011X;
label values reluc99r PD011X;
label values strat01r PD011X;
label values strat02r PD011X;
label values strat03r PD011X;
label values strat04r PD011X;
label values strat05r PD011X;
label values strat06r PD011X;
label values strt11r PD011X;
label values strat12r PD011X;
label values strat13r PD011X;
label values strt14r PD011X;
label values strat98r PD011X;
label values strat99r PD011X;
label values reassign PD007X;
label values sa_tod PD010X;
label values sastrpnt PD001X;
label values sc_tod PD010X;
label values scstrpnt PD001X;

* FLG VALUE LABEL ASSOCIATIONS;
label values quality_sa PD012X;
label values quality_sc PD012X;

* GEN VALUE LABEL ASSOCIATIONS;
label values intv_qrt PD003X;
label values intv_mon PD002X;
label values hh_pclass PD006X;
label values ad_pclass PD005X;

* HHC VALUE LABEL ASSOCIATIONS;
label values endpnt PD001X;
label values strtpnt PD001X;
label values hhc_tod PD010X;

* TEL VALUE LABEL ASSOCIATIONS;
label values telcurwrk_a PD024X;
label values telcel_a PD024X;
label values phonelive_a PD024X;
label values phoneuse_a PD020X;

* LNK VALUE LABEL ASSOCIATIONS;
label values rlink_a PD024X;

* TEL VALUE LABEL ASSOCIATIONS;
label values telcurwrk_c PD024X;
label values phonelive_c PD024X;

* LNK VALUE LABEL ASSOCIATIONS;
label values rlink_c PD024X;

* BCK VALUE LABEL ASSOCIATIONS;
label values intlangsa PD014X;
label values intrptsa PD023X;
label values otherssa PD018X;
label values intlangsc PD014X;
label values otherssc PD018X;
label values intmodesa PD015X;
label values intmodewhysa PD016X;
label values intmodesc PD015X;
label values intmodewhysc PD016X;
label values parwhy PD019X;
label values brkreason PD013X;
label values location01 PD017X;
label values location02 PD017X;
label values location03 PD017X;
label values location04 PD017X;
label values location05 PD017X;
label values location06 PD017X;
label values location07 PD017X;
label values location08 PD017X;
label values location09 PD017X;

* DISPLAY OVERALL DESCRIPTION OF FILE;
describe;

* WRITE THE LABELLED DATASET TO DISK, replacing any existing paradata.dta.
  Without this step the data exist only in memory and are lost when the
  session ends;
save paradata, replace;

* Restore the carriage return as the command-ending delimiter;
#delimit cr

* data file is stored in paradata.dta
* log file is stored in paradata.log

log close