* Merging PSID Data: SPSS Example.
* Method 1.
*---------------------------------------------------------------------*
| This example program demonstrates a relatively simple method for |
| merging PSID data. It uses data from 3 different years, subsetting |
| criteria, and the compress option (to conserve disk space). |
*---------------------------------------------------------------------.
* Individual-level input: the 1990-1992 cross-year individual file.
* Only the columns required for the analysis are read from each record.
FILE HANDLE IND90_92
  /NAME="[PATH]\IND2007ER.txt"
  /LRECL=3118.
DATA LIST FILE=IND90_92 FIXED /
  ER30001    2-5
  ER30002    6-8
  ER30642 1528-1532
  ER30643 1533-1534
  ER30644 1535-1536
  ER30645 1537-1539
  ER30653 1555
  ER30657 1563-1564
  ER30659 1566-1571
  ER30689 1647-1650
  ER30690 1651-1652
  ER30691 1653-1654
  ER30692 1655-1657
  ER30699 1672
  ER30703 1680-1681
  ER30705 1683-1688
  ER30707 1690-1695
  ER30733 1764-1767
  ER30734 1768-1769
  ER30735 1770-1771
  ER30736 1772-1774
  ER30744 1790
  ER30748 1798-1799
  ER30750 1801-1806
  ER30752 1808-1813
  ER30805 1907-1913 (3)
  ER32000 2060
  ER32022 2113-2114
  ER32049 2189
  .
* Descriptive labels for the variables read from the individual file.
* ER30733 is labelled as the 1992 interview number, matching the other 92 items.
* It is the variable renamed to ID92 later in this script.
VARIABLE LABELS
  ER30001 "1968 INTERVIEW NUMBER 68"
  ER30002 "PERSON NUMBER 68"
  ER30642 "1990 INTERVIEW NUMBER"
  ER30643 "SEQUENCE NUMBER 90"
  ER30644 "RELATIONSHIP TO HEAD 90"
  ER30645 "AGE OF INDIVIDUAL 90"
  ER30653 "EMPLOYMENT STAT 90"
  ER30657 "COMPLETED EDUCATION 90"
  ER30659 "TOT TXBL INCOME 90"
  ER30689 "1991 INTERVIEW NUMBER"
  ER30690 "SEQUENCE NUMBER 91"
  ER30691 "RELATIONSHIP TO HEAD 91"
  ER30692 "AGE OF INDIVIDUAL 91"
  ER30699 "EMPLOYMENT STAT 91"
  ER30703 "COMPLETED EDUCATION 91"
  ER30705 "TOT LABOR INCOME 91"
  ER30707 "TOT ASSET INCOME 91"
  ER30733 "1992 INTERVIEW NUMBER"
  ER30734 "SEQUENCE NUMBER 92"
  ER30735 "RELATIONSHIP TO HEAD 92"
  ER30736 "AGE OF INDIVIDUAL 92"
  ER30744 "EMPLOYMENT STAT 92"
  ER30748 "COMPLETED EDUCATION 92"
  ER30750 "TOT LABOR INCOME 92"
  ER30752 "TOT ASSET INCOME 92"
  ER30805 "COMBINED IND WEIGHT 92"
  ER32000 "SEX OF INDIVIDUAL"
  ER32022 "# BIRTHS OF THIS IND"
  ER32049 "LAST KNOWN MARITAL STAT"
  .
* Declare user-missing codes for the age, education, births and marital-status items.
* Variables that share a code are listed together ahead of that code.
MISSING VALUES
  ER30645 ER30657 ER30692 ER30703 ER30736 ER30748 (99)
  /ER32022 (98)
  /ER32049 (8).
* Give each wave's interview number a short name that is used as a merge key.
RENAME VARIABLES (ER30642 ER30689 ER30733 = ID90 ID91 ID92).
* Keep individuals who were a head or a wife/"wife" in any wave from 1990 to 1992.
* Each wave is tested twice: sequence number 1 paired with relationship code 10.
* And sequence number 2 paired with relationship code 20 or 22.
SELECT IF
    (ER30643 = 1 & ER30644 = 10)
  | (ER30643 = 2 & ANY(ER30644, 20, 22))
  | (ER30690 = 1 & ER30691 = 10)
  | (ER30690 = 2 & ANY(ER30691, 20, 22))
  | (ER30734 = 1 & ER30735 = 10)
  | (ER30734 = 2 & ANY(ER30735, 20, 22))
  .
* Order the selected individuals by the 1990 interview number and store them.
* The stored file is the FILE input of the first MATCH FILES, which needs ID90 order.
* SAVE reads the data itself, so no separate EXECUTE is issued afterwards.
SORT CASES BY ID90 (A).
SAVE OUTFILE="IND90_92.SYS" /COMPRESSED.
* 1990 family-level input: read only the columns needed for the analysis.
FILE HANDLE FAM90
  /NAME="[PATH]\FAM1990.txt"
  /LRECL=2312.
DATA LIST FILE=FAM90 FIXED /
  V17702    4-8
  V17836  283-288
  V18262 1167-1169
  V18564 1633-1635
  V18814 2018
  V18878 2160-2165
  V18887 2206-2212 (2)
  V18888 2213-2219 (2)
  .
VARIABLE LABELS
  V17702 "1990 INTERVIEW NUMBER"
  /V17836 "WIFE 89 LABOR/WAGE"
  /V18262 "C9-10 OCC-LAST JOB (H-U)"
  /V18564 "E9-10 OCC-LAST JOB (W-U)"
  /V18814 "M32 RACE OF HEAD (1 MEN)"
  /V18878 "TOTAL HEAD LABOR Y 89"
  /V18887 "HEAD 89 AVG HRLY EARNING"
  /V18888 "WIFE 89 AVG HRLY EARNING".
* Declare user-missing codes for the two occupation items and the race item.
MISSING VALUES
  V18262 V18564 (999)
  /V18814 (9).
* Name the family interview number like the individual-file key so the two can be matched.
RENAME VARIABLES (V17702 = ID90).
* The family records must be in ID90 order before they can act as a lookup table.
SORT CASES BY ID90 (A).
* Attach the 1990 family variables to each stored individual record with the same ID90.
MATCH FILES
  /FILE="IND90_92.SYS"
  /TABLE=*
  /BY ID90.
* Re-order on the 1991 key for the next merge and store the intermediate result.
SORT CASES BY ID91 (A).
SAVE OUTFILE="FAM_IND.SYS" /COMPRESSED.
* 1991 family-level input: read only the columns needed for the analysis.
FILE HANDLE FAM91
  /NAME="[PATH]\FAM1991.txt"
  /LRECL=2314.
DATA LIST FILE=FAM91 FIXED /
  V19002    2-5
  V19136  281-286
  V19562 1165-1167
  V19864 1631-1633
  V20114 2016
  V20178 2158-2163
  V20187 2204-2210 (2)
  V20188 2211-2217 (2)
  .
VARIABLE LABELS
  V19002 "1991 INTERVIEW NUMBER"
  /V19136 "WIFE 90 LABOR/WAGE"
  /V19562 "C9-10 OCC-LAST JOB (H-U)"
  /V19864 "E9-10 OCC-LAST JOB (W-U)"
  /V20114 "L32 RACE OF HEAD (1 MEN)"
  /V20178 "TOTAL HEAD LABOR Y 90"
  /V20187 "HEAD 90 AVG HRLY EARNING"
  /V20188 "WIFE 90 AVG HRLY EARNING".
* Declare user-missing codes for the two occupation items and the race item.
MISSING VALUES
  V19562 V19864 (999)
  /V20114 (9).
* Name the family interview number like the individual-file key so the two can be matched.
RENAME VARIABLES (V19002 = ID91).
* The family records must be in ID91 order before they can act as a lookup table.
SORT CASES BY ID91 (A).
* Attach the 1991 family variables to each record of the stored merge file with the same ID91.
MATCH FILES
  /FILE="FAM_IND.SYS"
  /TABLE=*
  /BY ID91.
* Re-order on the 1992 key for the next merge and overwrite the intermediate file.
SORT CASES BY ID92 (A).
SAVE OUTFILE="FAM_IND.SYS" /COMPRESSED.
* 1992 family-level input: read only the columns needed for the analysis.
FILE HANDLE FAM92
  /NAME="[PATH]\FAM1992.txt"
  /LRECL=2294.
DATA LIST FILE=FAM92 FIXED /
  V20302    4-7
  V20436  283-288
  V20862 1174-1176
  V21164 1640-1642
  V21420 2031
  V21484 2137-2142
  V21493 2183-2189 (2)
  V21494 2190-2196 (2)
  .
VARIABLE LABELS
  V20302 "1992 INTERVIEW NUMBER"
  /V20436 "WIFE 91 LABOR/WAGE"
  /V20862 "C9-10 OCC-LAST JOB (H-U)"
  /V21164 "E9-10 OCC-LAST JOB (W-U)"
  /V21420 "M32 RACE OF HEAD (1 MEN)"
  /V21484 "TOTAL HEAD LABOR Y 91"
  /V21493 "HEAD 91 AVG HRLY EARNING"
  /V21494 "WIFE 91 AVG HRLY EARNING".
* Declare user-missing codes for the two occupation items and the race item.
MISSING VALUES
  V20862 V21164 (999)
  /V21420 (9).
* Name the family interview number like the individual-file key so the two can be matched.
RENAME VARIABLES (V20302 = ID92).
* The family records must be in ID92 order before they can act as a lookup table.
SORT CASES BY ID92 (A).
* Attach the 1992 family variables to each record of the stored merge file with the same ID92.
MATCH FILES
  /FILE="FAM_IND.SYS"
  /TABLE=*
  /BY ID92.
* Store the finished merge over the intermediate file.
SAVE OUTFILE="FAM_IND.SYS" /COMPRESSED.
|
|