/********** DEEL 1: DATABEHEER **********
*****************************************
*Controle individuele variabelen
********************************/
/* Copy the source file into the dataset ess2; the later steps in this
   program read and overwrite that dataset. */
data ess2;
    set "/folders/myfolders/ess2e03_3.sas7bdat";
run;
/* First pass: frequency tables of the analysis variables, displayed with
   whatever formats are stored on them. */
proc freq data = ess2;
    tables CNTRY DOMICIL AGEA HINCTNT
           EDULVLA HEALTH UEMP12M;
run;

/* Second pass: a FORMAT statement that lists variables without naming a
   format removes their formats for this step, so the raw stored values
   are tabulated instead of the formatted ones. */
proc freq data = ess2;
    format CNTRY DOMICIL AGEA HINCTNT
           EDULVLA HEALTH UEMP12M;
    tables CNTRY DOMICIL AGEA HINCTNT
           EDULVLA HEALTH UEMP12M;
run;
/* Reverse HEALTH into HEALTHRev. */
data ess2;
    set ess2;
    /* Mirror the scale (1<->5, 2<->4, 3 stays 3). This assumes HEALTH is coded
       1-5, as the 6 - HEALTH formula implies. Any other value, including a
       missing one, yields a missing HEALTHRev rather than an out-of-range score. */
    if 1 <= HEALTH <= 5 then HEALTHRev = 6 - HEALTH;
    else HEALTHRev = .;
    label HEALTHRev = "Subjective general health - Reversed";
run;

/* Check the distribution of the reversed variable. */
proc freq data = ess2;
    tables HEALTHRev;
run;
/* Dummy-code DOMICIL. Values 1, 2, 3 and 5 each get an indicator variable;
   value 4 ("Country village") gets none and so acts as the reference category. */
data ess2;
    set ess2;

    /* A comparison evaluates to 1 when true and 0 when false. */
    D1DOMICIL = (DOMICIL = 1);
    D2DOMICIL = (DOMICIL = 2);
    D3DOMICIL = (DOMICIL = 3);
    D4DOMICIL = (DOMICIL = 5);

    /* SAS missing values compare lower than any number, so this test is true
       for a missing DOMICIL (and for any negative code); in that case all
       four indicators are set to missing instead of 0. */
    if DOMICIL < 0 then
        call missing(D1DOMICIL, D2DOMICIL, D3DOMICIL, D4DOMICIL);

    label
        D1DOMICIL = "Big city - dummy"
        D2DOMICIL = "Suburbs - dummy"
        D3DOMICIL = "Town or small city - dummy"
        D4DOMICIL = "Farm or home in countryside - dummy"
    ;
run;

/* Check the four indicator variables. */
proc freq data = ess2;
    tables D1DOMICIL D2DOMICIL D3DOMICIL D4DOMICIL;
run;
/* Recode EDULVLA into the three-level variable EDULVLARec. */

/* Display labels for the three recoded levels. */
proc format;
    value EDULVLARecfmt
        1 = "Laag geschoold"
        2 = "Midden geschoold"
        3 = "Hoog geschoold"
    ;
run;

data ess2;
    set ess2;
    /* 1 -> 1, 2 to 4 -> 2, 5 -> 3; every other value, including missing,
       falls through to OTHERWISE and becomes missing. */
    select (EDULVLA);
        when (1)       EDULVLARec = 1;
        when (2, 3, 4) EDULVLARec = 2;
        when (5)       EDULVLARec = 3;
        otherwise      EDULVLARec = .;
    end;
    label EDULVLARec = "Highest level of education - Recoded";
    format EDULVLARec EDULVLARecfmt.;
run;

/* Check the distribution of the recoded variable. */
proc freq data = ess2;
    tables EDULVLARec;
run;
/* Build the numeric country identifier CNTRYNUM from CNTRY. */

/* The BY-group processing in the DATA step needs the rows ordered by CNTRY. */
proc sort data = ess2;
    by CNTRY;
run;

data ess2;
    set ess2;
    by CNTRY;
    /* Sum statement: the counter is retained across rows and is incremented
       only on the first row of each CNTRY group, so all rows of one country
       share the same number. */
    if first.CNTRY then CNTRYNUM + 1;
    label CNTRYNUM = "Numerieke landvariabele";
run;

/* Compare the original and the numeric country variable. */
proc freq data = ess2;
    tables CNTRY CNTRYNUM;
run;
/* Aggregate UEMP12M within each country. */

/* The BY statement in PROC FREQ needs the rows ordered by CNTRYNUM. */
proc sort data = ess2;
    by CNTRYNUM;
run;

/* NOPRINT suppresses the printed tables; OUT= stores the frequency table of
   UEMP12M, computed separately for each CNTRYNUM, in the dataset frequnemp. */
proc freq data = ess2 noprint;
    by CNTRYNUM;
    tables UEMP12M / out = frequnemp;
run;
/*******************************************************************
 * Individual variable checks.
 * NOTE(review): from here on the program repeats the steps that
 * appear earlier in this file - confirm whether the repeat is wanted.
 *******************************************************************/

/* Reload the source file, so ess2 starts again from the stored data. */
data ess2;
    set "/folders/myfolders/ess2e03_3.sas7bdat";
run;
/* First pass: frequency tables of the analysis variables, displayed with
   whatever formats are stored on them. */
proc freq data = ess2;
    tables CNTRY DOMICIL AGEA HINCTNT
           EDULVLA HEALTH UEMP12M;
run;

/* Second pass: a FORMAT statement that lists variables without naming a
   format removes their formats for this step, so the raw stored values
   are tabulated instead of the formatted ones. */
proc freq data = ess2;
    format CNTRY DOMICIL AGEA HINCTNT
           EDULVLA HEALTH UEMP12M;
    tables CNTRY DOMICIL AGEA HINCTNT
           EDULVLA HEALTH UEMP12M;
run;
/* Reverse HEALTH into HEALTHRev. */
data ess2;
    set ess2;
    /* Mirror the scale (1<->5, 2<->4, 3 stays 3). This assumes HEALTH is coded
       1-5, as the 6 - HEALTH formula implies. Any other value, including a
       missing one, yields a missing HEALTHRev rather than an out-of-range score. */
    if 1 <= HEALTH <= 5 then HEALTHRev = 6 - HEALTH;
    else HEALTHRev = .;
    label HEALTHRev = "Subjective general health - Reversed";
run;

/* Check the distribution of the reversed variable. */
proc freq data = ess2;
    tables HEALTHRev;
run;
/* Dummy-code DOMICIL. Values 1, 2, 3 and 5 each get an indicator variable;
   value 4 ("Country village") gets none and so acts as the reference category. */
data ess2;
    set ess2;

    /* A comparison evaluates to 1 when true and 0 when false. */
    D1DOMICIL = (DOMICIL = 1);
    D2DOMICIL = (DOMICIL = 2);
    D3DOMICIL = (DOMICIL = 3);
    D4DOMICIL = (DOMICIL = 5);

    /* SAS missing values compare lower than any number, so this test is true
       for a missing DOMICIL (and for any negative code); in that case all
       four indicators are set to missing instead of 0. */
    if DOMICIL < 0 then
        call missing(D1DOMICIL, D2DOMICIL, D3DOMICIL, D4DOMICIL);

    label
        D1DOMICIL = "Big city - dummy"
        D2DOMICIL = "Suburbs - dummy"
        D3DOMICIL = "Town or small city - dummy"
        D4DOMICIL = "Farm or home in countryside - dummy"
    ;
run;

/* Check the four indicator variables. */
proc freq data = ess2;
    tables D1DOMICIL D2DOMICIL D3DOMICIL D4DOMICIL;
run;
/* Recode EDULVLA into the three-level variable EDULVLARec. */

/* Display labels for the three recoded levels. */
proc format;
    value EDULVLARecfmt
        1 = "Laag geschoold"
        2 = "Midden geschoold"
        3 = "Hoog geschoold"
    ;
run;

data ess2;
    set ess2;
    /* 1 -> 1, 2 to 4 -> 2, 5 -> 3; every other value, including missing,
       falls through to OTHERWISE and becomes missing. */
    select (EDULVLA);
        when (1)       EDULVLARec = 1;
        when (2, 3, 4) EDULVLARec = 2;
        when (5)       EDULVLARec = 3;
        otherwise      EDULVLARec = .;
    end;
    label EDULVLARec = "Highest level of education - Recoded";
    format EDULVLARec EDULVLARecfmt.;
run;

/* Check the distribution of the recoded variable. */
proc freq data = ess2;
    tables EDULVLARec;
run;
/* Build the numeric country identifier CNTRYNUM from CNTRY. */

/* The BY-group processing in the DATA step needs the rows ordered by CNTRY. */
proc sort data = ess2;
    by CNTRY;
run;

data ess2;
    set ess2;
    by CNTRY;
    /* Sum statement: the counter is retained across rows and is incremented
       only on the first row of each CNTRY group, so all rows of one country
       share the same number. */
    if first.CNTRY then CNTRYNUM + 1;
    label CNTRYNUM = "Numerieke landvariabele";
run;

/* Compare the original and the numeric country variable. */
proc freq data = ess2;
    tables CNTRY CNTRYNUM;
run;
/* Aggregate UEMP12M within each country. */

/* The BY statement in PROC FREQ needs the rows ordered by CNTRYNUM. */
proc sort data = ess2;
    by CNTRYNUM;
run;

/* NOPRINT suppresses the printed tables; OUT= stores the frequency table of
   UEMP12M, computed separately for each CNTRYNUM, in the dataset frequnemp. */
proc freq data = ess2 noprint;
    by CNTRYNUM;
    tables UEMP12M / out = frequnemp;
run;