*****pgm: descriptive_distribution.do****
* Purpose: describe the distribution of lbxtc by sex (riagendr) and age
*          group (age) for records with ridageyr >= 20 and ridstatr == 2.
* Inputs : C:\NHANES\Data\analysis_data.dta
* Outputs: C:\NHANES\log\distribution.log
*          C:\NHANES\graph\histogram_descriptive.gph
*          C:\NHANES\graph\box_plot.gph
* NOTE(review): lbxtc is presumably total cholesterol, wtmec4yr the 4-year
*               exam weight and ridstatr==2 "interviewed and examined" --
*               confirm against the NHANES codebook.

use "C:\NHANES\Data\analysis_data.dta", clear

* Age groups. The "<." guard keeps missing ridageyr out of the 60+ group,
* because Stata treats missing values as larger than any number.
generate age = 1 if ridageyr >= 20 & ridageyr <= 39
replace  age = 2 if ridageyr >= 40 & ridageyr <= 59
replace  age = 3 if ridageyr >= 60 & ridageyr < .

****format variables******
label define agefmt 1 "20-39" 2 "40-59" 3 "60+"
label define sexfmt 1 "male" 2 "female"
label values age agefmt
label values riagendr sexfmt

* Analysis sample shared by every command below.
local insample "(ridageyr >= 20 & ridageyr < .) & ridstatr == 2"

* Close any log left open by an earlier aborted run so that "log using"
* does not stop with a "log file already open" error.
capture log close
log using "C:\NHANES\log\distribution.log", replace

* Weighted detailed summary statistics within each sex-by-age cell.
by riagendr age, sort: summarize lbxtc if `insample' [aweight = wtmec4yr], detail

* Histograms with a normal-density overlay, one panel per sex-by-age cell.
* The if qualifier must precede the comma; everything after it is an option.
histogram lbxtc if `insample', by(riagendr age) normal
graph save "C:\NHANES\graph\histogram_descriptive.gph", replace

* Weighted box plots grouped by sex within age group.
graph box lbxtc if `insample' [pweight = wtmec4yr], ///
    medtype(line) over(riagendr) over(age)
graph save "C:\NHANES\graph\box_plot.gph", replace

log close