diff --git a/NEED/process-NEED-EULF-2014.do b/NEED/process-NEED-EULF-2014.do index a7c556db142714937b25962252631f950a575c35..ce33ad9ae0b3099c50f4d2e02e0315029422640c 100644 --- a/NEED/process-NEED-EULF-2014.do +++ b/NEED/process-NEED-EULF-2014.do @@ -14,6 +14,23 @@ * Gcons<year>valid variable has undefined labels: G, L, M = ? Presumably 0 = off gas & V = valid? * ideally DECC should set missing to -99 to aid re-coding and avoid unpleasant surprises in naive analysis! +* The Gcons*valid variable codes: + +* G = Gas consumption invalid, greater than 50,000 +* L = Gas consumption invalid, less than 100 +* M = Gas consumption data is missing in source data +* 0 = Property does not have a gas connection +* V = Valid gas consumption (between 100 and 50,000 inclusive) +* NB - there are valid gas readings of '0' which presumably were > 100 but < 249 (first gas 'heap' = 'nearest 500') + +* The Econs*valid variable codes: + +* G = Electricity consumption invalid, greater than 25,000 (DECC lookup table says 50,000) +* L = Electricity consumption invalid, less than 100 +* M = Electricity consumption data is missing in source dataset +* V = Valid electricity consumption (between 100 and 25,000 inclusive) + + /* Copyright (C) 2014 University of Southampton @@ -85,7 +102,6 @@ if `create_codebook' { log off main log using "`dpath'/processed/codebook-NEED-EULF-2014-`version'-`sample'pc-$S_DATE.smcl", replace name(cb) desc - di "** no idea what G, L, M mean in the 'valid' variables - presumably 0 = off gas & V = valid?" codebook log close cb log on main @@ -157,7 +173,6 @@ if `create_xwavefile' { log off main log using "`dpath'/processed/codebook-NEED-EULF-2014-`ifile'_xwavefile-`version'-`samplet'-$S_DATE.smcl", replace name(cb_xwave) desc - di "** no idea what G, L, M mean in the 'valid' variables - presumably 0 = off gas & V = valid?" di "** urban/rural would be helpful" codebook compress