Administrator approval is now required for registering new accounts. If you are registering a new account, and are external to the University, please ask the repository owner to contact ServiceLine to request your account be approved. Repository owners must include the newly registered email address, and specific repository in the request for approval.

Commit 153ddb41 authored by Ben Anderson's avatar Ben Anderson
Browse files

updated descriptives

added do_graphs switch
checks for valid gas values of 0 due to rounding of 100 < gcons < 250
to ‘nearest’ 500 - i.e 0!
parent 5998ea78
......@@ -28,11 +28,14 @@ local rpath "`proot'/results/NEED"
local version "v1.1"
* quick tests for 2012
local do_2012_desc = 0
local do_2012_desc = 1
* tests for all years using long file - takes a while
local do_long_desc = 1
* toggle graph drawing
local do_graphs = 0
set more off
log using "`rpath'/analyse-NEED-EULF-2014-descriptives-`version'-$S_DATE.smcl", replace
......@@ -48,13 +51,26 @@ if `do_2012_desc' {
* processor intensive
local vars "Econs2012 Gcons2012"
local tvars "EE_BAND FLOOR_AREA_BAND PROP_AGE"
* test values for valid - check for valid 0s for example. This only happens for gas where:
* gas cons > 100 (so included) but cons < 250 so 'rounded' to nearest 500 = 0
* elec always rounded to nearest 50 so min shoudl always be 100
foreach v of local vars {
tabstat `v', by(`v'Valid) s(n mean semean min max)
foreach tv of local tvars {
histogram `v' , by(`tv') name(h_`tv'_`v'_`sample')
graph export "`rpath'/NEED-EULF-2014-histo_`v'_by_`tv'_`sample'.png", replace
di "***************"
di "* Testing `tv'"
* test values for `tv' - check for 0s for example
tabstat `v' if `v'Valid == "V", by(`tv') s(n mean semean min max)
tab `v' if `v' < 1000
if `do_graphs' {
histogram `v' if `v'Valid == "V", by(`tv') name(h_`tv'_`v'_`sample')
graph export "`rpath'/NEED-EULF-2014-histo_`v'_by_`tv'_`sample'_valid.png", replace
graph box `v', over(`tv') name(b_`tv'_`v'_`sample')
graph export "`rpath'/NEED-EULF-2014-box_`v'_by_`tv'_`sample'.png", replace
graph box `v' if `v'Valid == "V", over(`tv') name(b_`tv'_`v'_`sample')
graph export "`rpath'/NEED-EULF-2014-box_`v'_by_`tv'_`sample'_valid.png", replace
}
}
}
}
......@@ -62,7 +78,7 @@ if `do_2012_desc' {
if `do_long_desc' {
* Now use the pre-processed long form file which contains all years of consumption data but not the constant values (housing charactersitics etc) which are in the xwave file
* do this for each random sample of differening sizes as a check
local samples "10 20 130 40 50 100"
local samples "10 20 30 40 50 100"
foreach s of local samples {
di "************************"
di "* Using `s'% sample"
......@@ -71,23 +87,33 @@ if `do_long_desc' {
* set as panel in case it wasn't
xtset HH_ID year
* examine panel status
xtdescribe
xtsum Econs Gcons
* summarise Electricity
table EconsValid year, c(count Econs min Econs mean Econs max Econs)
* summarise Gas
table GconsValid year, c(count Gcons min Gcons mean Gcons max Gcons)
* distributions by year
* distributions for valid obs
local vars "Econs Gcons"
foreach v of local vars {
histogram `v', by(year) name(histo_`s'pc_`v')
graph export "`rpath'/NEED-EULF-2014-`s'pc-histo_`v'_by_year.png", replace
graph box `v', over(year) name(box_`s'pc_`v')
graph export "`rpath'/NEED-EULF-2014-`s'pc-box_`v'_by_year.png", replace
* overall
xtsum `v' if `v'Valid == "V"
* test values for valid - check for valid 0s for example. This only happens for gas where:
* gas cons > 100 (so included) but cons < 250 so 'rounded' to nearest 500 = 0
* elec always rounded to nearest 50 so min shoudl always be 100
tabstat `v', by(`v'Valid) s(n mean semean min max)
* by year
* check for 0s
table `v' year if `v' < 1000
table `v'Valid year, c(count `v' min `v' mean `v' max `v')
if `do_graphs' {
histogram `v' if `v'Valid == "V", by(year) name(histo_`s'pc_`v')
graph export "`rpath'/NEED-EULF-2014-`s'pc-histo_`v'_by_year_valid.png", replace
graph box `v' if `v'Valid == "V", over(year) name(box_`s'pc_`v')
graph export "`rpath'/NEED-EULF-2014-`s'pc-box_`v'_by_year_valid.png", replace
}
}
* check the years where gas = valid but consumption = 0
* Presumably in these cases gas > 100 but < 249 ?
}
}
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment