diff --git a/NEED/process-NEED-EULF-2014.do b/NEED/process-NEED-EULF-2014.do
index a7c556db142714937b25962252631f950a575c35..ce33ad9ae0b3099c50f4d2e02e0315029422640c 100644
--- a/NEED/process-NEED-EULF-2014.do
+++ b/NEED/process-NEED-EULF-2014.do
@@ -14,6 +14,23 @@
 * Gcons<year>valid variable has undefined labels: G, L, M = ? Presumably 0 = off gas & V = valid?
 * ideally DECC should set missing to -99 to aid re-coding and avoid unpleasant surprises in naive analysis!
 
+* the Gcons*valid variable codes:
+
+*    G = Gas consumption invalid, greater than 50,000
+*    L = Gas consumption invalid, less than 100
+*    M = Gas consumption data is missing in source data
+*    0 = Property does not have a gas connection
+*    V = Valid gas consumption (between 100 and 50,000 inclusive)
+*    NB - there are valid gas readings of '0' which presumably were > 100 but < 249 (first gas 'heap' = 'nearest 500')
+
+* the Econs*valid variable codes:
+
+*    G = Electricity consumption invalid, greater than 25,000 (DECC lookup table says 50,000)
+*    L = Electricity consumption invalid, less than 100
+*    M = Electricity consumption data is missing in source dataset
+*    V = Valid electricity consumption (between 100 and 25,000 inclusive)
+
+
 /*   
 
 Copyright (C) 2014  University of Southampton
@@ -85,7 +102,6 @@ if `create_codebook' {
 	log off main
 	log using "`dpath'/processed/codebook-NEED-EULF-2014-`version'-`sample'pc-$S_DATE.smcl", replace name(cb)
 	desc
-	di "** no idea what G, L, M mean in the 'valid' variables - presumably 0 = off gas & V = valid?"
 	codebook
 	log close cb
 	log on main
@@ -157,7 +173,6 @@ if `create_xwavefile' {
 		log off main
 		log using "`dpath'/processed/codebook-NEED-EULF-2014-`ifile'_xwavefile-`version'-`samplet'-$S_DATE.smcl", replace name(cb_xwave)
 		desc
-		di "** no idea what G, L, M mean in the 'valid' variables - presumably 0 = off gas & V = valid?"
 		di "** urban/rural would be helpful"
 		codebook
 		compress