diff --git a/NEED/process-NEED-EULF-2014.do b/NEED/process-NEED-EULF-2014.do
index d8639e98f6cf8bec97daca014c345507d712ca0d..5d1af391cdbfbc2173041f5ef12edf9a172b9e64 100644
--- a/NEED/process-NEED-EULF-2014.do
+++ b/NEED/process-NEED-EULF-2014.do
@@ -36,9 +36,11 @@ local ifile "need_eul_may2014"
 * original data file
 local dfile_orig "`dpath'UKDA-7518-stata11/stata11/`ifile'.dta"
 
-* 10 = 10% sample, 50 = 50% sample, 100 = 100% sample
+
 * if you really wanted to you could set up a loop to iterate over a list of sample values to create a set of random sub-samples
-local sample 50
+* here we just create one random sub-sample, sized as a percentage by the local macro sample, to make testing models etc. easier
+* e.g. 10 = 10% sample, 50 = 50% sample, 100 = 100% sample
+local sample 20
 local samplet "`sample'pc"
 local sampleby "EE_BAND PROP_TYPE"