5 years ago · 9ed4f3828e
--- a/R/combmodels.R
+++ b/R/combmodels.R
@@ -27,7 +27,7 @@ cbp <- as.character(p$Series(sns$color_palette("colorblind", as.integer(9))$as_h
 
				 
			
 
				 ntps <- length(unique(aggdf$read_time))
			
 
				 
			
 
				-clus = "9"
			
 
				+clus = "1"
			
 
				 
			
 
				 yfreq <- floor(48 * 365.25)
			
 
				 wfreq <- floor(48 * 7)
			
@@ -89,7 +89,7 @@ cmplot + coord_cartesian(xlim = c(as.POSIXct("2017-03-01", tz = "UTC"), as.POSIX
 
				 #                 direction = "both", steps = 300)
			
 
				 
			
 
				 
			
 
				-newagg <- p$read_pickle("../data/9-proj-agg.pkl")
			
 
				+newagg <- p$read_pickle("../data/1617-agg.pkl")
			
 
				 newagg$cluster <- factor(newagg$cluster)
			
 
				 str(newagg)
			
 
				 
			
@@ -119,7 +119,14 @@ predplot <-ggplot(predf, aes(x = x, y = y)) + geom_line(aes(y = f), color = "blu
 
				 
			
 
				 predplot
			
 
				 
			
 
				-predplot + coord_cartesian(xlim = c(as.POSIXct("2018-03-01", tz = "UTC"), as.POSIXct("2018-04-01", tz = "UTC")))
			
 
				+predplot + coord_cartesian(xlim = c(as.POSIXct("2017-03-01", tz = "UTC"), as.POSIXct("2017-04-01", tz = "UTC")))
			
 
				 
			
 
				 mean(abs(predf$r))
			
 
				 sd(predf$r)
			
 
				+
			
 
				+
			
 
				+# number of icps per cluster
			
 
				+ocdf <- p$read_pickle('../data/9-clusters-sample-table.pkl')
			
 
				+ncdf <- p$read_pickle('../data/1617-asgn-table.pkl')
			
 
				+table(ocdf$cluster)
			
 
				+table(ncdf$cluster)
			
--- a/img/all-9-fix-1617-asigned.png
+++ b/img/all-9-fix-1617-asigned.png
--- a/img/all-9-fre-1617-asigned.png
+++ b/img/all-9-fre-1617-asigned.png
--- a/img/apr-9-fix-1617-asigned.png
+++ b/img/apr-9-fix-1617-asigned.png
--- a/img/apr-9-fre-1617-asigned.png
+++ b/img/apr-9-fre-1617-asigned.png
--- a/img/jan-9-fix-1617-asigned.png
+++ b/img/jan-9-fix-1617-asigned.png
--- a/img/jan-9-fre-1617-asigned.png
+++ b/img/jan-9-fre-1617-asigned.png
--- a/img/jul-9-fix-1617-asigned.png
+++ b/img/jul-9-fix-1617-asigned.png
--- a/img/jul-9-fre-1617-asigned.png
+++ b/img/jul-9-fre-1617-asigned.png
--- a/img/oct-9-fix-1617-asigned.png
+++ b/img/oct-9-fix-1617-asigned.png
--- a/img/oct-9-fre-1617-asigned.png
+++ b/img/oct-9-fre-1617-asigned.png
--- a/py/clusAssign.py
+++ b/py/clusAssign.py
@@ -8,6 +8,12 @@ clusfile = '../data/9-clusters.agg.pkl'
 
				 # A new dataset
			
 
				 ndsfile = '../data/2016-17-sample.pkl'
			
 
				 
			
 
				+# Table of assigned clusters
			
 
				+aclusfile = '../data/1617-asgn-table.pkl'
			
 
				+
			
 
				+# Aggregated dataset
			
 
				+aggfile = '../data/1617-agg.pkl'
			
 
				+
			
 
				 
			
 
				 clusdf = p.read_pickle(clusfile)
			
 
				 clusdf = clusdf.pivot(index = 'read_time', columns = 'cluster', values = 'kwh_tot_mean')
			
@@ -44,14 +50,28 @@ for i in icps:
 
				         print('ICP {} has constant value; assigning to cluster -1'.format(i))
			
 
				     clusdict[i] = bestc
			
 
				 
			
 
				-# Need to make sure cluster is integer ZZZ
			
 
				 newclusdf = p.DataFrame.from_dict(clusdict, orient = 'index', columns = ['cluster'])
			
 
				 newclusdf.index.name = 'icp_id'
			
 
				 newclusdf = newclusdf.reset_index()
			
 
				-# print(newclusdf)
			
 
				+print(newclusdf)
			
 
				+newclusdf.to_pickle(aclusfile)
			
 
				+
			
 
				 
			
 
				 newdf = p.melt(newdf.reset_index(), 'read_time', var_name = 'icp_id', value_name = 'kwh')
			
 
				 
			
 
				-######## ZZZ Something isn't working here
			
 
				-anndf = newdf.set_index('icp_id').join(newclusdf)
			
 
				+print(newdf.info())
			
 
				+print(newclusdf.info())
			
 
				+
			
 
				+anndf = newdf.set_index('icp_id').join(newclusdf.set_index('icp_id')).reset_index()
			
 
				 print(anndf)
			
 
				+
			
 
				+qlow  = lambda x: x.quantile(0.250)
			
 
				+qhigh = lambda x: x.quantile(0.750)
			
 
				+newagg = anndf.groupby(['read_time', 'cluster']).agg({
			
 
				+        'kwh': ['median', 'mean', ('CI_low', qlow), ('CI_high', qhigh)]
			
 
				+})
			
 
				+newagg.columns = ['_tot_'.join(x) for x in newagg.columns.ravel()]
			
 
				+newagg = newagg.reset_index()
			
 
				+
			
 
				+print(newagg)
			
 
				+newagg.to_pickle(aggfile)