Repository for Petra's work at ampli Jan-Feb 2019

agg.py 528B

1234567891011121314151617181920212223
  1. # Aggregate given clusters
  2. import pandas as p
  3. def aggregator(widedf, clusdf):
  4. clusters = clusdf.cluster.unique()
  5. clusters.sort()
  6. aggv = {}
  7. qlow = lambda x: x.quantile(0.250)
  8. qhigh = lambda x: x.quantile(0.750)
  9. for c in clusters:
  10. icps = clusters[clusters.cluster == c].icp_id.values
  11. subdf = widedf[icps]
  12. agged = subdf.agg('median', 'mean', qlow, qhigh)
  13. print(agged)
  14. def main():
  15. wd = p.read_pickle()
  16. cd = p.read_pickle()
  17. if __name__ == "__main__":
  18. main()