# https://github.com/ab4377/dream-project
# Tip revision: 8e64d9628355fde264b6481f9955478fed995fe5 authored by Avinash Bukkittu on 04 October 2017, 22:20:26 UTC
# Merge branch 'master' of https://github.com/ab4377/dream-project
# Merge branch 'master' of https://github.com/ab4377/dream-project
# Tip revision: 8e64d96
# FindRecordIdsByCategory.py
import pandas as pd
import Constants
# Write one "<category>.csv" file per category, listing the recordIds of every
# metadata row whose (phoneInfo, medTimepoint) pair maps to that category.

# Build the lookup (phoneInfo, medTimepoint) -> category name.
# Each "value" cell is split on "-" and its first two tokens form the key,
# so it is expected to look like "<phoneInfo>-<medTimepoint>".
category_df = pd.read_csv("category.csv")
category = {}
for value, name in zip(category_df["value"], category_df["category"]):
    tokens = value.split("-")
    category[(tokens[0], tokens[1])] = name

# Collect the record IDs of every (phoneInfo, medTimepoint) group.
df = pd.read_csv(Constants.meta_data_location)
grouped = df.groupby(by=["phoneInfo", "medTimepoint"])
groups = {}
for key, group in grouped:
    # The iterator already yields the group's frame; no get_group() needed.
    groups[key] = group["recordId"].tolist()

# Merge groups that share a category before writing. Writing one file per
# group would let a later group overwrite an earlier group's file whenever
# two keys map to the same category, silently dropping record IDs.
# A group with no entry in category.csv raises KeyError here, before any
# output file is written.
record_ids_by_category = {}
for key, group in grouped:
    record_ids_by_category.setdefault(category[key], []).extend(groups[key])

for name, record_ids in record_ids_by_category.items():
    data = pd.DataFrame(record_ids, columns=["recordIds"])
    # One record ID per line, with neither index nor header row.
    data.to_csv(name + ".csv", index=False, header=False)