Skip to content
Snippets Groups Projects
Commit 8f8b5119 authored by Jakub Dylag
Browse files

move summary excel into json config

parent 28f44a19
No related branches found
No related tags found
No related merge requests found
...@@ -255,23 +255,14 @@ def run_all(mapping_file, target_code_type, ...@@ -255,23 +255,14 @@ def run_all(mapping_file, target_code_type,
out = out.drop_duplicates(subset=["CONCEPT_SET", "CONCEPT"]) out = out.drop_duplicates(subset=["CONCEPT_SET", "CONCEPT"])
out = out.sort_values(by=["CONCEPT_SET", "CONCEPT"]) out = out.sort_values(by=["CONCEPT_SET", "CONCEPT"])
#Merge with Concept Types in Summary Excel File #Add Concept Set Definitions metadata
if "excel_sheet" in summary_config: summary_df = pd.DataFrame(summary_config["concept_set"]) #transform to dataframe
summary_df = read_table_file(summary_config["file"], excel_sheet=summary_config["excel_sheet"]) if "metadata" in summary_df.columns:
else: summary_df = summary_df.join(pd.json_normalize(summary_df["metadata"])) #metadata to columns
summary_df = read_table_file(summary_config["file"]) summary_df = summary_df.drop(columns=["metadata"])
summary_cols_all = [] #get all column names summary_df = summary_df.rename(columns={"concept_set_name":"CONCEPT_SET"})
for v in summary_config["columns"].values(): #TODO: put in seperate function - get all columns in JSON file object
if type(v) == str:
summary_cols_all.append(v)
else:
summary_cols_all += v
output_version = summary_config["version"]
summary_df = summary_df[summary_cols_all] #select all relevant columns
summary_df = summary_df.rename(columns={summary_config["columns"]["concept_set_name"]: "CONCEPT_SET"})
summary_df = summary_df.drop_duplicates() #remove duplicates summary_df = summary_df.drop_duplicates() #remove duplicates
out = out.merge(summary_df, how="left", on='CONCEPT_SET') out = out.merge(summary_df, how="left", on='CONCEPT_SET') #merge with output
# Save Output File # Save Output File
print(bcolors.HEADER, "---"*5, "OUTPUT", "---"*5, bcolors.ENDC) print(bcolors.HEADER, "---"*5, "OUTPUT", "---"*5, bcolors.ENDC)
......
This diff is collapsed.
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Please register or sign in to comment