Skip to content

Commit

Permalink
remove use of create_missing_column function, just subset on required…
Browse files Browse the repository at this point in the history
… release cols
  • Loading branch information
rxu17 committed Jan 24, 2024
1 parent 30c39e0 commit 7b6c2b3
Showing 1 changed file with 3 additions and 7 deletions.
10 changes: 3 additions & 7 deletions genie/database_to_staging.py
Original file line number Diff line number Diff line change
Expand Up @@ -96,11 +96,10 @@
"SIFT_Prediction": "string",
"SIFT_Score": "float",
"SWISSPROT": "float",
# "genomic_location_explanation": "string",
"n_depth": "float",
"t_depth": "float",
"mutationInCis_Flag": "boolean"
# "Annotation_Status": "string"
"mutationInCis_Flag": "boolean",
"Annotation_Status": "string"
}


Expand Down Expand Up @@ -823,7 +822,6 @@ def store_maf_files(
with open(MUTATIONS_CENTER_PATH % center, "w"):
pass
used_entities = []
# Must get the headers (because can't assume headers are the same order)
maf_ent = syn.get(centerMafSynIdsDf.id[0])
for _, mafSynId in enumerate(centerMafSynIdsDf.id):
maf_ent = syn.get(mafSynId)
Expand All @@ -842,9 +840,7 @@ def store_maf_files(
configured_mafdf = configure_maf(
mafchunk, remove_mafinbed_variants, flagged_mutationInCis_variants
)
configured_mafdf = process_functions.create_missing_columns(
dataset=configured_mafdf, schema=FULL_MAF_RELEASE_SCHEMA
)
configured_mafdf = configured_mafdf[list(FULL_MAF_RELEASE_SCHEMA.keys())]
# Create maf for release
merged_mafdf = remove_maf_samples(
configured_mafdf, keep_for_merged_consortium_samples
Expand Down

0 comments on commit 7b6c2b3

Please sign in to comment.