Skip to content

Commit

Permalink
create.py duplicate strain name bug (#50)
Browse files Browse the repository at this point in the history
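Fixes an issue that created duplicate "strain" columns when using src-strain: the "src-" prefix is stripped from source columns (so src-strain becomes strain), and ncbi-spuid was also being renamed to "strain". The ncbi-spuid rename is removed.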
  • Loading branch information
dthoward96 committed Apr 4, 2024
1 parent 998065c commit c61812b
Showing 1 changed file with 1 addition and 1 deletion.
2 changes: 1 addition & 1 deletion create.py
Original file line number Diff line number Diff line change
Expand Up @@ -399,7 +399,7 @@ def create_genbank_files(organism, config_dict, metadata, fasta_file, submission
# Retrieve the source df
source_df = metadata.filter(regex="^gb-seq_id$|^src-|^ncbi-spuid$|^ncbi-bioproject$|^organism$|^collection_date$").copy()
source_df.columns = source_df.columns.str.replace("src-","").str.strip()
source_df = source_df.rename(columns = {"gb-seq_id":"Sequence_ID", "collection_date":"Collection_date", "ncbi-spuid":"strain"})
source_df = source_df.rename(columns = {"gb-seq_id":"Sequence_ID", "collection_date":"Collection_date"})
# Add BioProject if available
if "ncbi-bioproject" in source_df:
source_df = source_df.rename(columns={"ncbi-bioproject": "BioProject"})
Expand Down

0 comments on commit c61812b

Please sign in to comment.