Skip to content

Commit

Permalink
#401 filtered table now goes into further analysis
Browse files Browse the repository at this point in the history
  • Loading branch information
luppovdaniil committed Jan 30, 2025
1 parent 8ef6797 commit 0330a78
Showing 1 changed file with 3 additions and 2 deletions.
5 changes: 3 additions & 2 deletions py_src/runBuidDatabase.py
Original file line number Diff line number Diff line change
Expand Up @@ -80,7 +80,7 @@
master_table[f"j.{gene}"] = fixer_results.apply(lambda x: x.jId if x else None)
master_table[f"cdr3fix.{gene}"] = fixer_results.apply(lambda x: x.results_to_dict() if x else None)

-master_table.set_index("cdr3.alpha").to_csv("../database/vdjdb_full.txt", sep="\t", quotechar='"')
+master_table.set_index("cdr3.alpha").to_csv("../database/vdjdb_full_unfiltered.txt", sep="\t", quotechar='"')

mask_gene_list = []
mask_alleles_list = []
Expand All @@ -99,10 +99,11 @@
final_mask_alleles = final_mask_alleles | (master_table['species'] != 'HomoSapiens')
final_mask = final_mask | (master_table['species'] != 'HomoSapiens')

-master_table.loc[final_mask & final_mask_alleles].set_index('cdr3.alpha').to_csv('../database/vdjdb_full_gene_clear.txt', sep='\t')
+master_table.loc[final_mask & final_mask_alleles].set_index('cdr3.alpha').to_csv('../database/vdjdb_full.txt', sep='\t')
master_table.loc[~final_mask].set_index('cdr3.alpha').to_csv('../database/vdjdb_full_gene_broken.txt', sep='\t')
master_table.loc[~final_mask_alleles].set_index('cdr3.alpha').to_csv('../database/vdjdb_full_allele_broken.txt', sep='\t')

+master_table = master_table.loc[final_mask & final_mask_alleles]
cprint("Generating and writing default database", 'magenta')
default_db = generate_default_db(master_table)

Expand Down

0 comments on commit 0330a78

Please sign in to comment.