Skip to content

Commit b211a11

Browse files
authored
Merge pull request #17 from HobnobMancer/test_exploration
Test exploration
2 parents e99c2bb + 8377685 commit b211a11

File tree

9 files changed

+507
-8
lines changed

9 files changed

+507
-8
lines changed

cazomevolve/cazome/explore/explore_cazomes.py

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -310,7 +310,7 @@ def compare_cazy_families(fgp_df, args):
310310
index.append('Class')
311311
if args.tax_order:
312312
index.append('Order')
313-
if args.tax_family_:
313+
if args.tax_family:
314314
index.append('Family')
315315
if args.genus:
316316
index.append('Genus')
@@ -323,15 +323,15 @@ def compare_cazy_families(fgp_df, args):
323323
fam_freq_genus_row_colours, fam_g_lut = build_row_colours(fam_freq_df_ggs, args.group_by, 'Set2')
324324

325325
for file_format in args.formats:
326-
outpath_cm = outdir / f"cazy_family_clustermap.{args.file_format}"
326+
outpath_cm = outdir / f"cazy_family_clustermap.{file_format}"
327327
logger.warning(
328328
f"Writing out clustermap of CAZy family frequencies in {file_format} format to:\n"
329329
f"{outpath_cm}"
330330
)
331331
build_family_clustermap(
332332
fam_freq_df_ggs,
333333
row_colours=fam_freq_genus_row_colours,
334-
fig_size=((len(fam_freq_df_ggs).columns)*0.4, len(fam_freq_df_ggs)*0.4),
334+
fig_size=(len(fam_freq_df_ggs.columns)*0.4, len(fam_freq_df_ggs)*0.4),
335335
file_path=outpath_cm,
336336
file_format=format,
337337
lut=fam_g_lut,
@@ -378,7 +378,7 @@ def compare_core_cazomes(fam_freq_df, fam_freq_df_ggs, all_families, args):
378378
index.append('Class')
379379
if args.tax_order:
380380
index.append('Order')
381-
if args.tax_family_:
381+
if args.tax_family:
382382
index.append('Family')
383383
if args.genus:
384384
index.append('Genus')
@@ -437,7 +437,7 @@ def find_always_cooccurring_families(fam_freq_df, fam_freq_df_ggs, all_families,
437437
exclude_core_cazome=False,
438438
)
439439
with open(outpath_all, "w") as fh:
440-
fh.write(cooccurring_fams_dict)
440+
fh.write(str(cooccurring_fams_dict))
441441

442442
grp_cooccuring_fams = {} # {genus: cooccurring_fams_dict}
443443
for grp in set(fam_freq_df[args.group_by]):
@@ -449,7 +449,7 @@ def find_always_cooccurring_families(fam_freq_df, fam_freq_df_ggs, all_families,
449449
)
450450
grp_cooccuring_fams[grp] = grp_cooccurring_fams_dict
451451
with open(outpath_grp, "w") as fh:
452-
fh.write(grp_cooccuring_fams)
452+
fh.write(str(grp_cooccuring_fams))
453453

454454
upsetplot_membership = []
455455
upsetplot_membership = add_to_upsetplot_membership(upsetplot_membership, cooccurring_fams_dict)
@@ -473,7 +473,7 @@ def find_always_cooccurring_families(fam_freq_df, fam_freq_df_ggs, all_families,
473473

474474
# calculate frequencies
475475
upset_plot_groups = get_upsetplot_grps(upsetplot_membership)
476-
476+
cooccurring_grp_freq_data = []
477477
cooccurring_grp_freq_data = add_upsetplot_grp_freqs(
478478
upset_plot_groups,
479479
cooccurring_grp_freq_data,
@@ -511,7 +511,7 @@ def run_pca(fam_freq_df, fam_freq_df_ggs, all_families, args):
511511
index.append('Class')
512512
if args.tax_order:
513513
index.append('Order')
514-
if args.tax_family_:
514+
if args.tax_family:
515515
index.append('Family')
516516
if args.genus:
517517
index.append('Genus')

tests/conftest.py

Lines changed: 15 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -70,6 +70,13 @@ def test_output_dir(test_dir):
7070
return dir_path
7171

7272

73+
@pytest.fixture
74+
def fgp_df(test_input_dir):
75+
df_path = test_input_dir / "cazome_data_files/FGP_df"
76+
df = pd.read_table(df_path)
77+
return df
78+
79+
7380
@pytest.fixture
7481
def fam_freq_df(test_input_dir):
7582
df_path = test_input_dir / "cazome_explore/fam_freq_df.csv"
@@ -98,6 +105,14 @@ def built_fam_freq_df(test_input_dir):
98105
return df
99106

100107

108+
@pytest.fixture
109+
def all_families(built_fam_freq_df):
110+
built_fam_freq_df = built_fam_freq_df.drop('Species', axis=1)
111+
built_fam_freq_df = built_fam_freq_df.set_index(['Genome'])
112+
fams = list(built_fam_freq_df.columns)
113+
return fams
114+
115+
101116
# Define fixtures for connection to db
102117

103118

0 commit comments

Comments
 (0)