From 2a3a9ab2f4a921db1c5d69a55bd12b08c9051fb5 Mon Sep 17 00:00:00 2001
From: Amandine PERRIN <amandine.perrin@pasteur.fr>
Date: Thu, 22 Oct 2020 11:53:48 +0200
Subject: [PATCH] Prepare module now returns the output info file

---
 PanACoTA/prepare_module/download_genomes_func.py | 1 -
 PanACoTA/prepare_module/filter_genomes.py        | 4 ++--
 PanACoTA/subcommands/prepare.py                  | 4 +++-
 3 files changed, 5 insertions(+), 4 deletions(-)

diff --git a/PanACoTA/prepare_module/download_genomes_func.py b/PanACoTA/prepare_module/download_genomes_func.py
index e820316c..ffda0958 100644
--- a/PanACoTA/prepare_module/download_genomes_func.py
+++ b/PanACoTA/prepare_module/download_genomes_func.py
@@ -142,7 +142,6 @@ def download_from_refseq(species_linked, NCBI_species, NCBI_taxid, levels, outdi
         logger.error(error_message)
         sys.exit(1)
     nb_gen, db_dir = to_database(outdir)
-    logger.info(f"Downloaded {nb_gen} genomes.")
     return db_dir, nb_gen
 
 
diff --git a/PanACoTA/prepare_module/filter_genomes.py b/PanACoTA/prepare_module/filter_genomes.py
index aa3d7167..b56e9a18 100755
--- a/PanACoTA/prepare_module/filter_genomes.py
+++ b/PanACoTA/prepare_module/filter_genomes.py
@@ -227,7 +227,7 @@ def iterative_mash(sorted_genomes, genomes, outdir, species_linked, min_dist, ma
                    progressbar.Counter(), "/{}".format(nbgen), ' ',
                    progressbar.Timer(), ' - '
                   ]
-        bar = progressbar.ProgressBar(widgets=widgets, max_value=len(to_try), term_width=100).start()
+        bar = progressbar.ProgressBar(widgets=widgets, max_value=len(to_try), term_width=79).start()
         done = 0
 
     while len(to_try) > 1:
@@ -504,4 +504,4 @@ def write_outputfiles(genomes, sorted_genomes, genomes_removed, outdir, gspecies
             disf.write(utils.list_to_str([genome] + info))
     logger.info(f"Final list of genomes in the dataset: {list_file}")
     logger.info(f"List of genomes discarded by minhash steps: {discard_file}")
-    return 0
+    return list_file
diff --git a/PanACoTA/subcommands/prepare.py b/PanACoTA/subcommands/prepare.py
index ebe85ea6..9f4d221b 100644
--- a/PanACoTA/subcommands/prepare.py
+++ b/PanACoTA/subcommands/prepare.py
@@ -266,8 +266,10 @@ def main(cmd, NCBI_species, NCBI_taxid, levels, outdir, tmp_dir, threads, no_ref
     removed = fg.iterative_mash(sorted_genomes, genomes, outdir, species_linked,
                                 min_dist, max_dist, threads, quiet)
     # Write list of genomes kept, and list of genomes discarded by mash step
-    fg.write_outputfiles(genomes, sorted_genomes, removed, outdir, species_linked, min_dist, max_dist)
+    info_file = fg.write_outputfiles(genomes, sorted_genomes, removed, outdir, species_linked,
+                                     min_dist, max_dist)
     logger.info("End")
+    return info_file
 
 
 def build_parser(parser):
-- 
GitLab