From 5e5135693dc49f3d1f6a00d0bdeab695244ad748 Mon Sep 17 00:00:00 2001 From: Cunliang Geng Date: Wed, 27 Nov 2024 15:02:34 +0100 Subject: [PATCH] update bigscape loading process to use the setting bigscape.version --- src/nplinker/loader.py | 22 +++++++++------------- 1 file changed, 9 insertions(+), 13 deletions(-) diff --git a/src/nplinker/loader.py b/src/nplinker/loader.py index 8d2bcd18..7c0e5eaa 100644 --- a/src/nplinker/loader.py +++ b/src/nplinker/loader.py @@ -206,24 +206,20 @@ def _load_genomics(self): all_bgcs_with_strain = antismash_bgcs_with_strain + self.mibig_bgcs # Step 4: load all GCF objects - bigscape_cluster_file = ( - self.config.root_dir - / defaults.BIGSCAPE_DIRNAME - / f"mix_clustering_c{self.config.bigscape.cutoff}.tsv" - ) - bigscape_db_file = self.config.root_dir / defaults.BIGSCAPE_DIRNAME / "data_sqlite.db" - - # switch depending on found file. prefer V1 if both are found - if bigscape_cluster_file.exists(): + if self.config.bigscape.version == 1: + bigscape_cluster_file = ( + self.config.root_dir + / defaults.BIGSCAPE_DIRNAME + / f"mix_clustering_c{self.config.bigscape.cutoff}.tsv" + ) loader = BigscapeGCFLoader(bigscape_cluster_file) logger.info(f"Loading BigSCAPE cluster file {bigscape_cluster_file}") - elif bigscape_db_file.exists(): + elif self.config.bigscape.version == 2: + bigscape_db_file = self.config.root_dir / defaults.BIGSCAPE_DIRNAME / "data_sqlite.db" loader = BigscapeV2GCFLoader(bigscape_db_file) logger.info(f"Loading BigSCAPE database file {bigscape_db_file}") else: - raise FileNotFoundError( - f"Neither BigSCAPE cluster file {bigscape_cluster_file} nor database file {bigscape_db_file} were found." - ) + raise ValueError(f"Unsupported BigScape version: {self.config.bigscape.version}") raw_gcfs = loader.get_gcfs()