From d2dc38bbc8ab6291752196438d0dfe9adec04a81 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 29 May 2024 16:04:48 +0200 Subject: [PATCH 01/55] add BiG-SCAPE 2 to dependencies --- bin/install-nplinker-deps | 11 +++++++++++ 1 file changed, 11 insertions(+) diff --git a/bin/install-nplinker-deps b/bin/install-nplinker-deps index ee8d2eee5..de273575d 100755 --- a/bin/install-nplinker-deps +++ b/bin/install-nplinker-deps @@ -136,6 +136,17 @@ echo "🔥 Start installing BigScape ..." chmod 775 Annotated_MIBiG_reference ln -sf $LIB_PATH/BiG-SCAPE/bigscape.py $PY_PATH/bin cd .. + # blob size limit to remove large files left in history + [[ -d BiG-SCAPE-v2 ]] || git clone -b dev --filter=blob:limit=10m https://github.com/medema-group/BiG-SCAPE.git BiG-SCAPE-v2 + cd BiG-SCAPE-v2 + pip install click + pip install sqlalchemy + pip install pyhmmer + chmod 754 bigscape.py + ln -sf $LIB_PATH/BiG-SCAPE-v2/bigscape.py $PY_PATH/bin/bigscape-v2.py + cd .. + + echo -e "✅ BigScape installed successfully\n" #--- Install FastTree (not support Windows, required by BigScape) From 93848dd2489645f661d3bdd886d6de72828bbb70 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 29 May 2024 16:09:01 +0200 Subject: [PATCH 02/55] add example config for bigscape 2 --- src/nplinker/nplinker_default.toml | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/src/nplinker/nplinker_default.toml b/src/nplinker/nplinker_default.toml index 4d88540a9..733bcd9bc 100644 --- a/src/nplinker/nplinker_default.toml +++ b/src/nplinker/nplinker_default.toml @@ -9,7 +9,12 @@ to_use = true version = "3.1" [bigscape] +verison = 1 parameters = "--mibig --clans-off --mix --include_singletons --cutoffs 0.30" + +# for version 2, use the following parameters string: +# parameters = "cluster --mibig_version 3.1 --include_singletons --gcf_cutoffs 0.30" + cutoff = "0.30" [scoring] From 9d0a2d0f60b3dec8ed0c9f71cb33e1d5f7337541 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 29 May 2024 16:09:12 +0200 Subject: 
[PATCH 03/55] implement running BiG-SCAPE --- src/nplinker/arranger.py | 1 + src/nplinker/genomics/bigscape/runbigscape.py | 26 ++++++++++++++++--- 2 files changed, 23 insertions(+), 4 deletions(-) diff --git a/src/nplinker/arranger.py b/src/nplinker/arranger.py index 97a57b283..129104024 100644 --- a/src/nplinker/arranger.py +++ b/src/nplinker/arranger.py @@ -267,6 +267,7 @@ def _run_bigscape(self) -> None: defaults.ANTISMASH_DEFAULT_PATH, defaults.BIGSCAPE_RUNNING_OUTPUT_PATH, config.bigscape.parameters, + config.bigscape.version, ) for f in glob( str( diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index 2e10ba10f..351e40244 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -15,8 +15,14 @@ def run_bigscape( antismash_path: str | PathLike, output_path: str | PathLike, extra_params: str, + version: int = 1, ): - bigscape_py_path = "bigscape.py" + # switch to correct version of BiG-SCAPE + if version == 1: + bigscape_py_path = "bigscape.py" + elif version == 2: + bigscape_py_path = "bigscape-v2.py" + logger.info( f'run_bigscape: input="{antismash_path}", output="{output_path}", extra_params={extra_params}"' ) @@ -24,13 +30,25 @@ def run_bigscape( try: subprocess.run([bigscape_py_path, "-h"], capture_output=True, check=True) except Exception as e: - raise Exception(f"Failed to find/run bigscape.py (path={bigscape_py_path}, err={e})") from e + raise Exception( + f"Failed to find/run bigscape.py (path={bigscape_py_path}, err={e})" + ) from e if not os.path.exists(antismash_path): raise Exception(f'antismash_path "{antismash_path}" does not exist!') - # configure the IO-related parameters, including pfam_dir - args = [bigscape_py_path, "-i", antismash_path, "-o", output_path, "--pfam_dir", PFAM_PATH] + # assemble arguments. 
first argument is the python file + args = [bigscape_py_path] + + # version 2 points to specific Pfam file, version 1 points to directory + # version 2 also requires the cluster subcommand + if version == 1: + args.extend(["--pfam_dir", PFAM_PATH]) + elif version == 2: + args.extend(["cluster", "--pfam_path", PFAM_PATH + "/Pfam-A.hmm"]) + + # add input and output paths. these are unchanged + args.extend(["-i", antismash_path, "-o", output_path]) # append the user supplied params, if any if len(extra_params) > 0: From 6d40414132273b60c8a68c9029de3547acc1d98e Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Fri, 31 May 2024 15:27:20 +0200 Subject: [PATCH 04/55] fix bigscape2 dependency --- bin/install-nplinker-deps | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/bin/install-nplinker-deps b/bin/install-nplinker-deps index de273575d..4de3524fa 100755 --- a/bin/install-nplinker-deps +++ b/bin/install-nplinker-deps @@ -125,6 +125,7 @@ pip install -q -U pip setuptools echo "🔥 Start installing BigScape ..." [[ -d BiG-SCAPE ]] || git clone https://github.com/medema-group/BiG-SCAPE.git cd BiG-SCAPE + git reset --hard git config --add advice.detachedHead false # disable advice git config pull.ff only git checkout master @@ -139,11 +140,15 @@ echo "🔥 Start installing BigScape ..." 
# blob size limit to remove large files left in history [[ -d BiG-SCAPE-v2 ]] || git clone -b dev --filter=blob:limit=10m https://github.com/medema-group/BiG-SCAPE.git BiG-SCAPE-v2 cd BiG-SCAPE-v2 + git config --ad advice.detatchedHead false + git checkout dfb0d78427e020aab2c72cc741327ccd102470a1 # specific commit that includes important fixes to v2 pip install click pip install sqlalchemy pip install pyhmmer chmod 754 bigscape.py ln -sf $LIB_PATH/BiG-SCAPE-v2/bigscape.py $PY_PATH/bin/bigscape-v2.py + ln -sf $LIB_PATH/BiG-SCAPE-v2/config.ini $PY_PATH/bin # new system of configuration needs default config file + ln -sf $LIB_PATH/BiG-SCAPE-v2/big_scape $PY_PATH/bin # folder is needed for some files cd .. From 02bc843dd0288b8cd4b85b2fee4d0abc21c112aa Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Fri, 31 May 2024 15:31:43 +0200 Subject: [PATCH 05/55] copy db file properly --- src/nplinker/arranger.py | 32 ++++++++++++++++++++++---------- 1 file changed, 22 insertions(+), 10 deletions(-) diff --git a/src/nplinker/arranger.py b/src/nplinker/arranger.py index 129104024..f64f6af16 100644 --- a/src/nplinker/arranger.py +++ b/src/nplinker/arranger.py @@ -263,22 +263,34 @@ def _run_bigscape(self) -> None: default BiG-SCAPE directory. 
""" defaults.BIGSCAPE_RUNNING_OUTPUT_PATH.mkdir(exist_ok=True, parents=True) + + version = config.bigscape.version + run_bigscape( defaults.ANTISMASH_DEFAULT_PATH, defaults.BIGSCAPE_RUNNING_OUTPUT_PATH, config.bigscape.parameters, - config.bigscape.version, + version, ) - for f in glob( - str( - defaults.BIGSCAPE_RUNNING_OUTPUT_PATH - / "network_files" - / "*" - / "mix" - / "mix_clustering_c*.tsv" + + if version == 1: + for f in glob( + str( + defaults.BIGSCAPE_RUNNING_OUTPUT_PATH + / "network_files" + / "*" + / "mix" + / "mix_clustering_c*.tsv" + ) + ): + shutil.copy(f, defaults.BIGSCAPE_DEFAULT_PATH) + elif version == 2: + shutil.copy( + defaults.BIGSCAPE_RUNNING_OUTPUT_PATH / "data_sqlite.db", + defaults.BIGSCAPE_DEFAULT_PATH, ) - ): - shutil.copy(f, defaults.BIGSCAPE_DEFAULT_PATH) + else: + raise ValueError(f"Invalid BiG-SCAPE version: {version}") def arrange_strain_mappings(self) -> None: """Arrange the strain mappings file. From 2351055d107ef140c1024b09739450f1d650153d Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Fri, 31 May 2024 15:31:53 +0200 Subject: [PATCH 06/55] remove cluster arg --- src/nplinker/nplinker_default.toml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/nplinker/nplinker_default.toml b/src/nplinker/nplinker_default.toml index 733bcd9bc..31b97b664 100644 --- a/src/nplinker/nplinker_default.toml +++ b/src/nplinker/nplinker_default.toml @@ -13,7 +13,7 @@ verison = 1 parameters = "--mibig --clans-off --mix --include_singletons --cutoffs 0.30" # for version 2, use the following parameters string: -# parameters = "cluster --mibig_version 3.1 --include_singletons --gcf_cutoffs 0.30" +# parameters = "--mibig_version 3.1 --include_singletons --gcf_cutoffs 0.30" cutoff = "0.30" From 1b43a317c348365e36750573d398750b8da8ce4b Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Fri, 31 May 2024 15:54:45 +0200 Subject: [PATCH 07/55] run ruff formatter --- src/nplinker/arranger.py | 4 +++- 
src/nplinker/genomics/bigscape/runbigscape.py | 4 +--- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/src/nplinker/arranger.py b/src/nplinker/arranger.py index f64f6af16..e02d8eac4 100644 --- a/src/nplinker/arranger.py +++ b/src/nplinker/arranger.py @@ -332,7 +332,9 @@ def _validate_strain_mappings(self) -> None: def _generate_strain_mappings(self) -> None: """Generate the strain mappings file for the PODP mode.""" - podp_json_file = defaults.DOWNLOADS_DEFAULT_PATH / f"paired_datarecord_{config.podp_id}.json" + podp_json_file = ( + defaults.DOWNLOADS_DEFAULT_PATH / f"paired_datarecord_{config.podp_id}.json" + ) genome_status_json_file = defaults.DOWNLOADS_DEFAULT_PATH / GENOME_STATUS_FILENAME genome_bgc_mappings_file = defaults.ANTISMASH_DEFAULT_PATH / GENOME_BGC_MAPPINGS_FILENAME gnps_file_mapping_file = self.gnps_file_mappings_file diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index 351e40244..2c114c089 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -30,9 +30,7 @@ def run_bigscape( try: subprocess.run([bigscape_py_path, "-h"], capture_output=True, check=True) except Exception as e: - raise Exception( - f"Failed to find/run bigscape.py (path={bigscape_py_path}, err={e})" - ) from e + raise Exception(f"Failed to find/run bigscape.py (path={bigscape_py_path}, err={e})") from e if not os.path.exists(antismash_path): raise Exception(f'antismash_path "{antismash_path}" does not exist!') From eb28d388c21f552748c7cb54995118d3ea1e140b Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Fri, 31 May 2024 15:58:02 +0200 Subject: [PATCH 08/55] fix ruff check issues --- src/nplinker/genomics/bigscape/runbigscape.py | 10 +++++++++- 1 file changed, 9 insertions(+), 1 deletion(-) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index 2c114c089..2cd2caab4 100644 --- 
a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -17,6 +17,12 @@ def run_bigscape( extra_params: str, version: int = 1, ): + """Runs BiG-SCAPE to cluster BGCs. + + The behavior of this function is slightly different depending on the version of + BiG-SCAPE that is set to run using the configuration file. + Mostly this means a different set of parameters is used between the two versions. + """ # switch to correct version of BiG-SCAPE if version == 1: bigscape_py_path = "bigscape.py" @@ -30,7 +36,9 @@ def run_bigscape( try: subprocess.run([bigscape_py_path, "-h"], capture_output=True, check=True) except Exception as e: - raise Exception(f"Failed to find/run bigscape.py (path={bigscape_py_path}, err={e})") from e + raise Exception( + f"Failed to find/run bigscape.py (path={bigscape_py_path}, err={e})" + ) from e if not os.path.exists(antismash_path): raise Exception(f'antismash_path "{antismash_path}" does not exist!') From 9293c646f505142d4870bbd9604377edf3800b19 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Mon, 3 Jun 2024 11:34:11 +0200 Subject: [PATCH 09/55] ensure str for mypy static type checking --- src/nplinker/genomics/bigscape/runbigscape.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index 2cd2caab4..c72f51e65 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -54,7 +54,7 @@ def run_bigscape( args.extend(["cluster", "--pfam_path", PFAM_PATH + "/Pfam-A.hmm"]) # add input and output paths. 
these are unchanged - args.extend(["-i", antismash_path, "-o", output_path]) + args.extend(["-i", str(antismash_path), "-o", str(output_path)]) # append the user supplied params, if any if len(extra_params) > 0: From 4a0e86b2f08ee4328e93254d44c3d58b8cdb6b1d Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Fri, 7 Jun 2024 09:40:51 +0200 Subject: [PATCH 10/55] Move configuration to correct file --- src/nplinker/data/nplinker.toml | 5 +++++ src/nplinker/nplinker_default.toml | 3 --- 2 files changed, 5 insertions(+), 3 deletions(-) diff --git a/src/nplinker/data/nplinker.toml b/src/nplinker/data/nplinker.toml index e02094186..15b002498 100644 --- a/src/nplinker/data/nplinker.toml +++ b/src/nplinker/data/nplinker.toml @@ -43,6 +43,9 @@ version = "3.1" [bigscape] # The parameters to use for running BiG-SCAPE. +# Version of BiG-SCAPE to run. Make sure to change the parameters property below as well +# when changing versions. +version = 1 # Required bigscape parameters are `--mix`, `--include_singletons` and `--cutoffs`. NPLinker needs # them to run the analysis properly. # Parameters that must NOT exist: `--inputdir`, `--outputdir`, `--pfam_dir`. NPLinker will @@ -51,6 +54,8 @@ version = "3.1" # `mibig.version` to the version of mibig in bigscape. # The default value is "--mibig --clans-off --mix --include_singletons --cutoffs 0.30". parameters = "--mibig --clans-off --mix --include_singletons --cutoffs 0.30" +# for version 2, use the following parameters string: +# parameters = "--mibig_version 3.1 --include_singletons --gcf_cutoffs 0.30" # Which bigscape cutoff to use for NPLinker analysis. # There might be multiple cutoffs in bigscape output. # Note that this value must be a string. 
diff --git a/src/nplinker/nplinker_default.toml b/src/nplinker/nplinker_default.toml index 31b97b664..4d1224f11 100644 --- a/src/nplinker/nplinker_default.toml +++ b/src/nplinker/nplinker_default.toml @@ -12,9 +12,6 @@ version = "3.1" verison = 1 parameters = "--mibig --clans-off --mix --include_singletons --cutoffs 0.30" -# for version 2, use the following parameters string: -# parameters = "--mibig_version 3.1 --include_singletons --gcf_cutoffs 0.30" - cutoff = "0.30" [scoring] From 7361a983961bfb84e7ca474498c3a383b47b9e69 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Fri, 7 Jun 2024 09:42:48 +0200 Subject: [PATCH 11/55] use os.path.join instead of string concat --- src/nplinker/genomics/bigscape/runbigscape.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index c72f51e65..e3647ca18 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -51,7 +51,7 @@ def run_bigscape( if version == 1: args.extend(["--pfam_dir", PFAM_PATH]) elif version == 2: - args.extend(["cluster", "--pfam_path", PFAM_PATH + "/Pfam-A.hmm"]) + args.extend(["cluster", "--pfam_path", os.path.join(PFAM_PATH, "Pfam-A.hmm")]) # add input and output paths. these are unchanged args.extend(["-i", str(antismash_path), "-o", str(output_path)]) From a329e4396372c1e4dabb968730731f1d9b3ac47c Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Fri, 7 Jun 2024 09:49:25 +0200 Subject: [PATCH 12/55] fix merge mistake --- src/nplinker/arranger.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/nplinker/arranger.py b/src/nplinker/arranger.py index 0d3e8656b..cf304e0ae 100644 --- a/src/nplinker/arranger.py +++ b/src/nplinker/arranger.py @@ -281,7 +281,7 @@ def _run_bigscape(self) -> None: The clustering file "mix_clustering_c{self.config.bigscape.cutoff}.tsv" will be copied to the default BiG-SCAPE directory. 
""" - defaults.BIGSCAPE_RUNNING_OUTPUT_PATH.mkdir(exist_ok=True, parents=True) + self.bigscape_running_output_dir.mkdir(exist_ok=True, parents=True) version = self.config.bigscape.version From caf27116c6a91fd1bf2ad7d407ba890178825f4e Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Fri, 14 Jun 2024 13:25:00 +0200 Subject: [PATCH 13/55] remove extra bigscape 2 files --- bin/install-nplinker-deps | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/bin/install-nplinker-deps b/bin/install-nplinker-deps index 4de3524fa..ba070270d 100755 --- a/bin/install-nplinker-deps +++ b/bin/install-nplinker-deps @@ -141,14 +141,12 @@ echo "🔥 Start installing BigScape ..." [[ -d BiG-SCAPE-v2 ]] || git clone -b dev --filter=blob:limit=10m https://github.com/medema-group/BiG-SCAPE.git BiG-SCAPE-v2 cd BiG-SCAPE-v2 git config --ad advice.detatchedHead false - git checkout dfb0d78427e020aab2c72cc741327ccd102470a1 # specific commit that includes important fixes to v2 + git checkout 99a4c2e4923bb50e175b2e619c2cee0a14918789 # Commits on Jun 14, 2024 pip install click pip install sqlalchemy pip install pyhmmer chmod 754 bigscape.py ln -sf $LIB_PATH/BiG-SCAPE-v2/bigscape.py $PY_PATH/bin/bigscape-v2.py - ln -sf $LIB_PATH/BiG-SCAPE-v2/config.ini $PY_PATH/bin # new system of configuration needs default config file - ln -sf $LIB_PATH/BiG-SCAPE-v2/big_scape $PY_PATH/bin # folder is needed for some files cd .. From 525c707e81406037f00644438a3a7bc9cbc8fbc2 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Fri, 14 Jun 2024 13:25:06 +0200 Subject: [PATCH 14/55] add missing library --- bin/install-nplinker-deps | 1 + 1 file changed, 1 insertion(+) diff --git a/bin/install-nplinker-deps b/bin/install-nplinker-deps index ba070270d..98b362aa4 100755 --- a/bin/install-nplinker-deps +++ b/bin/install-nplinker-deps @@ -145,6 +145,7 @@ echo "🔥 Start installing BigScape ..." 
pip install click pip install sqlalchemy pip install pyhmmer + pip install tqdm chmod 754 bigscape.py ln -sf $LIB_PATH/BiG-SCAPE-v2/bigscape.py $PY_PATH/bin/bigscape-v2.py cd .. From 2433d76b073d55c8fd7586935042b63e7d130d2f Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Fri, 14 Jun 2024 13:49:57 +0200 Subject: [PATCH 15/55] add validator for bigscape version --- src/nplinker/config.py | 1 + 1 file changed, 1 insertion(+) diff --git a/src/nplinker/config.py b/src/nplinker/config.py index 5e734ff50..ff5c3fef1 100644 --- a/src/nplinker/config.py +++ b/src/nplinker/config.py @@ -70,6 +70,7 @@ def load_config(config_file: str | PathLike) -> Dynaconf: # BigScape Validator("bigscape.parameters", required=True, is_type_of=str), Validator("bigscape.cutoff", required=True, is_type_of=str), + Validator("bigscape.version", required=True, is_type_of=int), # Scoring ## `scoring.methods` must be a list of strings and must contain at least one of the ## supported scoring methods. From 84472729fc5fe671b8fdb1588bef9b7d6845cae2 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Fri, 14 Jun 2024 13:50:04 +0200 Subject: [PATCH 16/55] add test for bigscape version --- tests/unit/test_config.py | 1 + 1 file changed, 1 insertion(+) diff --git a/tests/unit/test_config.py b/tests/unit/test_config.py index f681cc928..37a6ebcb2 100644 --- a/tests/unit/test_config.py +++ b/tests/unit/test_config.py @@ -25,5 +25,6 @@ def test_config(tmp_path): == "--mibig --clans-off --mix --include_singletons --cutoffs 0.30" ) assert config.bigscape.cutoff == "0.30" + assert config.bigscape.version == 1 assert config.scoring.methods == ["metcalf"] From f6330e974efb1666576967eae402fec8e12e8ab5 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Fri, 14 Jun 2024 13:50:08 +0200 Subject: [PATCH 17/55] fix typo --- src/nplinker/nplinker_default.toml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/nplinker/nplinker_default.toml b/src/nplinker/nplinker_default.toml index 4d1224f11..037895bc4 
100644 --- a/src/nplinker/nplinker_default.toml +++ b/src/nplinker/nplinker_default.toml @@ -9,7 +9,7 @@ to_use = true version = "3.1" [bigscape] -verison = 1 +version = 1 parameters = "--mibig --clans-off --mix --include_singletons --cutoffs 0.30" cutoff = "0.30" From 84095b74a6d07c06b0a96582f8fd64365491ce36 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 19 Jun 2024 11:32:41 +0200 Subject: [PATCH 18/55] add simple run testing --- tests/unit/genomics/test_runbigscape.py | 24 ++++++++++++++++++++++++ 1 file changed, 24 insertions(+) create mode 100644 tests/unit/genomics/test_runbigscape.py diff --git a/tests/unit/genomics/test_runbigscape.py b/tests/unit/genomics/test_runbigscape.py new file mode 100644 index 000000000..9f710e926 --- /dev/null +++ b/tests/unit/genomics/test_runbigscape.py @@ -0,0 +1,24 @@ +from nplinker.genomics.bigscape.runbigscape import run_bigscape +from .. import DATA_DIR + + +class TestRunBigscape: + def test_run_bigscape_v1(self, tmp_path): + result = run_bigscape( + antismash_path=DATA_DIR, + output_path=tmp_path, + extra_params="--help", + version=1, + ) + + assert result is True + + def test_run_bigscape_v2(self, tmp_path): + result = run_bigscape( + antismash_path=DATA_DIR, + output_path=tmp_path, + extra_params="--help", + version=2, + ) + + assert result is True From 21b46008adb538a6151622877698d6f6008ec557 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 19 Jun 2024 11:48:43 +0200 Subject: [PATCH 19/55] add test to check for nonextent input path --- tests/unit/genomics/test_runbigscape.py | 12 ++++++++++++ 1 file changed, 12 insertions(+) diff --git a/tests/unit/genomics/test_runbigscape.py b/tests/unit/genomics/test_runbigscape.py index 9f710e926..2705df33b 100644 --- a/tests/unit/genomics/test_runbigscape.py +++ b/tests/unit/genomics/test_runbigscape.py @@ -1,3 +1,4 @@ +import pytest from nplinker.genomics.bigscape.runbigscape import run_bigscape from .. 
import DATA_DIR @@ -22,3 +23,14 @@ def test_run_bigscape_v2(self, tmp_path): ) assert result is True + + def test_input_path_not_exist(self, tmp_path): + with pytest.raises(Exception) as e: + run_bigscape( + antismash_path=tmp_path / "not_exist", + output_path=tmp_path, + extra_params="", + version=1, + ) + + assert "antismash_path" in e.value.args[0] From a2b6eb87c24af9bf902a465c5b11d7efe7a96e2f Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Mon, 15 Jul 2024 12:16:17 +0200 Subject: [PATCH 20/55] add info to docstring --- src/nplinker/genomics/bigscape/runbigscape.py | 18 +++++++++++++++++- 1 file changed, 17 insertions(+), 1 deletion(-) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index e3647ca18..a26e18ad8 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -16,12 +16,28 @@ def run_bigscape( output_path: str | PathLike, extra_params: str, version: int = 1, -): +) -> bool: """Runs BiG-SCAPE to cluster BGCs. The behavior of this function is slightly different depending on the version of BiG-SCAPE that is set to run using the configuration file. Mostly this means a different set of parameters is used between the two versions. + + The AntiSMASH output directory should be a directory that contains GBK files. + The directory can contain subdirectories, in which case BiG-SCAPE will search + recursively for GBK files. + + By default, only GBK Files with "cluster" or "region" in the filename are + accepted. GBK Files with "final" in the filename are excluded. + + Args: + antismash_path: Path to the antismash output directory. + output_path: Path to the output directory where BiG-SCAPE will write its results. + extra_params: Additional parameters to pass to BiG-SCAPE. + version: The version of BiG-SCAPE to run. Can be 1 or 2. + + Returns: + True if BiG-SCAPE ran successfully, False otherwise. 
""" # switch to correct version of BiG-SCAPE if version == 1: From c03f64ab5d68c72451ba4e3cf83474ef2699dd97 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Mon, 15 Jul 2024 12:38:00 +0200 Subject: [PATCH 21/55] add exception on invalid version number --- src/nplinker/genomics/bigscape/runbigscape.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index a26e18ad8..8528c44a6 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -44,6 +44,8 @@ def run_bigscape( bigscape_py_path = "bigscape.py" elif version == 2: bigscape_py_path = "bigscape-v2.py" + else: + raise ValueError("Unexpected BiG-SCAPE version number specified") logger.info( f'run_bigscape: input="{antismash_path}", output="{output_path}", extra_params={extra_params}"' From 9e9758e450919949928478fa7bf66c457fc73bb3 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Mon, 15 Jul 2024 12:55:14 +0200 Subject: [PATCH 22/55] move log to after validation --- src/nplinker/genomics/bigscape/runbigscape.py | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index 8528c44a6..740c76c40 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -47,10 +47,6 @@ def run_bigscape( else: raise ValueError("Unexpected BiG-SCAPE version number specified") - logger.info( - f'run_bigscape: input="{antismash_path}", output="{output_path}", extra_params={extra_params}"' - ) - try: subprocess.run([bigscape_py_path, "-h"], capture_output=True, check=True) except Exception as e: @@ -61,6 +57,11 @@ def run_bigscape( if not os.path.exists(antismash_path): raise Exception(f'antismash_path "{antismash_path}" does not exist!') + + logger.info( + f'run_bigscape: input="{antismash_path}", output="{output_path}", 
extra_params={extra_params}"' + ) + # assemble arguments. first argument is the python file args = [bigscape_py_path] From 9e8c7678ea8dcd6369ad1aec8f47fd1601e99320 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Mon, 15 Jul 2024 12:55:19 +0200 Subject: [PATCH 23/55] add version info to log --- src/nplinker/genomics/bigscape/runbigscape.py | 1 + 1 file changed, 1 insertion(+) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index 740c76c40..bc17bd652 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -58,6 +58,7 @@ def run_bigscape( raise Exception(f'antismash_path "{antismash_path}" does not exist!') + logger.info(f"Running BiG-SCAPE version {version}") logger.info( f'run_bigscape: input="{antismash_path}", output="{output_path}", extra_params={extra_params}"' ) From e9f734599664d20ba6b83f2ce7263cc7ab7fa62c Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Mon, 15 Jul 2024 12:55:52 +0200 Subject: [PATCH 24/55] use specific exception --- src/nplinker/genomics/bigscape/runbigscape.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index bc17bd652..ee63e9a05 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -50,12 +50,12 @@ def run_bigscape( try: subprocess.run([bigscape_py_path, "-h"], capture_output=True, check=True) except Exception as e: - raise Exception( + raise FileNotFoundError( f"Failed to find/run bigscape.py (path={bigscape_py_path}, err={e})" ) from e if not os.path.exists(antismash_path): - raise Exception(f'antismash_path "{antismash_path}" does not exist!') + raise FileNotFoundError(f'antismash_path "{antismash_path}" does not exist!') logger.info(f"Running BiG-SCAPE version {version}") From 775cbf5a1b255b8d1ab865682d74b4851e624c6c Mon Sep 17 00:00:00 
2001 From: Arjan Draisma Date: Mon, 15 Jul 2024 13:07:08 +0200 Subject: [PATCH 25/55] rework return codes and exceptions --- src/nplinker/genomics/bigscape/runbigscape.py | 14 +++++++++----- 1 file changed, 9 insertions(+), 5 deletions(-) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index ee63e9a05..3c2a764a2 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -83,9 +83,13 @@ def run_bigscape( logger.info(f"BiG-SCAPE command: {args}") result = subprocess.run(args, stdout=sys.stdout, stderr=sys.stderr, check=True) logger.info(f"BiG-SCAPE completed with return code {result.returncode}") - # use subprocess.CompletedProcess.check_returncode() to test if the BiG-SCAPE - # process exited successfully. This throws an exception for non-zero returncodes - # which will indicate to the PODPDownloader module that something went wrong. - result.check_returncode() - return True + # return true on any non-error return code + if result.returncode == 0: + return True + + # otherwise log details and raise a runtime error + logger.error(f"BiG-SCAPE failed with return code {result.returncode}") + logger.error(f"output: {result.stdout}") + + raise RuntimeError(f"Failed to run BiG-SCAPE with error code {result.returncode}") From 874ea3a34b53623d047d9cc4cbed99bdd031ff94 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Tue, 16 Jul 2024 12:15:18 +0200 Subject: [PATCH 26/55] add wrong version test --- tests/unit/genomics/test_runbigscape.py | 11 +++++++++++ 1 file changed, 11 insertions(+) diff --git a/tests/unit/genomics/test_runbigscape.py b/tests/unit/genomics/test_runbigscape.py index 2705df33b..6a0c6f0e1 100644 --- a/tests/unit/genomics/test_runbigscape.py +++ b/tests/unit/genomics/test_runbigscape.py @@ -24,6 +24,17 @@ def test_run_bigscape_v2(self, tmp_path): assert result is True + def test_run_bigscape_wrong_version(self, tmp_path): + with 
pytest.raises(Exception) as e: + run_bigscape( + antismash_path=DATA_DIR, + output_path=tmp_path, + extra_params="--help", + version=3, + ) + + assert "version" in e.value.args[0] + def test_input_path_not_exist(self, tmp_path): with pytest.raises(Exception) as e: run_bigscape( From bd699dec27a2dc3370a4eb0e13d6217284a4af26 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Tue, 16 Jul 2024 12:16:42 +0200 Subject: [PATCH 27/55] add invalid path test for v2 --- nplinker.toml | 18 ++++++++++++++++++ tests/unit/genomics/test_runbigscape.py | 13 ++++++++++++- 2 files changed, 30 insertions(+), 1 deletion(-) create mode 100644 nplinker.toml diff --git a/nplinker.toml b/nplinker.toml new file mode 100644 index 000000000..037895bc4 --- /dev/null +++ b/nplinker.toml @@ -0,0 +1,18 @@ +# NPLinker default configurations + +[log] +level = "INFO" +use_console = true + +[mibig] +to_use = true +version = "3.1" + +[bigscape] +version = 1 +parameters = "--mibig --clans-off --mix --include_singletons --cutoffs 0.30" + +cutoff = "0.30" + +[scoring] +methods = ["metcalf"] diff --git a/tests/unit/genomics/test_runbigscape.py b/tests/unit/genomics/test_runbigscape.py index 6a0c6f0e1..274a9785d 100644 --- a/tests/unit/genomics/test_runbigscape.py +++ b/tests/unit/genomics/test_runbigscape.py @@ -35,7 +35,7 @@ def test_run_bigscape_wrong_version(self, tmp_path): assert "version" in e.value.args[0] - def test_input_path_not_exist(self, tmp_path): + def test_input_path_not_exist_v1(self, tmp_path): with pytest.raises(Exception) as e: run_bigscape( antismash_path=tmp_path / "not_exist", @@ -45,3 +45,14 @@ def test_input_path_not_exist(self, tmp_path): ) assert "antismash_path" in e.value.args[0] + + def test_input_path_not_exist_v2(self, tmp_path): + with pytest.raises(Exception) as e: + run_bigscape( + antismash_path=tmp_path / "not_exist", + output_path=tmp_path, + extra_params="", + version=2, + ) + + assert "antismash_path" in e.value.args[0] From 3189999df0c23eadda0a9c108dee10bef13132ab 
Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Tue, 16 Jul 2024 12:17:04 +0200 Subject: [PATCH 28/55] specify exception --- tests/unit/genomics/test_runbigscape.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/tests/unit/genomics/test_runbigscape.py b/tests/unit/genomics/test_runbigscape.py index 274a9785d..4ba759141 100644 --- a/tests/unit/genomics/test_runbigscape.py +++ b/tests/unit/genomics/test_runbigscape.py @@ -36,7 +36,7 @@ def test_run_bigscape_wrong_version(self, tmp_path): assert "version" in e.value.args[0] def test_input_path_not_exist_v1(self, tmp_path): - with pytest.raises(Exception) as e: + with pytest.raises(FileNotFoundError) as e: run_bigscape( antismash_path=tmp_path / "not_exist", output_path=tmp_path, @@ -47,7 +47,7 @@ def test_input_path_not_exist_v1(self, tmp_path): assert "antismash_path" in e.value.args[0] def test_input_path_not_exist_v2(self, tmp_path): - with pytest.raises(Exception) as e: + with pytest.raises(FileNotFoundError) as e: run_bigscape( antismash_path=tmp_path / "not_exist", output_path=tmp_path, From 19e72f202fc18165a8c151655d41827bf4adf243 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Tue, 16 Jul 2024 12:31:22 +0200 Subject: [PATCH 29/55] fix tests not correctly running --- tests/unit/genomics/test_runbigscape.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/tests/unit/genomics/test_runbigscape.py b/tests/unit/genomics/test_runbigscape.py index 4ba759141..d5466f028 100644 --- a/tests/unit/genomics/test_runbigscape.py +++ b/tests/unit/genomics/test_runbigscape.py @@ -33,7 +33,7 @@ def test_run_bigscape_wrong_version(self, tmp_path): version=3, ) - assert "version" in e.value.args[0] + assert "version" in e.value.args[0] def test_input_path_not_exist_v1(self, tmp_path): with pytest.raises(FileNotFoundError) as e: @@ -44,7 +44,7 @@ def test_input_path_not_exist_v1(self, tmp_path): version=1, ) - assert "antismash_path" in e.value.args[0] + assert "antismash_path" in 
e.value.args[0] def test_input_path_not_exist_v2(self, tmp_path): with pytest.raises(FileNotFoundError) as e: @@ -55,4 +55,4 @@ def test_input_path_not_exist_v2(self, tmp_path): version=2, ) - assert "antismash_path" in e.value.args[0] + assert "antismash_path" in e.value.args[0] From a9c9cec0acfa0b64d5f9161deb84b086de2772f2 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Tue, 16 Jul 2024 12:33:35 +0200 Subject: [PATCH 30/55] change imports to reflect style in other tests --- tests/unit/genomics/test_runbigscape.py | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/tests/unit/genomics/test_runbigscape.py b/tests/unit/genomics/test_runbigscape.py index d5466f028..12646f2bd 100644 --- a/tests/unit/genomics/test_runbigscape.py +++ b/tests/unit/genomics/test_runbigscape.py @@ -1,11 +1,11 @@ import pytest -from nplinker.genomics.bigscape.runbigscape import run_bigscape +from nplinker.genomics import bigscape from .. import DATA_DIR class TestRunBigscape: def test_run_bigscape_v1(self, tmp_path): - result = run_bigscape( + result = bigscape.run_bigscape( antismash_path=DATA_DIR, output_path=tmp_path, extra_params="--help", @@ -15,7 +15,7 @@ def test_run_bigscape_v1(self, tmp_path): assert result is True def test_run_bigscape_v2(self, tmp_path): - result = run_bigscape( + result = bigscape.run_bigscape( antismash_path=DATA_DIR, output_path=tmp_path, extra_params="--help", @@ -26,7 +26,7 @@ def test_run_bigscape_v2(self, tmp_path): def test_run_bigscape_wrong_version(self, tmp_path): with pytest.raises(Exception) as e: - run_bigscape( + bigscape.run_bigscape( antismash_path=DATA_DIR, output_path=tmp_path, extra_params="--help", @@ -37,7 +37,7 @@ def test_run_bigscape_wrong_version(self, tmp_path): def test_input_path_not_exist_v1(self, tmp_path): with pytest.raises(FileNotFoundError) as e: - run_bigscape( + bigscape.run_bigscape( antismash_path=tmp_path / "not_exist", output_path=tmp_path, extra_params="", @@ -48,7 +48,7 @@ def 
test_input_path_not_exist_v1(self, tmp_path): def test_input_path_not_exist_v2(self, tmp_path): with pytest.raises(FileNotFoundError) as e: - run_bigscape( + bigscape.run_bigscape( antismash_path=tmp_path / "not_exist", output_path=tmp_path, extra_params="", From 2164f6cb06bce8436a4364c14197d72fef3d2d06 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Tue, 16 Jul 2024 12:33:45 +0200 Subject: [PATCH 31/55] specify exception type --- tests/unit/genomics/test_runbigscape.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/unit/genomics/test_runbigscape.py b/tests/unit/genomics/test_runbigscape.py index 12646f2bd..8fefa1c78 100644 --- a/tests/unit/genomics/test_runbigscape.py +++ b/tests/unit/genomics/test_runbigscape.py @@ -25,7 +25,7 @@ def test_run_bigscape_v2(self, tmp_path): assert result is True def test_run_bigscape_wrong_version(self, tmp_path): - with pytest.raises(Exception) as e: + with pytest.raises(ValueError) as e: bigscape.run_bigscape( antismash_path=DATA_DIR, output_path=tmp_path, From 92578fdbfebf4e7a33dc555b5ef20db2db5b221e Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Tue, 16 Jul 2024 12:42:08 +0200 Subject: [PATCH 32/55] add minimal test data --- .../JK1_GCF_00/BGC0001596.region001.gbk | 2043 +++++++++ .../JK1_GCF_00/JCM_4504.region33.gbk | 1730 ++++++++ .../JK1_GCF_01/JCM_4529.region35.gbk | 1627 +++++++ .../JK1_GCF_01/JK1.region01.gbk | 3887 +++++++++++++++++ 4 files changed, 9287 insertions(+) create mode 100755 tests/unit/data/bigscape/minimal_dataset/JK1_GCF_00/BGC0001596.region001.gbk create mode 100755 tests/unit/data/bigscape/minimal_dataset/JK1_GCF_00/JCM_4504.region33.gbk create mode 100755 tests/unit/data/bigscape/minimal_dataset/JK1_GCF_01/JCM_4529.region35.gbk create mode 100755 tests/unit/data/bigscape/minimal_dataset/JK1_GCF_01/JK1.region01.gbk diff --git a/tests/unit/data/bigscape/minimal_dataset/JK1_GCF_00/BGC0001596.region001.gbk 
b/tests/unit/data/bigscape/minimal_dataset/JK1_GCF_00/BGC0001596.region001.gbk new file mode 100755 index 000000000..ce0e4e4e6 --- /dev/null +++ b/tests/unit/data/bigscape/minimal_dataset/JK1_GCF_00/BGC0001596.region001.gbk @@ -0,0 +1,2043 @@ +LOCUS BGC0001596 46688 bp DNA linear CON 11-APR-2022 +DEFINITION Streptomyces albus strain DSM 41398 chromosome, complete genome. +ACCESSION BGC0001596 +VERSION BGC0001596 +KEYWORDS . +SOURCE Streptomyces albus + ORGANISM Streptomyces albus + Bacteria; Actinobacteria; Streptomycetales; Streptomycetaceae; + Streptomyces. +COMMENT REFSEQ INFORMATION: The reference sequence is identical to + CP010519.1. + The annotation was added by the NCBI Prokaryotic Genome Annotation + Pipeline (PGAP). Information about PGAP can be found here: + https://www.ncbi.nlm.nih.gov/genome/annotation_prok/ + COMPLETENESS: full length. + ##antiSMASH-Data-START## + Version :: 6.2.0-924c3663(changed) + Run date :: 2022-11-08 02:46:11 + NOTE: This is a single region extracted from a larger record! + Orig. start :: 0 + Orig. end :: 46688 + ##antiSMASH-Data-END## +FEATURES Location/Qualifiers + CDS 1..468 + /codon_start=1 + /inference="COORDINATES: protein motif:HMM:NF024970.2" + /locus_tag="SLNWT_RS23545" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5111" + /product="ATP-binding protein" + /protein_id="WP_052482552.1" + /transl_table=11 + /translation="MSTVRDPGPLAAPVRLAPRATALRETEALCSMPVSAEAVPLLRRF + ARDTSRQWDLPGSAQEAACVIVTELVTNVLLHSGSRDVTLRIVLSDFALTVHVDDEGRW + KHRPAARLATEDAGARCGRGLQLVDAYAVACDVDRTERGTRVRAEIAVAAA" + subregion 1..46688 + /aStool="externally annotated by: MIBiG" + /contig_edge="True" + /label="BGC0001596" + /subregion_number="1" + /tool="antismash" + region 1..46688 + /candidate_cluster_numbers="1" + /contig_edge="True" + /product="T2PKS" + /region_number="1" + /rules="(t2ks and t2clf)" + /subregion_numbers="1" + /tool="antismash" + protocluster 1..44880 + /aStool="rule-based-clusters" + /category="PKS" + /contig_edge="True" + /core_location="[7427:9880]" + /cutoff="20000" + /detection_rule="(t2ks and t2clf)" + /neighbourhood="35000" + /product="T2PKS" + /protocluster_number="1" + /t2pks_malonyl_elongations="8|9 (Score: 709.5; E-value: + 2.4e-216)" + /t2pks_molecular_weights="acetyl-CoA_8 (Da): 396.388" + /t2pks_molecular_weights="acetyl-CoA_9 (Da): 438.425" + /t2pks_product_classes="angucycline" + /t2pks_starter_units="acetyl-CoA (Score: 0.0; E-value: 0)" + /tool="antismash" + proto_core 7428..9880 + /aStool="rule-based-clusters" + /tool="antismash" + /cutoff="20000" + /detection_rule="(t2ks and t2clf)" + /neighbourhood="35000" + /product="T2PKS" + /protocluster_number="1" + /t2pks_malonyl_elongations="8|9 (Score: 709.5; E-value: + 2.4e-216)" + /t2pks_molecular_weights="acetyl-CoA_8 (Da): 396.388" + /t2pks_molecular_weights="acetyl-CoA_9 (Da): 438.425" + /t2pks_product_classes="angucycline" + /t2pks_starter_units="acetyl-CoA (Score: 0.0; E-value: 0)" + cand_cluster 1..44880 + /SMILES="" + /candidate_cluster_number="1" + /contig_edge="True" + /detection_rules="(t2ks and t2clf)" + /kind="single" + /product="T2PKS" + /protoclusters="1" + /tool="antismash" + gene 1..468 + /locus_tag="SLNWT_RS23545" + /old_locus_tag="SLNWT_5111" + gene complement(509..1117) + 
/locus_tag="SLNWT_RS23550" + /old_locus_tag="SLNWT_5112" + CDS complement(509..1117) + /codon_start=1 + /gene_functions="regulatory (smcogs) SMCOG1057:TetR family + transcriptional regulator (Score: 90.1; E-value: 4.1e-27)" + /gene_kind="regulatory" + /inference="COORDINATES: protein motif:HMM:NF012655.2" + /locus_tag="SLNWT_RS23550" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5112" + /product="TetR/AcrR family transcriptional regulator" + /protein_id="WP_052482553.1" + /transl_table=11 + /translation="MAAGSEKTTGAEKAQSTRPRLRADAERNRARVLNAARELFAERGA + EVSMDEVARRAEVGIGTLYRHFPTKEAMVIAAGQQRFGEILTYYRTVCRDSAEPLQALH + LLLTRIAEVESRDRGFATAVTEGSLGSEGPRSPLREDLEAELMALIGKGQEGGSIRQDM + ASVDILSLTCGLTSIVHRRSGDWRRYIDIMLDGLKSQAA" + gene 1422..1832 + /locus_tag="SLNWT_RS23555" + /old_locus_tag="SLNWT_5113" + CDS 1422..1832 + /GO_function="GO:0070967 - coenzyme F420 binding [Evidence + IEA]; GO:0016491 - oxidoreductase activity [Evidence IEA]" + /GO_process="GO:0008150 - biological_process [Evidence + IEA]" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018104096.1" + /locus_tag="SLNWT_RS23555" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5113" + /product="TIGR03618 family F420-dependent PPOX class + oxidoreductase" + /protein_id="WP_040258142.1" + /transl_table=11 + /translation="MSRERASAPRVTPSVEAFLAEPHLATLTTLRPDGTPHVVAVRFTW + DARSGLARVMTVRDSRKVRNVLAAPGGRAALCQVAGFKWVTLEGAATVSEDPVRVTEGA + RRYAARYLSPPPNPPGRVVVEIAVDRVMSLNS" + gene complement(2013..2462) + /locus_tag="SLNWT_RS23560" + /old_locus_tag="SLNWT_5114" + CDS complement(2013..2462) + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018383123.1" + /locus_tag="SLNWT_RS23560" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5114" + /product="nuclear transport factor 2 family protein" + /protein_id="WP_040253434.1" + /transl_table=11 + /translation="MTPSESTAEIAGLLDRYLITLDDEKLDDDWTRSLFTEDASVTFPV + GGHQGAAGMGAFHQRTLDAFTCTQHMGTHAFVEIEGGGDTARLRANCTSTHVHRPENAA + ELGPLFRTGTFVDGRARRTPEGWRLSALSFRLMWKHGTPPGGGGR" + gene 2627..4096 + /locus_tag="SLNWT_RS23565" + /old_locus_tag="SLNWT_5115" + CDS 2627..4096 + /GO_function="GO:0071949 - FAD binding [Evidence IEA]" + /codon_start=1 + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1050:monooxygenase FAD-binding (Score: 515.3; E-value: + 3.1e-156)" + /gene_functions="biosynthetic-additional (t2pks) OXY + (Score: 501.7; E-value: 5.3e-153)" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_007385270.1" + /locus_tag="SLNWT_RS23565" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5115" + /product="FAD-dependent monooxygenase" + /protein_id="WP_040253436.1" + /transl_table=11 + /translation="MENFDADVIIVGAGPTGLMLAGELGLHGISALAVDRLEEPIQQSR + ALGFSARTIEEFGQRGLLARFGQVDVIPFGHFGGVPLDFQIVEGGSYGARGIPQSRTEG + VLAGWAREKGAEIRRGVEVTGLDDDGEGVTLQVRTGEGESRLRGRYVVGCDGARSVVRK + AAGIGFPGSEAEIELRFADISGIQLRPRFIGEKVPGGMVMVLPLGPDRSRIIYFDRTQP + LRESAEPITFEEASEAFQRLCGEDISGATPHWVSSTTDVSRQAEAYRSGRVFVAGDAAH + IHLPIGAQGMSAGIQDAVNLGWKLALDLKGRAPEGLLDTYHEERHPVGRRILVNTLAQR + SLYLGGEEMKPLVDVMGELAGYEVVRKHLVGMVTGLDIRHSTVPGEHPLLGRRLPDREL + AVGGEKTTVFALLTEGRGVLLDLSGSAEARKAAEGHAGRVEVVTAESHGIGAELDALLV + RPDGYVAWVAPAGSGAEGLLEALDHWFGAAD" + gene 4166..4855 + /locus_tag="SLNWT_RS23570" + /old_locus_tag="SLNWT_5116" + CDS 4166..4855 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018383121.1" + /locus_tag="SLNWT_RS23570" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5116" + /product="antibiotic biosynthesis monooxygenase" + /protein_id="WP_040253438.1" + /transl_table=11 + /translation="MPKISTEDGYLTVLNLFTADAPEKQEKLLGEMRKIVDAATYEGWI + SSTVHAGVDQPGTANFIQWRSGEDLEKRYAGEEFKHRTLPVFGEMTTSIRLLQNDIVYT + QRAPELNGVTEISPDRDDYTVITVFGVEKENQDALVEALSQDHFLKVDGYRSHSVLKGR + AARGLEGSFVVAYSQWASKEAYDAFNSQPEGERSAERKEAEATVRSLITSVDSNTYRVV + HTRAAGE" + gene 5176..6491 + /locus_tag="SLNWT_RS23575" + /pseudo="" + CDS 5176..6491 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_015036312.1" + /locus_tag="SLNWT_RS23575" + /note="frameshifted; Derived by automated computational + analysis using gene prediction method: Protein Homology." + /product="multicopper oxidase family protein" + /pseudo="" + /transl_table=11 + /translation="VKFTRPLPALPVLSPRRRTARAETYELRQRETECEIVPGLKTRVR + TFDGCFAPPVIKAVRGRRTVIRQVNELTVPTSIHLHGGHVPESSDGGPMDLVQPGASRT + YTYPNEQAHANLWFHDHAHHQESETVFRGLTGLICSPTRPSSGCRCPRAPTTCRSRSAT + SASTRPGRSSTP" + gene 7073..7396 + /locus_tag="SLNWT_RS23580" + /old_locus_tag="SLNWT_5120" + CDS 7073..7396 + /codon_start=1 + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1225:Polyketide synthesis cyclase (Score: 159.3; + E-value: 4.3e-49)" + /gene_functions="biosynthetic-additional (t2pks) CYC + C4-C17/C2-C19 (Score: 196.7; E-value: 8.3e-61)" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018383120.1" + /locus_tag="SLNWT_RS23580" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5120" + /product="TcmI family type II polyketide cyclase" + /protein_id="WP_040253440.1" + /transl_table=11 + /translation="MHSTLIVARMDLGSSKDVAGLFGEFDATEMPHRMGTRRRQLFAYK + GLYFHLQDFDEDNGGERIEEAKTDPRFIGISQDLKPFIEAYDPATWRSPADAMAQRFYT + WEA" + gene 7428..8669 + /locus_tag="SLNWT_RS23585" + /old_locus_tag="SLNWT_5121" + CDS 7428..8669 + /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (44-387). 
E-value: + 6.2e-54. Score: 175.3. Matches aSDomain: + nrpspksdomains_SLNWT_RS23585_PKS_KS.1" + /codon_start=1 + /gene_functions="biosynthetic (rule-based-clusters) T2PKS: + t2ks" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1022:Beta-ketoacyl synthase (Score: 467.5; E-value: + 6.9e-142)" + /gene_functions="biosynthetic-additional (t2pks) KS (Score: + 765.6; E-value: 2.8e-233)" + /gene_kind="biosynthetic" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018383119.1" + /locus_tag="SLNWT_RS23585" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5121" + /product="beta-ketoacyl-[acyl-carrier-protein] synthase + family protein" + /protein_id="WP_052483223.1" + /sec_met_domain="t2ks (E-value: 4.2e-244, bitscore: 801.4, + seeds: 25, tool: rule-based-clusters)" + /transl_table=11 + /translation="MEVLAPGGVGTKNFWSLLSEGRTATRGITFFDPAPFRSRVAAEID + FDPYAHGLSPHEVRRMDRAAQLAVVAARGALADSGLETAALEPHRTGVTVGSAVGATMG + LDEEYRVVSDGGRLDLVDHAYAVPHLYNHLVPSSFAAEVAWAVGAEGPSTVVSTGCTSG + IDALGYALELVREGSVDVMVAGASDAPISPITMACFDAIKATTPRHDDPEHASRPFDGT + RNGFVLGEGSAFFVLEEWESARRRGAHVYAELAGYATRSNAYHMTGLRTDGAEMAEAIR + LALDEARLAPEAIDYVNAHGSGTKQNDRHETAAFKKSLGAHAYATPVSSIKSMVGHSLG + AIGSIEIAASALAMEHHTVPPTANLTTPDPECDLDYVPLHAREQRTDAVLSVGSGFGGF + QSAMVLARPERSPA" + aSDomain 7560..8588 + /aSDomain="PKS_KS" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_SLNWT_RS23585_PKS_KS.1" + /domain_subtype="Iterative-KS" + /evalue="6.20E-54" + /label="SLNWT_RS23585_PKS_KS.1" + /locus_tag="SLNWT_RS23585" + /protein_end="387" + /protein_start="44" + /score="175.3" + /tool="antismash" + /translation="DFDPYAHGLSPHEVRRMDRAAQLAVVAARGALADSGLETAALEPH + RTGVTVGSAVGATMGLDEEYRVVSDGGRLDLVDHAYAVPHLYNHLVPSSFAAEVAWAVG + AEGPSTVVSTGCTSGIDALGYALELVREGSVDVMVAGASDAPISPITMACFDAIKATTP + RHDDPEHASRPFDGTRNGFVLGEGSAFFVLEEWESARRRGAHVYAELAGYATRSNAYHM + 
TGLRTDGAEMAEAIRLALDEARLAPEAIDYVNAHGSGTKQNDRHETAAFKKSLGAHAYA + TPVSSIKSMVGHSLGAIGSIEIAASALAMEHHTVPPTANLTTPDPECDLDYVPLHAREQ + RTD" + gene 8666..9880 + /locus_tag="SLNWT_RS23590" + /old_locus_tag="SLNWT_5122" + CDS 8666..9880 + /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (68-400). E-value: + 1.4e-31. Score: 101.6. Matches aSDomain: + nrpspksdomains_SLNWT_RS23590_PKS_KS.1" + /codon_start=1 + /gene_functions="biosynthetic (rule-based-clusters) T2PKS: + t2clf" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1093:Beta-ketoacyl synthase (Score: 681.1; E-value: + 6.9e-207)" + /gene_functions="biosynthetic-additional (t2pks) CLF 8|9 + (Score: 709.5; E-value: 2.4e-216)" + /gene_kind="biosynthetic" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_010359931.1" + /locus_tag="SLNWT_RS23590" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5122" + /product="ketosynthase chain-length factor" + /protein_id="WP_040253445.1" + /sec_met_domain="t2clf (E-value: 1.6e-212, bitscore: 696.9, + seeds: 26, tool: rule-based-clusters)" + /transl_table=11 + /translation="MSAPAVITGIGVAAPNGLGLRDYWAATLGGKSGIARLTHFDPSGY + PAQLAGEVPGFVAEDHLPSRLIPQTDRMTRMALAAADWALADAGITPAELPSFDMGVVT + ASSSGGFEFGQGELRKLWSQGSQFVSAYQSFAWFYAVNSGQISIRNGMKGPSGVVVSDQ + AGGLDALAQARRQIRRGTPLIVTGAVDASLCPWGWVAQLSGGRMSTSAEAARAYLPFDR + EARGYVPGEGGAILIMEDAEAARARGARVHGRILGYGATFDPRPGSGRPPALRRAAQTA + LADAGVDAADIDVVFADAAGEPAADRAEAEVLTALFGIRGVPVTAPKTMTGRLYSGAAP + LDVTAALLALRDQVIPPTVHVEPCPEYGLDLVLAQPRPAKLRTALVLARGHGGFNSALV + VRGPE" + aSDomain 8870..9865 + /aSDomain="PKS_KS" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_SLNWT_RS23590_PKS_KS.1" + /domain_subtype="Iterative-KS" + /evalue="1.40E-31" + /label="SLNWT_RS23590_PKS_KS.1" + /locus_tag="SLNWT_RS23590" + /protein_end="400" + /protein_start="68" + /score="101.6" + /tool="antismash" + 
/translation="QTDRMTRMALAAADWALADAGITPAELPSFDMGVVTASSSGGFEF + GQGELRKLWSQGSQFVSAYQSFAWFYAVNSGQISIRNGMKGPSGVVVSDQAGGLDALAQ + ARRQIRRGTPLIVTGAVDASLCPWGWVAQLSGGRMSTSAEAARAYLPFDREARGYVPGE + GGAILIMEDAEAARARGARVHGRILGYGATFDPRPGSGRPPALRRAAQTALADAGVDAA + DIDVVFADAAGEPAADRAEAEVLTALFGIRGVPVTAPKTMTGRLYSGAAPLDVTAALLA + LRDQVIPPTVHVEPCPEYGLDLVLAQPRPAKLRTALVLARGHGGFNSALVV" + CDS_motif 9323..9361 + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_SLNWT_RS23590_0001" + /evalue="2.00E-03" + /label="PKSI-KS_m4" + /locus_tag="SLNWT_RS23590" + /protein_end="232" + /protein_start="219" + /score="11.4" + /tool="antismash" + /translation="FDREARGYVPGEG" + gene 9975..10244 + /locus_tag="SLNWT_RS23595" + /old_locus_tag="SLNWT_5123" + CDS 9975..10244 + /NRPS_PKS="Domain: ACP (12-82). E-value: 1.7e-16. Score: + 52.2. Matches aSDomain: nrpspksdomains_SLNWT_RS23595_ACP.1" + /codon_start=1 + /gene_functions="biosynthetic-additional + (rule-based-clusters) PP-binding" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1129:acyl carrier protein (Score: 118.5; E-value: + 1.6e-36)" + /gene_functions="biosynthetic-additional (t2pks) ACP + (Score: 133.6; E-value: 4.3e-42)" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018383117.1" + /locus_tag="SLNWT_RS23595" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5123" + /product="acyl carrier protein" + /protein_id="WP_040253447.1" + /sec_met_domain="PP-binding (E-value: 7.6e-10, bitscore: + 30.7, seeds: 164, tool: rule-based-clusters)" + /transl_table=11 + /translation="MATAAFTLDDLKRILLQSAGAAEGVDLDGEILDTEFEVLGYESLA + LLETGGAIEREYGISLDDEVITDAETPRALIDAVNAHLSTAGAA" + aSDomain 10011..10220 + /aSDomain="ACP" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_SLNWT_RS23595_ACP.1" + /evalue="1.70E-16" + /label="SLNWT_RS23595_ACP.1" + /locus_tag="SLNWT_RS23595" + /protein_end="82" + /protein_start="12" + /score="52.2" + /tool="antismash" + /translation="RILLQSAGAAEGVDLDGEILDTEFEVLGYESLALLETGGAIEREY + GISLDDEVITDAETPRALIDAVNAH" + gene 10263..11057 + /locus_tag="SLNWT_RS23600" + /old_locus_tag="SLNWT_5124" + CDS 10263..11057 + /NRPS_PKS="Domain: PKS_KR (11-121). E-value: 3.7e-10. + Score: 31.8. Matches aSDomain: + nrpspksdomains_SLNWT_RS23600_PKS_KR.1" + /codon_start=1 + /gene_functions="biosynthetic-additional + (rule-based-clusters) adh_short" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1001:short-chain dehydrogenase/reductase SDR (Score: + 259.9; E-value: 3.7e-79)" + /gene_functions="biosynthetic-additional (t2pks) KR C9 + (Score: 473.5; E-value: 3.7e-145)" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018839768.1" + /locus_tag="SLNWT_RS23600" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5124" + /product="SDR family NAD(P)-dependent oxidoreductase" + /protein_id="WP_040253449.1" + /sec_met_domain="adh_short (E-value: 8.9e-36, bitscore: + 115.0, seeds: 230, tool: rule-based-clusters)" + /transl_table=11 + /translation="MTENTQEHGRLALVSGGTSGIGLASARLLAEQGHRVFLGARDADR + VAATVKELAGEGLPVDGTVLDVREDASVRAFVQAAVDRFGTVDVLVNNAGRSGGGVTAD + IPFELWADVIETNLTSVFRMTKEVLNAGGMRAKSRGRIINIASTAGKQGVVLGAPYSAS + KHGVVGFTKALGNELAPTGITVNAVCPGYVETPMAQRVRQGYADAYDTSEEAILEKFQA + KIPLGRYSTPEEVAGLVGYLASDTAASLTSQALNVCGGLGNF" + aSDomain 10296..10625 + /aSDomain="PKS_KR" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_SLNWT_RS23600_PKS_KR.1" + /evalue="3.70E-10" + /label="SLNWT_RS23600_PKS_KR.1" + /locus_tag="SLNWT_RS23600" + /protein_end="121" + /protein_start="11" + /score="31.8" + /specificity="KR activity: inactive" + /specificity="KR stereochemistry: C1" + /tool="antismash" + /translation="ALVSGGTSGIGLASARLLAEQGHRVFLGARDADRVAATVKELAGE + GLPVDGTVLDVREDASVRAFVQAAVDRFGTVDVLVNNAGRSGGGVTADIPFELWADVIE + TNLTSV" + CDS_motif 10299..10370 + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_SLNWT_RS23600_0001" + /evalue="8.70E-07" + /label="PKSI-KR_m1" + /locus_tag="SLNWT_RS23600" + /protein_end="36" + /protein_start="12" + /score="21.6" + /tool="antismash" + /translation="LVSGGTSGIGLASARLLAEQGHRV" + gene 11107..12048 + /locus_tag="SLNWT_RS23605" + /old_locus_tag="SLNWT_5125" + CDS 11107..12048 + /NRPS_PKS="Domain: Polyketide_cyc2 (4-146). E-value: + 1.4e-18. Score: 59.5. Matches aSDomain: + nrpspksdomains_SLNWT_RS23605_Polyketide_cyc2.1" + /NRPS_PKS="Domain: Polyketide_cyc2 (155-292). E-value: + 2.3e-10. Score: 32.9. 
Matches aSDomain: + nrpspksdomains_SLNWT_RS23605_Polyketide_cyc2.2" + /codon_start=1 + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1128:cyclase/dehydrase (Score: 444.3; E-value: + 3.9e-135)" + /gene_functions="biosynthetic-additional (t2pks) CYC C7-C12 + (Score: 476.4; E-value: 6.9e-146)" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330940.1" + /locus_tag="SLNWT_RS23605" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5125" + /product="aromatase/cyclase" + /protein_id="WP_040253451.1" + /transl_table=11 + /translation="MTTREVEHEITIAAPAAAVYRLLAEVANWPRIFPPTLYVDREELG + PGQERIHIWATANGEAKNWTSHRTLDEDALRITFRQEVSPEPVAEMNGTWIIEPQGASS + SRVRLLHAFKAIGDDPHDLLWIETAVDKNSTKELAGLKENVELAHAAEELTFSFTDTVR + IDGAAKDAYDFIDQADKWDERLPHVARVRLTEDTPGLQELEMDTRAKDGSTHTTKSYRV + TFPHHRIAYKQVTLPALMTLHTGIWTFEEDPTGTHTTASSQHTVTLRPENIEKILGPDA + TVADARAYVQSALSTNSTATLGHAKNHAERQG" + aSDomain 11119..11544 + /aSDomain="Polyketide_cyc" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_SLNWT_RS23605_Polyketide_cyc2.1" + /domain_subtype="Polyketide_cyc2" + /evalue="1.40E-18" + /label="SLNWT_RS23605_Polyketide_cyc2.1" + /locus_tag="SLNWT_RS23605" + /protein_end="146" + /protein_start="4" + /score="59.5" + /tool="antismash" + /translation="EVEHEITIAAPAAAVYRLLAEVANWPRIFPPTLYVDREELGPGQE + RIHIWATANGEAKNWTSHRTLDEDALRITFRQEVSPEPVAEMNGTWIIEPQGASSSRVR + LLHAFKAIGDDPHDLLWIETAVDKNSTKELAGLKENVE" + aSModule 11119..11982 + /domains="nrpspksdomains_SLNWT_RS23605_Polyketide_cyc2.1" + /domains="nrpspksdomains_SLNWT_RS23605_Polyketide_cyc2.2" + /incomplete + /locus_tags="SLNWT_RS23605" + /tool="antismash" + /type="unknown" + aSDomain 11572..11982 + /aSDomain="Polyketide_cyc" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + 
/domain_id="nrpspksdomains_SLNWT_RS23605_Polyketide_cyc2.2" + /domain_subtype="Polyketide_cyc2" + /evalue="2.30E-10" + /label="SLNWT_RS23605_Polyketide_cyc2.2" + /locus_tag="SLNWT_RS23605" + /protein_end="292" + /protein_start="155" + /score="32.9" + /tool="antismash" + /translation="FSFTDTVRIDGAAKDAYDFIDQADKWDERLPHVARVRLTEDTPGL + QELEMDTRAKDGSTHTTKSYRVTFPHHRIAYKQVTLPALMTLHTGIWTFEEDPTGTHTT + ASSQHTVTLRPENIEKILGPDATVADARAYVQS" + gene 12048..13505 + /locus_tag="SLNWT_RS23610" + /old_locus_tag="SLNWT_5126" + CDS 12048..13505 + /GO_function="GO:0071949 - FAD binding [Evidence IEA]" + /codon_start=1 + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1050:monooxygenase FAD-binding (Score: 499.9; E-value: + 1.5e-151)" + /gene_functions="biosynthetic-additional (t2pks) OXY + (Score: 551.4; E-value: 4.3e-168)" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330939.1" + /locus_tag="SLNWT_RS23610" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5126" + /product="FAD-dependent monooxygenase" + /protein_id="WP_040253452.1" + /transl_table=11 + /translation="MDTADRLETQVIIVGAGPVGLLLAGELRLGGAEVVVLEQREAPTT + ESRASTLHARTMEILDSRGLLAGLGTPPQEPRGHFGGIPLDLTLPSRYPGQWKVPQFRT + EELLQEWALGLGADIRRGHQVHALNPGDQAEYVEAEATGPGGRRVLVRGRHLVACDGEE + GTVRRLTGVVFPGQSATRELLRADVDGIDVPDRRFERLPRGLAIAARRGDGVTRVMAHV + FGSTAQPRTGEAEFGEVVAAWKQVTGEDISGGTPLWVNTFGDASRQLVHYRRGRILFAG + DAAHVQMPIGGQALNLGLQDAFNLGWKLARQLREPGGEALLDSYHTERHAVGRRVLGNI + KAQAMLLLGGPEVEPLRTLLAELIRHEKVRAHLAGMISGLDIRYQLPGPAHPLLGARLP + HTVLTSPQGRVSVSELLRTGRGVWINPGVDVPDGARLSTLTGRPEEGPLTDKDSVLVRP + DGHVAWAGSTGTPPPAEALGPGWEATA" + gene 13588..15108 + /locus_tag="SLNWT_RS23615" + /old_locus_tag="SLNWT_5127" + CDS 13588..15108 + /GO_function="GO:0071949 - FAD binding [Evidence IEA]" + /codon_start=1 + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1050:monooxygenase FAD-binding (Score: 533.9; E-value: + 7.4e-162)" + /gene_functions="biosynthetic-additional (t2pks) OXY + (Score: 546.1; E-value: 1.8e-166)" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330938.1" + /locus_tag="SLNWT_RS23615" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5127" + /product="FAD-dependent monooxygenase" + /protein_id="WP_040253455.1" + /transl_table=11 + /translation="MAGTAQGTAVDADVIIVGAGPTGLMLAGELRLGGARVIVAERLAE + PTGQSRGLGFTARAMEIFDQRGLLPRFGQGETLETSPMGHFGGLQFDFTTLPGAHFGAR + GIPQYQTEAVLEEWAAGLGADIRRGWEFLELAEGFLTGEGVEVTFGTPEGVRTLRAAYL + VGCDGGGSQVRKAAGFAFPGLPATRAMFLADVTGLNLKPRFLGERLPHGMVMAAPLAEG + VDRIIVCPHGTPARDRDESVTFEEVAAAWQHITGEDISHGGADWVSSFSDAARQVDSYR + RGRVLLAGDAAHIHLPAGGQGLSTGVQDAANLGWKLAATVAGRAPAGLLDSYHTERHAV + GSRLLMNTRAQGFVFLGGEPADPLRTVFAELLGHEEVKQHLAGIVSHLDVHYAAPEGAH + PLTGHRLGEHILVGKEGESAVFAELHGGRGLLLDLADDAGVRAAGAGLTDRLTTVTATL + KSAPGDADRLDGVRALLVRPDGYVAWAGETTEGLAEAVRRWFGEASPA" + gene 15254..16195 + /locus_tag="SLNWT_RS23620" + /old_locus_tag="SLNWT_5128" + CDS 15254..16195 + /codon_start=1 + /gene_functions="biosynthetic-additional + (rule-based-clusters) Abhydrolase_6" + /gene_functions="biosynthetic-additional + (rule-based-clusters) PF00561" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018103054.1" + /locus_tag="SLNWT_RS23620" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5128" + /product="alpha/beta fold hydrolase" + /protein_id="WP_052482554.1" + /sec_met_domain="Abhydrolase_6 (E-value: 5.3e-13, bitscore: + 41.5, seeds: 455, tool: rule-based-clusters)" + /sec_met_domain="PF00561 (E-value: 5e-08, bitscore: 24.3, + seeds: 48, tool: rule-based-clusters)" + /transl_table=11 + /translation="MTALGSTPTGDTDPPAPEPPAPDPPVPGAFSTGVRRITLDAGGLD + LSALLSEPEQGPPRATVVAVHGGGMSAGYFDGQAHPEQSLMTLGAQLGYTVLSVDRPGY + GSSAAWLPEGLTLGEQAVVLHAALDDFRRHYAHGAGLFLLAHSLGGALVMATAAGAEAD + RALLGLDVSGCGHRYAVVPDQGRTTRRNTLRHWGPLRLYPPNTFATSTGLVAPVPAREA + GELARWPELFAALAPRISVPVRLTFAEHEAWWRHGEQDLADLAAQLTASPRVLVERQPD + AGHNISLGWAARAYHLRSLAFLEDCLTHTGRE" + gene 16321..16995 + /locus_tag="SLNWT_RS23625" + /old_locus_tag="SLNWT_5130" + CDS 16321..16995 + /GO_function="GO:0008897 - holo-[acyl-carrier-protein] + synthase activity [Evidence IEA]" + /NRPS_PKS="Domain: ACPS (140-185). E-value: 1.2e-11. Score: + 36.4. Matches aSDomain: + nrpspksdomains_SLNWT_RS23625_ACPS.1" + /codon_start=1 + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1012:4'-phosphopantetheinyl transferase (Score: 143.8; + E-value: 7.6e-44)" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_015037171.1" + /locus_tag="SLNWT_RS23625" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5130" + /product="4'-phosphopantetheinyl transferase superfamily + protein" + /protein_id="WP_052482555.1" + /transl_table=11 + /translation="MTSTRAPLPAPGTYQLWVFDSLTEEGIPATRAEAGPEALGPEERR + RARLFRRPADRRQYESAHLVLRRLLADHTGLAPERLEFGREGGRRGKPRLLGSPVPVHF + SLSHSHGLVAIALAADPVGVDVQRVPGARTVERCLPSLHPAERAELTALPESERPDAFA + LLWTRKEAYLKGLGTGLARPLAADYLGSGGLAARPPDWTVHNTAARPGHAAAAALRTPA + TG" + aSDomain 16741..16875 + /aSDomain="ACPS" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_SLNWT_RS23625_ACPS.1" + /evalue="1.20E-11" + /label="SLNWT_RS23625_ACPS.1" + /locus_tag="SLNWT_RS23625" + /protein_end="185" + /protein_start="140" + /score="36.4" + /tool="antismash" + /translation="SLHPAERAELTALPESERPDAFALLWTRKEAYLKGLGTGLARPLA + " + gene 17035..18609 + /locus_tag="SLNWT_RS23630" + /old_locus_tag="SLNWT_5131" + CDS 17035..18609 + /codon_start=1 + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1059:acetyl-CoA carboxylase, carboxyl transferase, + (Score: 729.5; E-value: 4e-221)" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019520922.1" + /locus_tag="SLNWT_RS23630" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5131" + /product="acyl-CoA carboxylase subunit beta" + /protein_id="WP_052482556.1" + /transl_table=11 + /translation="MATATEDTHHPRALAAELGARKEEARQGPDPRATERQHAKGKLTA + RERIDLLLDKNSFTEVEQLRRHRATGFGLEARKPYTDGVVTGWGTVEGRTVFVYAHDFR + IFGGALGEAHAAKIHKIMDMALAAGAPLVSLNDGAGARIQEGVSALAGYGGIFQRNTRA + SGVIPQISVMLGPCAGGAAYSPALTDFVFMVRDTSQMFITGPDVVQAVTGEEISQNGLG + GAEVHAGTSGVAHFAYDDEETCLAEVRYLLSFLPSNNRSMPPHLPSADPADRPGERLTE + VVPADGNRAYDVREVIEEVVDDGEYLEVHASWAPNLVCALARLDGHVVGVVANQPNAFA + GVLDIRASEKGARFVQFCDSFSIPLVTLVDVPGFLPGVDQEHEGIIRRGAKLLYAYCNA + TVPRVSVVLRKAYGGAYIVMDSRSIGADIALAWPTNEIAVMGAEGAANVVFRREIAAAA + DPGEMRAQKIKEYREELVHPYYAAERGLVDDVIDPRETRAVLCRAVTMLAAKDADLPRR + KHGNPPQ" + gene 18829..19044 + /locus_tag="SLNWT_RS23635" + /old_locus_tag="SLNWT_5132" + CDS 18829..19044 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018850635.1" + /locus_tag="SLNWT_RS23635" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5132" + /product="hypothetical protein" + /protein_id="WP_040258146.1" + /transl_table=11 + /translation="MLRVVRGNPAPEELAVLSALLFARLSAPEAQAAGPLGRAVAGWRR + PERGSMFDGPRTWRGTGSAAHPTGGR" + gene complement(19200..19985) + /locus_tag="SLNWT_RS23640" + /old_locus_tag="SLNWT_5133" + CDS complement(19200..19985) + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_017237263.1" + /locus_tag="SLNWT_RS23640" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5133" + /product="DUF3050 domain-containing protein" + /protein_id="WP_040253457.1" + /transl_table=11 + /translation="MSRYDWGKENASIEKLRKVIDDARLEVVKHPIYHRLATLEDVNTF + NENHVFAVWDFMSLLKSLQRSLTCVDVPWVPQGSSESRRLINDIVLVEESDELGDGFIS + HFELYVNGMAEAGADVTVINNFLDRIRGGEGVRTALVGASVPAAAATFVNATFDFIEGA + PLHCRAAAFAFGREDLIPEMFDQVIKVDDQGGKLATFREYLARHIEVDGEEHTPMAMAM + VADLCGEDEAKWQEAAETVTAALRARVALWDGIVAALDA" + gene 20578..20913 + /locus_tag="SLNWT_RS23645" + /old_locus_tag="SLNWT_5135" + CDS 20578..20913 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018383104.1" + /locus_tag="SLNWT_RS23645" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5135" + /product="4Fe-4S ferredoxin" + /protein_id="WP_040253458.1" + /transl_table=11 + /translation="MPWEKNEAAGGETSGRDARIAARAREENWKKPPRRIESAECITCD + SCLRGCPAEFGAIFDRGLDVVIIPELCSGCPACVLECPVDCIYVDEDWAPTDESLWKHI + ELTADGA" + gene 20913..22832 + /locus_tag="SLNWT_RS23650" + /old_locus_tag="SLNWT_5136" + CDS 20913..22832 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_017237261.1" + /locus_tag="SLNWT_RS23650" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5136" + /product="hypothetical protein" + /protein_id="WP_040253460.1" + /transl_table=11 + /translation="MPSPAERGLSRREINARKRQSRRPSRHGSAAGAAPGPDYPREDGV + GFPGLLDRAWRAALAAGELPAAVDALLTLDGHVPGDIQLRALRTADEAALKVLCGASWR + GVRDGGQASGASAERAQVPPQDAVFDGEIALSTTGRILVRVPSQGPLAESGNLVAPALQ + VPWSAADLAAYRTESARAAARYSSAVVDCRQWLAAHSTQAREELLDLLKDAALRTAPFV + LYQEDRQYTNFRDPNTLTGKTLWPGHPDCALSSLAGLPLDQWSDSEAVLVVCLTLLVRS + ASYARIEEANGTQLTPDHVGHLLEGVRRNYNAHSRGEAVPPAASARVADLDALAGALRA + RRTEVLGEVQLYREIHGPLMHKIERTAAPRGAAARHREAEVTARLTEALPLAGEDLGAL + AAHLAESPAWLTKPHGEFRTGLEALVHASVAASTEAFEADFAMSRGMRSLAGLREALRA + QAWAEITDWGITDFFCCVVPDPAARRHFGDSVDRLADTAWAMSSRMQYNSWHFIAGNLP + KVPAVVARDHFVPPTLPDIAFYSDQHHHGHVAAKVRFSIRSPQAVEIDGRRFNGFMDLR + LLRCEGTPFGEQDLLAAHRVSAFVAGATGLAAELVAAGEEIEVTSFDSAWHGESVRAAV + KARG" + gene 22838..24277 + /locus_tag="SLNWT_RS23655" + /old_locus_tag="SLNWT_5137" + CDS 22838..24277 + /codon_start=1 + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1105:amidase (Score: 418.1; E-value: 8.2e-127)" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018383106.1" + /locus_tag="SLNWT_RS23655" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5137" + /product="amidase family protein" + /protein_id="WP_078845181.1" + /transl_table=11 + /translation="MSPSEAGSVRPVTSEETQLTAYGIAATRALLGRGERTATEHLAAH + LAAIEERDPGLGAFVAVAGEGALRAAAAADARLRALGPAAFQDQPLLGVPVSVKDLIQT + GELPTRRGSLLPNRRPAADAPAVARLKAAGAIVVGKTTTSEYGWSASTVSRVSPPTRNP + WDPAYSAGGSSGGAAASVAAGLCTAALGTDGAGSIRIPAAFCGVVGYKPSFGRVPYVPA + GADRLSHLGPLARSVEDVMEIAAVLPGPHRQDPDSGLGALESRPERRGLRVGWIEFPGT + APEVRRVSERALEALAALGHHPERIEVPFRDPYPALLDILAAAEAAGAAPGDEADGDPG + RLAVVRHGRGLDGAAVMRAEEVRMELRTRLAAVMERHDLLAMATVPVEPFAPEAIGPDW + ASDPESLLWLAWSPATYPFNMTGQPAVSLPAGLSRAGLPVGVQLVGPVGADALVLDTAR + DLEAGLGPLPEVPQRVSERML" + gene 24280..25791 + /locus_tag="SLNWT_RS23660" + /old_locus_tag="SLNWT_5138" + CDS 24280..25791 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018383107.1" + /locus_tag="SLNWT_RS23660" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5138" + /product="glutamine synthetase family protein" + /protein_id="WP_040253462.1" + /transl_table=11 + /translation="MYTRKWSRPAAEDGVGRSDFVAEHGLWDERQRAAAAEIEAHLGEV + DLIRLVFGDPHGLARSKTLTVEAFRAALRGGMDYSPGPFLFDTGHAVAVDFLSDPGVDV + PELLGAGNFVVVPDPVTFQLLPGGEARTAWVIGEEYLPDGRPHPLSSRHVLRKVIAAYA + AQEYTPVLGLEVEWYLTRRLEGPVGNAGNGFGLQGEAPRVAAMNPGYQFNSDNAFASVA + AFAHPLSALLRQLGLPLRSMEHESGPGQIETTFAPMHALDTADAMLLFRTLVKQRAAQG + GYHATFMSLPRIDGFDPSGWHVHQSVVDTRTGRNLFAPDDPAAPLSAAGLAYAEGLLRR + ARELCLLSVPTVNGHRRLGSGFSLSPTRIGWSPEDRTAMVRVVGAGGSRHLENRTGEPC + ANPYLALAAQLFAGLEGMNSDSLVPRPALGPDAAGAETLPGSLEESLAAFRQGSPADLL + GTPLARCLAKLKQSELDRFRTWAEKEQPPEGEVTEWEQREYFEAF" + gene 25861..27147 + /gene="purB" + /locus_tag="SLNWT_RS23665" + /old_locus_tag="SLNWT_5139" + CDS 25861..27147 + /EC_number="4.3.2.2" + /GO_function="GO:0004018 - N6-(1,2-dicarboxyethyl)AMP + AMP-lyase (fumarate-forming) activity [Evidence IEA]" + /GO_process="GO:0009152 - purine ribonucleotide + biosynthetic process [Evidence IEA]" + /codon_start=1 + 
/gene="purB" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1063:argininosuccinate lyase/adenylosuccinate lyase + (Score: 148.3; E-value: 5.8e-45)" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_007389998.1" + /locus_tag="SLNWT_RS23665" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5139" + /product="adenylosuccinate lyase" + /protein_id="WP_040253465.1" + /transl_table=11 + /translation="MIPRYTRPEMAELFSDQARYETWVRVEILATEAQVRLGAVPGSAL + ADMRRAPVPLASRVAEIEKERDHEVLSFLAAYCEEIPEESARWVHLGMTSYDLVDTALG + HTLARGTDLLLDAARALRRILAERAVEHWDTVCVGRTHGVHAEPTTFGHKLAGYAFAVD + RSLTRLRAAREAVAVGTVSGSVGTYALIDPAVERHVLTALGLAAEPAPSQVVARDRHAQ + LVQAVAALGAVVEQVALEMRLLQRTEVREVEERRTGAYQGSSAMPHKRNPTTSERLVGL + ARLLRGHAGTALENVALWHERDLAHQSVERVILPDSLSVGHFQVTMATELLTHLAVFPE + RMRAHLEQTGGLVYSSAVLAELLATGTEREKAYRGVQAAANRTLAGGADFAAALAEEGI + DLGPLGPERFLGHHDVIRERLEQLRDLED" + gene 27131..27535 + /locus_tag="SLNWT_RS23670" + /old_locus_tag="SLNWT_5140" + CDS 27131..27535 + /EC_number="2.3.1.-" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018383109.1" + /locus_tag="SLNWT_RS23670" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5140" + /product="GNAT family N-acetyltransferase" + /protein_id="WP_040253467.1" + /transl_table=11 + /translation="MTWKIERVPGDGLDLDEVLTVYRESGLGERRPIEDRERFAAMLRG + ANLVVVCRTEEGRLIGIARSVSDFSYVTYLSDIAVSADFQRAGIGRALIAGTQAETPGV + KIVLLSAPAAVDYYPHLGFTRHESAWVLQP" + gene complement(27621..28349) + /locus_tag="SLNWT_RS23675" + /old_locus_tag="SLNWT_5141" + CDS complement(27621..28349) + /codon_start=1 + /gene_functions="regulatory (smcogs) SMCOG1008:response + regulator (Score: 185.3; E-value: 1.9e-56)" + /gene_kind="regulatory" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_015037154.1" + /locus_tag="SLNWT_RS23675" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5141" + /product="response regulator transcription factor" + /protein_id="WP_237282926.1" + /transl_table=11 + /translation="MPSPRFAEDEGFGPTTRKVAGLPTGQRILVVDNDSDYAEALVCRL + RRHGHETTRVQQGGTALQSLEDIDLVLLDLELPDLDGLEVCGAIRSVSCLPVIIVTARG + TELDRVLGLQAGADDFLVKPYGFRELLARIDAVMRRVHQQPQRVREIQHGPLKIDASSR + EVSLDGREVGLTRKEFDLLHLLASNPDTVIPRKRLLQQVWGDSWSRRTVDTHVSSLRSK + LGDSGWIITVRGVGFKLGSA" + misc_feature complement(27756..27758) + /note="tta leucine codon, possible target for bldA + regulation" + /tool="antismash" + gene complement(28640..29536) + /locus_tag="SLNWT_RS23680" + /old_locus_tag="SLNWT_5142" + CDS complement(28640..29536) + /GO_function="GO:0003677 - DNA binding [Evidence IEA]; + GO:0003700 - DNA-binding transcription factor activity + [Evidence IEA]; GO:0016987 - sigma factor activity + [Evidence IEA]" + /GO_process="GO:0006352 - DNA-templated transcription, + initiation [Evidence IEA]; GO:0006355 - regulation of + transcription, DNA-templated [Evidence IEA]" + /codon_start=1 + /gene_functions="regulatory (smcogs) SMCOG1032:RNA + polymerase, sigma-24 subunit, ECF subfamily (Score: 117.4; + E-value: 8.6e-36)" + /gene_kind="regulatory" + /inference="COORDINATES: similar to AA + 
sequence:RefSeq:WP_018088855.1" + /locus_tag="SLNWT_RS23680" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5142" + /product="sigma-70 family RNA polymerase sigma factor" + /protein_id="WP_040253470.1" + /transl_table=11 + /translation="MDKGEWPALAEKFESQRPHLRAVAYRMLGSVAEADDAVQETWLRL + SRSEAGEIGNLGGWLTTVAGRICLDMLRSRSSRREDPLGDHLPEHGPRDQAAAPTDPAH + EAQLVDSVGLALLVVLDTLDPAERIAFVLHDMFSVPFGEIAPIVGRTPVAARQLASRAR + RRVQAVDTSPDSDLPRQRAVVDAFLAAARGGEFEALLALLDPDVVLRVDAAATPAGAPM + EIVGAQPVAAQAGLYSGRAHLARTALVDGRLGLATAAPRQLSVVMDFTVSEGRITAMNI + IADPTRLAGLDVAILSA" + gene 29994..31013 + /locus_tag="SLNWT_RS23685" + /old_locus_tag="SLNWT_5143" + CDS 29994..31013 + /codon_start=1 + /inference="COORDINATES: ab initio prediction:GeneMarkS-2+" + /locus_tag="SLNWT_RS23685" + /note="Derived by automated computational analysis using + gene prediction method: GeneMarkS-2+." + /old_locus_tag="SLNWT_5143" + /product="ParB N-terminal domain-containing protein" + /protein_id="WP_159393028.1" + /transl_table=11 + /translation="MSLAEQLTYPAVDLDEIESSAIWIESHPITRVRIDSLVFEGSPRL + GGEDHDHVRVLAEAGDSLPAITVHRPTLRVIDGTHRVRAALLNGRTEIAARMLDCDEAA + AFVLSVKANVTHGLPLSRQERAAAAARIIMTHPQWSDRAVAAATGISDKTVSRIRSQSG + ADSAQSATRLGRDGRLRPLDSGQRRRRAAAMFLDRPDAGLREVARATGLSPATVRDVRQ + RIDRGEDPVPGRYRTAESPGGATAARQRPAAGRLDRRTVVVDRQRLLAKLSEDPSLRLN + EAGRRALRWLHHYSVDGNGIETLGQGLPCHWAPDVADLARSCAAAWAELAEQLQQRAE" + gene 31680..32846 + /locus_tag="SLNWT_RS23690" + /old_locus_tag="SLNWT_5145" + CDS 31680..32846 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018563740.1" + /locus_tag="SLNWT_RS23690" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5145" + /product="inositol-3-phosphate synthase" + /protein_id="WP_052482559.1" + /transl_table=11 + /translation="MSQHPEKAGPPGAPASGPGTGVWFIGARGSVATTAVTGAAALAAG + LQPPTGLVTEAPEFAGSGLPALSSLVFGGHDTADWPLPKRAEALAEGGVLPRGLAAAVQ + RELAAADEEIRPGGPLPGDRRGDEELIADFAADIADFTRRTGVARTVVVNLASTEPLPE + PNSARLPASSLYAAAALRAGAAYVNFTPSAGLHHPALAEAAASARVPYAGRDGKTGQTL + LRSVLAPMFRQRALDVRAWSGTNLLGGGDGAALADPAAAEAKNAGKNRVLEDTLGALPE + GEVHIDEVPALGEWKTAWDHVAFEGFLGSRMILQTIWQGCDSALAAPLVLDLARLAARA + QEAGLTGQLPALGFYFKDPDGGSSALAEQYAALLAFAARLGARPAEAS" + gene 32843..33769 + /locus_tag="SLNWT_RS23695" + /old_locus_tag="SLNWT_5146" + CDS 32843..33769 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_014049484.1" + /locus_tag="SLNWT_RS23695" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5146" + /product="UbiA family prenyltransferase" + /protein_id="WP_040253473.1" + /transl_table=11 + /translation="MSTPRDWAELLRVSALLSVPGDALAGAAASRRRPNSRTALALCSS + LCLYEAGMALNDWADRAEDAEERPHRPLPSGRIAPGAALAAAAGLTAAGLGLAARAGRP + AALCATALAGAVWAYDLRLKHTAAGPAAMAAARGLDLVLGALATAGPRSGEAAGSVLGR + ALPPAAVLGAHTWAVTAVSRAETQGGSAGRPLAALGTTAALGTLLAPAGARPLRLERAR + RLPETPRELAQAALAGAYAATAGRSYLHAALNPSPPLTQRAVGGGIRAMIPLQAALAAR + SGALATAASLGALVPLARSLARKVSPT" + gene 33766..34713 + /locus_tag="SLNWT_RS23700" + /old_locus_tag="SLNWT_5147" + CDS 33766..34713 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_016823815.1" + /locus_tag="SLNWT_RS23700" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5147" + /product="sugar phosphate isomerase/epimerase" + /protein_id="WP_078845184.1" + /transl_table=11 + /translation="MSIRLGYGTNGLTDLRLREALTLLAELGYQGVGLTLDHMHLDPLA + RGLSGRAKALARTLGALGLDVTVETGARYVLDPRRKHGPSLLDPDPEARVAREALLVTA + VEVAAELGAHAVHCFSGVRPEGTDEGTAWQRLADSLGPVLDAAQRDGIPLALEPEPGHL + VESLADFHRLRALLGDPELLGLTLDIGHCQCLEPASPAECVTAAAPWLRHVQIEDMRRG + VHEHLPFGEGEIDFPPVLAALEASGYRGLTVVELPRHSHAGPELARRSMEFLRPLVAAA + AREDRAAGAPSPVRARPVPLLTGPPLRQEAPSRT" + gene 34723..35409 + /locus_tag="SLNWT_RS23705" + /old_locus_tag="SLNWT_5148" + CDS 34723..35409 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018851358.1" + /locus_tag="SLNWT_RS23705" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5148" + /product="EboA domain-containing protein" + /protein_id="WP_186095464.1" + /transl_table=11 + /translation="MPITPITPEEPRPAPEPADGTEAELRREAAELRERLSAEGADWLD + GALAEAARAAAEPAPAESRAVPGWELRFAAAGRACGTEAAESARVLLLRAARPGPAALT + RLYRHGTGEERRAVLRALPRLPLAPGEGLPLVEDALRTNDTRLVAAAVGPYAAAHLDDH + AWRHAVLKCLFTQVPVRALARLPERARGDAELARMLRDFAAERTAAGRAVPADLDHVLA + LTAKDA" + gene 35409..36257 + /locus_tag="SLNWT_RS23710" + /old_locus_tag="SLNWT_5149" + CDS 35409..36257 + /GO_function="GO:0016788 - hydrolase activity, acting on + ester bonds [Evidence IEA]" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_016327783.1" + /locus_tag="SLNWT_RS23710" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5149" + /product="TatD family hydrolase" + /protein_id="WP_040253475.1" + /transl_table=11 + /translation="MRIFDPHIHMTSRTTDDYEAMYAAGVRALVEPAFWLGQPRTSPES + FFDYFDALLGWEPFRAAQYGIAHHCTLALNPKEANDPRCLPVLDALPRYLVKDHVVAVG + EIGYDAMTPAEDTALAAQLELAAEHGLPALVHTPHRDKLTGLRRTLDVVAESKLPTERV + LIDHLNETTVKEARESGSWLGFSVYPDTKMDEHRMVALLKEYGPERVLVNSAADWGKSD + PLKTRKVGEAMLAAGFGEDEVHRVLWENPVAFYGLSGRLDLEVPGTEALHEGNSLLRGG + E" + gene 36261..37430 + /gene="eboE" + /locus_tag="SLNWT_RS23715" + /old_locus_tag="SLNWT_5150" + CDS 36261..37430 + /codon_start=1 + /gene="eboE" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_003972400.1" + /locus_tag="SLNWT_RS23715" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5150" + /product="metabolite traffic protein EboE" + /protein_id="WP_040253477.1" + /transl_table=11 + /translation="MRFRHPDGSLVHLAYCTNVHPAEDLDGVLAQLGAYCEPVRRRLGT + ERLGIGLWLARDAARALTTEASALRRLRTELDRRGLEVVTLNGFPYRGFGAEKVKYRVY + QPDWRDAERLEYTAELAGLLAELLPPDVTEGTLSTLPLAWRSDFDAAGAAAAERQLTEL + ARRLDDLEERTGRSIRVALEPEPGCAVERTADALAPLAALPAHRFGLCLDTCHLATCFE + EPAAALAALERAGATVPKVQLSAALHAEDPADPAVRAALAAFDEPRFLHQTRALAEGVL + HGTDDLGPALAGGTLPETVPWRAHFHVPLHAPPAPPLTSTMDVLRGSLDVLLGQDAPRS + RHFEVETYTWQALPPEARPADAAQLADGIAAELALARGLFRDLGLKELP" + gene 37427..38827 + /locus_tag="SLNWT_RS23720" + /old_locus_tag="SLNWT_5151" + CDS 37427..38827 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_020125660.1" + /locus_tag="SLNWT_RS23720" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5151" + /product="alkaline phosphatase family protein" + /protein_id="WP_040253479.1" + /transl_table=11 + /translation="MTATPTPLLVLDVVGLTPALLEQMPRLKSLARKGSSAGLGTVLPA + VTCAAQSTFLTGAPPAEHGIVGNGWYFRELGEVLLWRQHNGLVAGDKLWDAARRAHPGY + TVANVCWWYAMGADTDWTVTPRPVYYADGRKEPDCYTRPVELHDELTDALGTFPLFHFW + GPGADLVSSRWIIDATRHLNRTRHPDLTLCYLPHLDYDLQRFGPRDPRSLRAAAELDAA + LGPLLDEAEAEGRTVVVLSEYGITEVSRPVDINRALRRAGLLEVHTQDGMEYLDPMASR + AFAVADHQLAHVYVRRPEDLARVREVLEGLDGVAELLGDEGKKAHGLDHPRAGELVALA + APEAWFTYYYWLDDERAPDFAQLVEIHRKPGYDPAELFLDPLDPYVKLRAAGALARKKL + GMRYRMAVVPLDPAPVRGSHGRLPARPEDGPVLLCSRPGALPGEVAATEVKSLLLGLAG + LAEVPATG" + gene complement(38832..39386) + /locus_tag="SLNWT_RS23725" + /old_locus_tag="SLNWT_5153" + CDS complement(38832..39386) + /codon_start=1 + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1111:GCN5-related N-acetyltransferase (Score: 146.6; + E-value: 1.2e-44)" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018549427.1" + /locus_tag="SLNWT_RS23725" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5153" + /product="GNAT family N-acetyltransferase" + /protein_id="WP_040253481.1" + /transl_table=11 + /translation="MYAVPLAEDAALRPLEPWQAEEFLAHMDRARPHTDPWIPWASRST + DLDSARATLQDYADKQAADTGRLYGIWRAGTLVGGVMFVHFDTRLGNCEIGVWTEPAGE + GHGLITAAVRHLIDYAFAERGMHRVEWFSSTRNARSRAVAQRVGMQLDGTLREYFPNRG + FRHDKEVWSLLAPEWPGAAAV" + gene 39465..40115 + /locus_tag="SLNWT_RS23730" + /old_locus_tag="SLNWT_5152" + CDS 39465..40115 + /codon_start=1 + /gene_functions="regulatory (smcogs) SMCOG1057:TetR family + transcriptional regulator (Score: 120.6; E-value: 1.8e-36)" + /gene_kind="regulatory" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_016328168.1" + /locus_tag="SLNWT_RS23730" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5152" + /product="TetR family transcriptional regulator C-terminal + domain-containing protein" + /protein_id="WP_163011131.1" + /transl_table=11 + /translation="MPPARGDHEARRREVSEAVWQVLAARGFGGLTLRAVAAQMGATTG + LLTHYFPGKRALLAHALDVLDRRSAERPRPAAEEAGEAAGLVMLRAMLLDILPLDAASA + ASNRIWVGSWDAALTDPELAEEHAARYRRARARMTGYVADAQRLGELPAGPAAEEIAAA + AQSFVLGLVVQALFAPGEFPPERQVALLDAHLAKAAAGADRAPGTPPVPAGES" + gene complement(40161..41249) + /locus_tag="SLNWT_RS23735" + /old_locus_tag="SLNWT_5154" + CDS complement(40161..41249) + /codon_start=1 + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1042:O-methyltransferase (Score: 297.1; E-value: + 2.7e-90)" + /gene_functions="biosynthetic-additional (t2pks) MET + (Score: 268.6; E-value: 1.8e-82)" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018383099.1" + /locus_tag="SLNWT_RS23735" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5154" + /product="hydroxyneurosporene methyltransferase" + /protein_id="WP_078845185.1" + /transl_table=11 + /translation="MPKLPPAKVVRAVEGVRAGLVKLTRLLAPPPFALLELSQGSMVTQ + ALYVAAELKVADELKDGPLTAAQLAQRVGADPESLHRLLRLLATYSVFEERADGSFKLK + PMGQALRSDTPQSMRATVLLMGHPTHWEEWAHLVDAVRTGEASLPKLRGMGAFEFIDAN + PEYGEIFTAGMGAMSETETLPLLAAYDFRRFRTIVDYGAGRGGLLAAALQQAKDARGVL + FDARIDTNGAADYLREQGVADRCTLEKGGLFDPAPAGGDAYLLKHIVHDWPEEQVIEIL + RNVRKVIDPDGRILLMEFVTPDDKPNKPHPAKLVDLWLMLLVGGKERSEKQYAEVLAAG + GFRLEKITETAAPISVIEARPV" + gene 41716..42792 + /locus_tag="SLNWT_RS23740" + /old_locus_tag="SLNWT_5156" + CDS 41716..42792 + /codon_start=1 + /inference="COORDINATES: protein motif:HMM:NF033206.1" + /locus_tag="SLNWT_RS23740" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5156" + /product="ScyD/ScyE family protein" + /protein_id="WP_159393029.1" + /transl_table=11 + /translation="MSRAHKPWAGALLAAAVVAGLTATAAPSQAAHRAGPEVLATNLNN + PRDITLQADGSILVAESGSGPATACAPGTSCLGFTGSIYRVNGSQKGRVVTGLPSKLEV + RADGGASVAGPNQVEARTGGYTVSSSFGGDAADRKALGAGGETLGTLHIAKGKVLGDLV + DHETRLDPDGPLGNNDVHSNAWMFAHHGKDYLVTDAGGNDLIRVLPDGTTKTEFVFPNN + GENETVPTGIVAAPDGSFYISDLSGQAAGKSRIWRYVPGSAPKVFATGLTNVTDLALDG + KGGLIALTLTKGYTETGPLPGALNRVDLKSGKATEIPTADRLVNSLGLAVGKGGEIYVT + NKTVGTTGELLKFPAARR" + gene 43304..43888 + /locus_tag="SLNWT_RS37105" + /old_locus_tag="SLNWT_5157" + CDS 43304..43888 + /codon_start=1 + /inference="COORDINATES: protein motif:HMM:NF019498.2" + /locus_tag="SLNWT_RS37105" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="SLNWT_5157" + /product="cupin domain-containing protein" + /protein_id="WP_040253485.1" + /transl_table=11 + /translation="MTKIILPEDRPAGRRGFEIVLPSSLTDGAASLVEAHVSEAMSGPP + LHTHAESDETYFVLGGALIMIIDGKLTELRAGGLAHISKDTSHTWATRPDEGAHFLTLH + LPGGYELYHPTALHAEHEKGGPLEQKDLFELAARFDWRLAGPPEPHRLTPTGVLVPAGK + ADAEAEATKALATAEYERALAASIEAADSGS" + gene 43945..45807 + /locus_tag="SLNWT_RS23750" + /old_locus_tag="SLNWT_5158" + CDS 43945..45807 + /codon_start=1 + /gene_functions="transport (smcogs) SMCOG1005:Drug + resistance transporter, EmrB/QacA (Score: 389.3; E-value: + 3.1e-118)" + /gene_kind="transport" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018383102.1" + /locus_tag="SLNWT_RS23750" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5158" + /product="MFS transporter" + /protein_id="WP_063778692.1" + /transl_table=11 + /translation="MSGPGSGGPGTAAVPGAAPPGAAGAPDPRRWFALVVILVAGFMDL + LDVTIVNVVLPSVLADLDAAYTHGEWIVAGYVLGFAALMITGGRLGDILGRRKVFLAGV + AGFTAASLLCGLADGPGALIAARFLQGAMAGLMVPQILAIIHVTFPAEERGKVLGIWGG + VLGAASAAGLVAGGLLAEADPYGLGWRAVFLVNVPVGAAALLAAWFLVPDSRAPERPRL + DPLGALLSAAGILLLVYPLTEGRGLGWPPWTFLLMGAAVLVLGLFVLQQRGRTRADNSP + LMSLRLFRARAFSAGMAVWALFWIALGGFFFIWTLYMQVGLGWPPLRAGLTSSAFAVGC + AAGSGTAVEFFTPRFGRKALLAGALLCGTGFLGYVLVAAHYGPAVAPWQMVAPLLVAGI + GFGLVVAPMIDAVLTEVPVREAGSASGVLGTVQQIGIALGTALAGVLFFQQLDHDAARA + VARAAPALRQELTRAEVPAAERERILDAFADCLADRAAATDPTAEPASCRGPLPSPEVR + ALVIGAGQRATADNFSRTFALTLRWGAGSMGLVFLGLFALPRRVEFRGLDGGGPGPGSG + PSVPGASEGGAAVGPGAGPASGPGKERSAPARSGGQDAGTHPAG" + gene 46203..46688 + /locus_tag="SLNWT_RS23755" + /old_locus_tag="SLNWT_5160" + CDS 46203..46688 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019359898.1" + /locus_tag="SLNWT_RS23755" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="SLNWT_5160" + /product="phospholipase" + /protein_id="WP_040253488.1" + /transl_table=11 + /translation="MRRRHVLPLAAAALAMPAALLSTGSASAAPADKPQVLSSFTQTSA + SSYNAWNAARNNQGQWAAYGFDWSTDYCSTSPDNPFGFPFETACARHDFGYRNYKAMGT + FSANKARIDSALYEDLKRVCSRYSGATKTSCDGLAWTYYHAVDIFGIKGFKQLDKAA" +ORIGIN + 1 atgagcaccg tcagggaccc gggtccgctc gccgctcccg tccgtctcgc gccgcgggcg + 61 accgccctgc gggagaccga ggcgctgtgc tcgatgccgg tgagcgccga agcggtcccc + 121 ctgctgcggc ggttcgccag ggacacctcc cggcagtggg acctccccgg cagcgcccag + 181 gaagcggcct gcgtcatcgt caccgaactc gtcaccaacg tcctgctgca cagcggcagc + 241 cgggacgtca ccctgcggat cgtgctcagc gacttcgccc tgaccgtcca tgtcgacgac + 301 gagggccgct ggaagcaccg ccctgccgcc cgcctcgcca ccgaggacgc gggcgcgcgc + 361 tgcggccggg gcctgcaact cgtcgacgcc tacgcggtcg cctgcgatgt ggaccgtacg + 421 gagcgcggga cccgggtgcg ggccgagatc gcggtcgcgg cggcctgagc cccgtacctc + 481 cccggcttcc gcgggccggc cgacggcctc aggccgcctg ggacttgagc ccgtccagca + 541 tgatgtcgat gtagcggcgc cagtccccgc tgcggcggtg cacgatcgag gtcagcccgc + 601 aggtgagcga gaggatgtcc acgctcgcca tgtcctggcg gatgctgccg ccctcctggc + 661 ccttgccgat cagcgccatg agttccgctt cgaggtcctc ccgcagcggg ctgcgcgggc + 721 cctccgagcc gaggctgccc tcggtgacgg cggtggcgaa cccccggtcg cgggactcca + 781 cttcggcgat ccgggtgagc agcagatgca gggcctggag cggctcggcg gagtcgcggc + 841 agaccgtgcg gtagtaggtc aggatctccc cgaagcgctg ctggcccgcg gcgatgacca + 901 tggcctcctt ggtggggaag tgccggtaga gggtgccgat gccgacctcg gcccggcggg + 961 ccacctcgtc catggacacc tcggcgccgc gctccgcgaa gagctcccgc gcggcgttga + 1021 gcacgcgggc ccggttgcgc tcggcgtccg cgcggagccg gggacgggtg ctctgcgcct + 1081 tctcggcgcc ggtcgtcttc tcgctgcctg ccgccatgcg gaacctcctt ccggttgact + 1141 ctactatgcc ccctccgggc ccctcggcgg agcgggcaat cggccaactt gcacacccgg + 1201 cggacgattt ggggtggttg ggtgatcaac cgcgggccgc cgggcggtgg ttgacacccc + 1261 ttcgcgctct cgcctgtact gaaatatcgg aagcggagtc cgattcccgt accggtggcc + 1321 cgagtcggcg ccgccggtac cggtcgcacc cggcggcccg tccgcggcgg caggaccgga + 1381 caggggaacc aagggaacag ggaaggacgt 
acacgatgtc gatgtcccgg gaacgggcga + 1441 gcgcgccgcg ggtgacgccc tcggtggagg ccttcctcgc cgagccgcac ctggccaccc + 1501 tgaccacgct ccgccccgac ggcaccccgc atgtggtcgc cgtccgcttc acctgggacg + 1561 cgcggtcggg gctcgcccgg gtgatgaccg tgcgcgactc ccgcaaggtg cgcaatgtgc + 1621 tcgcggcgcc gggcggccgg gccgcgctct gccaggtcgc cgggttcaaa tgggtcaccc + 1681 tggagggcgc cgccaccgtg tccgaggacc ccgtacgggt caccgagggc gcccgccgct + 1741 acgccgcccg ctacctctcg ccgccgccca atccgccggg ccgggtcgtg gtcgagatcg + 1801 ccgtggaccg ggtgatgagc ctcaacagct gagcgggggc gggcacttcg gccgccgtgc + 1861 gcggatccgt acgcgaggtg tgagcgcgta cggatccgtg cgggacgtag cggtacgcgg + 1921 aggaagcggg gcgcccgggc ggcgccccgc ttcccgtgtg ccgggggagg aggcgcgggc + 1981 ccgcccccgg cggacgggcc cgcgccggag cgctacctgc ccccgccgcc cggcggggtg + 2041 ccgtgcttcc acatcaggcg gaagctcagc gcggacagcc gccagccctc gggggtcctg + 2101 cgggcgcggc cgtccacgaa ggtgccggtc cggaagagcg ggcccagctc cgcggcgttc + 2161 tccggccggt ggacgtgggt cgaggtgcag ttggcgcgca gccgggccgt gtcgcccccg + 2221 ccctcgatct cgacgaaggc gtgggtgccc atgtgctggg tacaggtgaa ggcgtccagg + 2281 gtgcgctggt ggaaggcgcc catgcccgcg gcgccctggt ggccgccgac cgggaaggtg + 2341 accgaggcgt cctcggtgaa caggctccgc gtccagtcgt cgtccagctt ctcgtcgtcc + 2401 agggtgatca ggtaccggtc caggagtccc gcgatttcgg cggtcgattc gcttggcgtc + 2461 atacctgaag gattgcccgc cattcgtggc ctgccaggct tcctgtcacg gatctgacgt + 2521 tcctgtcgaa ggcctgtagt agccacccca aggcctgtac ttgacgactg tttacccctt + 2581 gccgcattcc tgggaagaat gaggcaacac cgtcgggaga gggcagatgg aaaactttga + 2641 cgcggacgtg atcattgtcg gtgccggtcc cacaggactg atgctcgccg gggaactcgg + 2701 gctccacgga atttcggccc tcgcggtcga caggctcgaa gaaccgatcc agcagtcccg + 2761 cgccctcggt ttctccgcgc ggaccatcga ggaattcggc cagcgcggac tcctcgcccg + 2821 tttcggtcag gtcgacgtca tcccgttcgg gcatttcggc ggagtgccgc tcgatttcca + 2881 gatcgtcgag ggcggttcct acggggcccg cggaattccg cagtcgcgca ccgagggcgt + 2941 cctcgccggg tgggcccgcg agaagggcgc cgagatccgc cgcggcgtcg aggtcaccgg + 3001 cctcgacgac gacggcgagg gcgtcaccct ccaggtgcgc accggcgagg 
gcgagtcccg + 3061 gctgcgcggc cggtacgtgg tcggctgcga cggcgcccgc agcgtcgtcc gcaaggccgc + 3121 cgggatcggc ttcccgggca gcgaggcgga gatcgagctg cgcttcgcgg acatctccgg + 3181 gatccagctg cgcccgcggt tcatcggcga gaaggtcccc ggcggcatgg tgatggtgct + 3241 gccgctcggg cccgaccgca gccgcatcat ctacttcgac cgtacgcagc cgctgcgcga + 3301 gtcggccgag ccgatcacct tcgaggaggc ctccgaggcc ttccagcggc tgtgcggcga + 3361 ggacatcagc ggcgccaccc cgcactgggt cagctccacc accgacgtca gccgccaggc + 3421 ggaggcctac cgcagcggcc gggtcttcgt cgcgggcgac gccgcccaca tccatctgcc + 3481 gatcggcgcc cagggtatga gcgccgggat ccaggacgcg gtcaacctcg gctggaagct + 3541 cgctctggac ctgaagggca gggcgcccga ggggctgctc gacacctacc acgaggagcg + 3601 gcacccggtc ggccgccgca tcctcgtcaa caccctcgcc cagcgcagcc tctacctcgg + 3661 cggcgaggag atgaagccgc tggtcgacgt gatgggcgag ctggccgggt acgaggtggt + 3721 ccgcaagcac ctggtcggca tggtcaccgg cctcgacatc cggcactcca ccgtccccgg + 3781 cgagcacccg ctgctcggcc gccgcctgcc cgaccgcgag ctggccgtcg gcggcgagaa + 3841 gaccaccgtc ttcgccctgc tcaccgaggg ccggggcgtc ctgctcgacc tctccggcag + 3901 cgccgaggcc cgcaaggcgg ccgagggcca cgccggccgc gtcgaggtcg tcaccgccga + 3961 aagccacggc atcggcgccg agttggacgc cctgctggtg cgccccgacg gctatgtcgc + 4021 ctgggtcgcc cccgcgggct cgggcgccga ggggctcctg gaggccctcg accactggtt + 4081 cggcgccgcc gactgagccg cccggggccc cgccccgcca cgtaccccct gctctcccac + 4141 cctccgagaa ggaagcgacg acagcatgcc caagatctcc accgaagacg gctacctgac + 4201 cgtgctcaac ctcttcaccg cggacgcccc cgagaagcag gagaagctgc tcggtgagat + 4261 gcgcaagatc gtcgacgccg ccacctacga gggctggatc tccagcaccg tgcacgcggg + 4321 cgtcgaccag ccgggcaccg cgaacttcat ccagtggcgc agcggcgagg acctcgaaaa + 4381 gcggtacgcg ggcgaggagt tcaagcaccg cacgctgccg gtcttcggcg agatgaccac + 4441 ctcgatccgg ctgctgcaga acgacatcgt ctacacccag cgcgccccgg agctgaacgg + 4501 cgtcaccgag atctccccgg accgcgacga ctacaccgtc atcacggtct tcggggtgga + 4561 gaaggagaac caggacgcgc tcgtcgaggc gctctcccag gaccacttcc tgaaggtcga + 4621 cggctaccgc tcgcactccg tcctcaaggg ccgggccgcc cgcggcctcg aaggctcctt + 4681 cgtggtcgcc 
tactcccagt gggcgagcaa ggaggcctac gacgccttca actcccagcc + 4741 ggagggcgag cgttcggccg agcgcaagga ggccgaggcc accgtccgct cgctgatcac + 4801 ctcggtggac tccaacacct accgggtcgt gcacacccgc gccgcgggcg agtgacccac + 4861 cggcccggcc cgggagttcc gggccggcca gccgcggcga cgcccggccc ccgacggggc + 4921 cgggcgttcg ccgtcgttcc gcaccgaagg cccgggccgg acgccgcccg gccccaactg + 4981 ccgtcatctc aacggggaga agacatgttc acgcgcagaa ccgcactccg ctccggcgcc + 5041 gccctcaccg gcaccctcgg cgccgccggg ctcgccgtac cgctgctcgg cggcaccgag + 5101 gccggggccg ccgcgcccgg ggaggccgcc gggcaggccg gggccggggc cgccggcttc + 5161 gacgtctcgg cgctggtgaa gttcacccgg ccgctgcccg cgctgcccgt gctgagcccg + 5221 cgccgccgca ccgcccgcgc ggagacgtac gaactgcgcc agcgggagac ggagtgcgag + 5281 atcgtgccgg gcctgaagac ccgggtgcgg accttcgacg gctgcttcgc cccgccggtg + 5341 atcaaggcgg tacggggccg ccgcaccgtg atccggcagg tcaacgagct gaccgtgccg + 5401 acctcgatcc atctgcacgg cgggcatgtg cccgagtcca gcgacggcgg gccgatggac + 5461 ctggtccagc cgggcgcgag ccgcacgtac acgtacccca acgagcaggc gcacgccaac + 5521 ctctggttcc acgaccacgc ccaccaccag gagtccgaga ccgtcttccg cgggctgacc + 5581 ggccttatct gctcaccgac gagaccgagc agcggctgcc gctgccctcg ggcgcctacg + 5641 acgtgccgat cgcgatccgc gacatccgcc tcgacgaggc cgggcagatc gtctacgcca + 5701 tgaacgacgg caaggaccgc aacctgatgc tggccaacgg cgtcgcctat ccgtatctcg + 5761 ccgtcgccgc ccgcaagtac cgcttccgga tcgtcaacac ctccaatctg cgcaccctcg + 5821 acctgcggct ctccgacggc tcctcctatg tgcagatcgg ctccgacggc ggactgctcg + 5881 cccggccctt caccacctcc tcgctcaccc tctcgtccgg tgaacgcgcc gatatcgtgg + 5941 tcgacttcgc gcggtacgcg gccggcacca ggctcgtcct gaagaacgcg gtggccagcc + 6001 cgcccgggcc cgaggaccag atcggcgacc tcctcgaatt ccgggtcggc gacagggccg + 6061 aggaccgcag ccggatcccg gacaccctgc ggtcgctgcc gccgctcccg ccgccggacc + 6121 gcacccggga gatcgagctc ctgatgggcg cggacggcac tggtctgatc gacggcaagg + 6181 cctaccagga agggcgcgtc gacgcccaga tccccttcgg ctccaccgag ttgtggtcca + 6241 tccgcaacgc caacgaccgc ggcagccaca acttccatgt gcacctggtg cagttcaggg + 6301 tggtggagcg caacggccag ccggtgacgg 
ccggtccgga gagcggcctg aaggacaccg + 6361 tccggctcgc cccgggggag acggtcaagg tgcaggccac cttcggcggc taccgggggg + 6421 acttcgtcta ccactgccac atgatcgacc acgcggccat ggggatgatg gccaccatgc + 6481 gggtcggctg agcgggcggg gccgcgccgc tccgagccct ggcgccacgg gggcgtgccg + 6541 gtgtaccggt acgcccctgg gccatgcccg gaaaccggcg cgcaccccgg cgcccgtacc + 6601 ggcccgggcg ccccggctgt cccggcacca ccccgcgcac ccgctcgcgc ccccgcccca + 6661 gccgcctccc gggtggcgtc cggtcacttc cctgacccgt ccgtgccgct tcctgacgtt + 6721 cgcctggcgg tcctctgaca ttgcgggggc ggctctgcgg tacctgacga ttccgtaccg + 6781 agaaatgcac aagggcgcct tgtaggacgc gggctttgga agaaccattt accacaccgg + 6841 gcgatgtcac cggggggcgg cctccggtaa ggcacttccc cgccactcct tttcaccgag + 6901 tgccggaaaa gtgcctgcgg cgggccgcag aacaccgccg agctcccatg ggcggccgaa + 6961 tggattcgtg aatgcaattc ccgggccggt ttgtgtctcc ggcgcggggg cggcgctttc + 7021 gcgggcgcag ccgagtgccg cacagaccgc aactgccaag gagcgagaag atatgcacag + 7081 cacgctgatc gtcgcccgga tggacctcgg ttcgagcaag gacgtggccg ggctcttcgg + 7141 cgaattcgac gccaccgaaa tgccgcaccg catggggacg cggcgccgcc agctcttcgc + 7201 gtacaagggc ctgtacttcc acctccagga cttcgacgag gacaacggcg gtgagcgcat + 7261 cgaggaggcc aagaccgacc cgcgcttcat cggcatcagc caggacctca agcccttcat + 7321 cgaggcctac gaccccgcca cctggcgctc cccggccgac gcgatggccc agcgcttcta + 7381 cacctgggag gcgtgaggtg cccgggcgca gagtcgtgat caccgggatg gaggtcctcg + 7441 cccccggtgg tgtcggcacc aagaacttct ggagcctgct cagcgagggc cgcaccgcca + 7501 cccgcggcat caccttcttc gatcccgcgc ccttccgctc ccgggtcgcc gccgagatcg + 7561 acttcgaccc gtacgcgcac gggctgagcc cgcacgaggt gcgccgcatg gaccgcgccg + 7621 cccagctggc cgtggtcgcc gcccgcggcg ccctcgccga cagcggcctg gagaccgcgg + 7681 ccctggagcc gcaccgcacc ggcgtcaccg tcggcagcgc ggtcggcgcc accatgggcc + 7741 tggacgagga gtaccgggtg gtcagcgacg gcggccggct cgacctggtc gaccacgcct + 7801 acgcggtgcc gcacctctac aaccacctgg tgcccagctc cttcgccgcc gaggtcgcct + 7861 gggcggtggg cgccgagggc cccagcaccg tggtctccac cggctgcacc tcgggcatcg + 7921 acgccctcgg ctacgccctg gaactggtcc gcgagggctc ggtggacgtg 
atggtcgccg + 7981 gggcctccga cgcccccatc tcgcccatca ccatggcctg cttcgacgcc atcaaggcca + 8041 ccaccccgcg ccacgacgac ccggagcacg cctcgcggcc cttcgacggc acccgcaacg + 8101 gcttcgtgct cggcgagggc agcgccttct tcgtcctgga ggagtgggag tcggcccgcc + 8161 gccgcggcgc gcacgtctac gccgaactcg cgggctacgc cacccgctcc aacgcgtacc + 8221 acatgaccgg actgcgcacc gacggcgcgg agatggccga ggcgatccgg ctcgccctcg + 8281 acgaggcgcg gctcgccccg gaggccatcg actacgtcaa cgcgcacggc tccggcacca + 8341 agcagaacga ccggcacgag acggccgcct tcaagaagag cctcggcgcg cacgcctacg + 8401 cgaccccggt cagctccatc aagtcgatgg tgggccactc cctcggcgcg atcggctcca + 8461 tcgagatcgc cgcctcggcg ctcgcgatgg agcaccacac ggtgccgccg accgccaacc + 8521 tcaccacccc cgacccggag tgcgacctcg actacgtccc cctgcacgcc cgcgagcagc + 8581 gcaccgacgc ggtgctctcg gtcggcagcg gattcggcgg cttccagagc gcgatggtgc + 8641 tcgcccgccc ggagaggagc ccggcatgag cgcaccggcg gtcatcacgg gaatcggtgt + 8701 cgccgcaccc aacggcctgg gcctgcgcga ctactgggcc gccaccctcg gcggcaagag + 8761 cggcatcgcc cgcctcaccc acttcgaccc ctccggctat ccggcccaac tcgcgggcga + 8821 ggtacccggg ttcgtcgccg aggaccacct gccgagcagg ctgatcccgc agaccgaccg + 8881 gatgacccgg atggcgctcg cggcggccga ctgggcgctg gccgacgcgg gcatcacccc + 8941 cgccgaactg ccctccttcg acatgggcgt ggtcaccgcc agctcctccg gcggcttcga + 9001 gttcggccag ggcgagctgc gcaaactctg gagccagggc agccagttcg tctccgcgta + 9061 ccagtccttc gcctggttct acgcggtcaa cagcggccag atctccatcc gcaacggcat + 9121 gaagggcccg agcggggtgg tggtcagcga ccaggccggc gggctcgacg ccctcgccca + 9181 ggcgcggcgg cagatccgcc ggggcacccc gctgatcgtc accggcgcgg tcgacgcctc + 9241 gctctgcccc tggggctggg tggcgcagct ctccggcggc cggatgtcca ccagcgccga + 9301 ggcggcccgc gcctatctgc ccttcgaccg ggaggcccgc ggctatgtgc ccggcgaggg + 9361 cggcgccatc ctgatcatgg aggacgccga ggcggcccgc gcccgcgggg cccgggtgca + 9421 cggccggatc ctcggctacg gcgccacctt cgacccgagg ccgggcagcg gacgcccgcc + 9481 cgcccttcgc cgggccgcgc agacggcgct cgcggacgcg ggcgtggacg ccgccgacat + 9541 cgacgtggtc ttcgcggacg ccgcgggcga accggccgcc gaccgcgccg aggccgaggt + 9601 gctcaccgcg 
ctcttcggga tccgcggcgt cccggtgacc gcgccgaaga ccatgaccgg + 9661 gcggctgtac tcgggggccg cgccgctgga cgtcaccgcg gccctgctcg ccctgcgcga + 9721 ccaggtgatc ccgccgaccg tgcatgtgga gccctgcccc gagtacgggc tcgacctcgt + 9781 cctcgcccag ccgcgccccg cgaagctgcg caccgcgctg gtcctcgccc gcgggcacgg + 9841 cggcttcaac tccgcgctcg tggtccgcgg tcccgagtga accaccctgc cccgccgcgc + 9901 agttgagtgc gcgtcagctc cccgtccccg cgccgccccg ctcgccccgt gacatcccga + 9961 tggaaggaca ccccatggcc accgccgcgt tcaccctcga cgacctgaag cggatcctgc + 10021 tgcaatccgc cggcgccgcc gagggcgtcg acctggacgg cgagatcctc gacaccgagt + 10081 tcgaggtcct cggctacgaa tccctcgccc tcctggagac cggcggcgcc atcgagcgcg + 10141 agtacggcat ctcgctggac gacgaggtca tcaccgacgc ggagaccccg cgcgccctca + 10201 tcgacgccgt caacgcccac ctgtccaccg ccggtgcggc ctgagccgaa ggagccttca + 10261 ccatgaccga gaacacccag gaacacggcc gcctcgccct cgtctcgggc ggcaccagcg + 10321 gtatcgggct ggcgagcgcg cggctgctcg ccgagcaggg gcaccgggtc ttcctcggcg + 10381 cccgggacgc cgaccgggtc gcggcgaccg tcaaggaact ggccggcgag ggcctgccgg + 10441 tggacggcac cgtcctcgac gtgcgcgagg acgcctccgt acgggccttc gtccaggccg + 10501 ccgtggaccg cttcggcacc gtggacgtgc tggtcaacaa cgccggccgc tccggtggcg + 10561 gggtcaccgc ggacatcccc ttcgagctgt gggccgatgt catcgagacc aacctcacca + 10621 gcgtcttccg gatgaccaag gaggtgctga acgcgggcgg catgcgtgcc aagagccggg + 10681 ggcggatcat caacatcgcc tccaccgcgg gcaagcaggg tgtcgtcctc ggcgccccgt + 10741 actcggcctc caagcacggt gtcgtcggct tcaccaaggc gctgggcaac gagctggcgc + 10801 cgaccgggat cacggtgaac gcggtctgcc ccggctatgt cgagacgccc atggcccagc + 10861 gggtgcgcca ggggtacgcc gacgcgtacg acaccagtga ggaggccatc ctggagaagt + 10921 tccaggcgaa gatccccctc ggccgctact ccacgcccga ggaggtcgcc ggactcgtcg + 10981 gctacctcgc ctccgacacc gccgcctcgc tcacctccca ggccctcaac gtctgcggcg + 11041 gactgggcaa cttctgacgt ccgtacggcg atccccgcac cccttcatct gtctggagtt + 11101 gtggctatga cgacccgtga ggtcgagcac gagatcacca tcgcggctcc ggcggcggcc + 11161 gtgtaccggc tgctcgccga ggtggccaac tggccccgca tcttcccccc gaccctctac + 11221 gtggaccgcg 
aggagctggg cccggggcag gagcggatcc acatctgggc caccgccaac + 11281 ggcgaggcga agaactggac ttcgcaccgg acgctggacg aggacgccct gcgcatcacc + 11341 ttccggcagg aggtgagtcc ggagccggtg gcggagatga acgggacgtg gatcatcgag + 11401 ccgcagggcg cctcgtcctc gcgggtgcgg ctgctgcacg ccttcaaggc gatcggtgac + 11461 gatccgcacg acctgctgtg gatcgagacg gcggtcgaca agaacagcac caaggaactg + 11521 gccgggctga aggagaacgt cgaactcgcg catgcagccg aggagttgac gttctcgttc + 11581 accgacacgg tccgtatcga cggtgcggcg aaggacgcgt acgacttcat cgaccaggcc + 11641 gacaagtggg acgaacggct cccgcacgtg gcgcgggtgc ggctcaccga ggacaccccg + 11701 gggctgcagg agctggagat ggacaccagg gccaaggacg gctccaccca caccaccaag + 11761 tcctaccggg tgaccttccc ccaccaccgc atcgcctaca agcaggtcac cctgcccgcg + 11821 ctgatgaccc tgcacaccgg gatctggacc ttcgaggagg accccaccgg cacccacacc + 11881 acggcctcct cccagcacac cgtcaccctg cgcccggaga acatcgagaa gatcctcggc + 11941 cccgacgcga ccgtcgccga cgcccgcgcc tatgtgcaga gcgcgctgtc caccaacagc + 12001 accgccaccc tcggccacgc caagaaccac gcggagcgcc agggctgatg gacaccgcgg + 12061 accgcctgga gacccaggtc atcatcgtcg gcgccggtcc ggtcgggctc ctgctcgccg + 12121 gtgaactccg cctgggcggc gccgaggtgg tggtgctcga acagcgcgag gcgcccacga + 12181 ccgagtcgcg ggcctccacc ctgcacgccc gcaccatgga gatcctcgac agccggggac + 12241 tgctggccgg cctcggcacc ccgccgcagg agccgcgcgg ccacttcggc ggcatcccgc + 12301 tcgatctgac gctgcccagc cgctacccgg gccagtggaa ggtgccgcag ttccgcaccg + 12361 aggaactgct ccaggagtgg gcgctcggcc tcggcgcgga catccgccgc ggccaccagg + 12421 tgcacgcgct gaacccgggc gaccaggcgg agtacgtcga ggccgaggcc accggacccg + 12481 gcggcaggcg cgtcctggtg cgcggccgcc acctggtggc ctgcgacggc gaggagggca + 12541 ccgtccgcag gctgaccggg gtggtcttcc ccgggcagag cgccacccgg gagctgctgc + 12601 gcgccgacgt ggacggcatc gacgtacccg atcggcgctt cgagcggctg ccgcggggcc + 12661 tggccatcgc cgcccggcgg ggcgacgggg tgacccgggt gatggcccat gtcttcggct + 12721 cgaccgccca accccgcacc ggggaggccg agttcgggga ggtcgtggcg gcctggaagc + 12781 aggtcaccgg ggaggacatc tccggcggca ccccgctgtg ggtgaacacc ttcggcgacg + 12841 cctcccggca 
gctggtgcac taccggcgcg ggcgcatcct cttcgcgggc gacgccgccc + 12901 atgtgcagat gccgatcggc gggcaggccc tcaacctcgg cctccaggac gccttcaacc + 12961 tcggctggaa gctcgcccgg cagctgcggg aacccggcgg ggaggcgctg ctcgacagct + 13021 accacaccga gcggcacgcg gtcggccgcc gggtcctcgg caacatcaag gcccaggcca + 13081 tgctgctgct cggcggcccc gaagtggagc cgctgcgcac cctgctggcc gaactcatcc + 13141 gccacgagaa ggtccgcgcg cacctggccg ggatgatcag cggactcgac atccgctacc + 13201 aactcccggg ccccgcgcac cccttgctcg gcgcccggct gccgcacacc gtcctgacga + 13261 gtcctcaggg acgggtgtcc gtcagcgagt tgctgcgcac cggacgcgga gtgtggatca + 13321 acccgggcgt ggacgtgccg gacggggccc gtctcagcac gctcaccggc cgccccgagg + 13381 aggggccgct gaccgacaag gactccgtcc tggtgcggcc cgacgggcat gtcgcctggg + 13441 cgggctccac cgggacccca ccgcccgccg aggcactcgg gcccgggtgg gaagccaccg + 13501 cctgaggaga cccaccgccc cgaaggcacc gcccccactg tgccgggcac cacccgcacg + 13561 cccacacctc acgaagggac cgaaaccatg gcagggacag cacaggggac cgcggtggac + 13621 gccgatgtca tcatcgtcgg cgccggaccg accgggctga tgctcgccgg tgaactccgg + 13681 ctcggcggcg cccgcgtcat cgtcgccgaa cggctcgccg agcccaccgg gcagtcccgc + 13741 gggctcggct tcaccgcccg cgcgatggag atcttcgacc agcgcgggct gctgccccgc + 13801 ttcggccagg gcgagaccct ggagaccagc ccgatgggcc acttcggcgg cctgcagttc + 13861 gacttcacca ccctgcccgg cgcccacttc ggcgcccgcg gcatcccgca gtaccagacc + 13921 gaggcggtac tggaggagtg ggcggccgga ctcggcgcgg acatccgccg cggctgggag + 13981 ttcctggagc tggccgaggg cttcctcacc ggcgagggcg tcgaggtcac cttcggcacc + 14041 cccgagggcg tacgcaccct gcgcgccgcc tatctggtcg gctgcgacgg cggcggcagc + 14101 caggtccgca aggcggccgg tttcgccttc cccggactgc ccgcgacccg cgcgatgttc + 14161 ctcgccgatg tcaccggcct gaacctcaag ccccgcttcc tcggcgagcg cctgccgcac + 14221 gggatggtga tggcggcccc gctcgccgag ggcgtggacc ggatcatcgt ctgcccgcac + 14281 ggcacccccg cccgcgaccg cgacgagagc gtcaccttcg aggaggtcgc cgccgcctgg + 14341 cagcacatca ccggcgagga catcagccac ggcggcgccg actgggtcag ctccttctcc + 14401 gacgccgccc gccaggtcga cagctaccgc cgcggccggg tgctgctcgc cggggacgcc + 14461 gcgcacatcc 
acctccccgc cgggggccag gggctgagca ccggggtgca ggacgccgcc + 14521 aacctcggct ggaagctggc ggccaccgtc gccgggcggg cgcccgcggg gctgctcgac + 14581 agctaccaca ccgagcggca cgcggtcggc agccgcctgc tgatgaacac ccgcgcccag + 14641 ggcttcgtct tcctcggcgg cgaaccggcc gacccgctgc gcacggtctt cgccgaactc + 14701 ctcggccacg aggaggtcaa gcagcacctg gccgggatcg tcagccacct cgacgtgcac + 14761 tacgcggccc ccgagggcgc ccacccgctc accggccacc ggctcggcga gcacatcctg + 14821 gtcggcaagg agggcgagag cgctgtcttc gccgaactgc acggcgggcg tggcctgttg + 14881 ctcgacctcg ctgacgacgc cggggtccgc gcggcgggcg cgggactgac cgaccggctc + 14941 accaccgtca cggccaccct caagtccgcc cccggcgacg ccgaccgcct cgacggcgtc + 15001 cgcgccctcc tggtccgccc ggacggctat gtggcctggg cgggggagac caccgagggg + 15061 ctggcggagg ccgtacgccg atggttcggc gaggcctcgc ccgcctgatc ccgaccgccg + 15121 cgagcaccgg cgcccgcccg cacgggtgcc ggacccccag ggcggtgcgc cgggtacgtg + 15181 gcgcacccgg cacaccgccc gcccccctgc gaggccccgg cctcgcccct tcgaggcctc + 15241 gggagacccg gccatgacgg cgctcggcag cacgcccacc ggcgacacgg acccgcccgc + 15301 accggagccc ccggcaccgg acccgcccgt acccggcgcc ttctccaccg gggtccgccg + 15361 gatcaccctc gacgcgggcg gcctcgacct ctccgcgctg ctgagcgagc ccgagcaggg + 15421 cccgccccgg gccaccgtcg tcgcggtgca cggcggcggc atgagcgccg ggtacttcga + 15481 cgggcaggcc caccccgagc agtccctgat gacgctcggc gcccaactcg gctacaccgt + 15541 cctgtcggtg gaccgccccg gctacggcag ctccgccgcg tggctccccg agggactcac + 15601 cctcggcgag caggcggtgg tgctgcacgc cgccctcgac gacttccgcc ggcactacgc + 15661 ccacggggcc gggctcttcc tgctcgccca ctcgctcggc ggcgccctgg tgatggccac + 15721 cgccgccggg gccgaggcgg accgcgccct gctcggactc gacgtctcgg gctgcggcca + 15781 ccgctacgcc gtcgtgccgg accagggccg gaccacccga aggaacaccc tgcggcactg + 15841 gggcccgctg cggctctacc cgccgaacac cttcgccacg agcaccggcc tggtcgcccc + 15901 ggtcccggcc cgcgaggcgg gtgaactcgc ccgctggccc gagctgttcg ccgccctggc + 15961 gccccggatc agcgtgccgg tgcggctcac cttcgccgag cacgaggcct ggtggcggca + 16021 cggcgaacag gacttggccg acctcgccgc ccaactcacc gcctcaccac gggtcctggt + 16081 ggagcgtcag 
cccgacgccg ggcacaacat cagcctgggc tgggcggccc gcgcgtacca + 16141 tctgcgctcg ctggccttcc tggaggactg cctcacccac accggccggg agtgagcggc + 16201 cgtgccgccc gccggggtct tccgcaccgc ccgccgccga gcggggcccg aggcgtaccc + 16261 ggggccgtcg gccgcacagg gcggcaggca ccgccgcccg cggacgggag gtcccctgtc + 16321 gtgacgtcca cccgcgcccc gctgcccgcg cccggcacct accagctgtg ggtcttcgac + 16381 tccctcacgg aggaggggat cccggccacc cgcgccgagg cgggacccga ggcgctcggc + 16441 cccgaggagc ggcgccgggc ccgcctcttt aggcgccccg ccgaccgcag gcagtacgag + 16501 agcgcccatc tggtcctgcg gcggctgctc gccgaccaca ccggactggc ccccgagcgg + 16561 ctggagttcg gccgcgaggg cgggcggcgc ggcaagcccc gcctgctcgg ctcgccggtg + 16621 ccggtgcact tctcgctctc gcacagccac ggcctcgtcg cgatcgccct cgccgccgat + 16681 ccggtgggcg tggacgtcca gcgggtgccg ggggcgcgca ccgtcgagcg gtgcctgccc + 16741 tcgctgcacc ccgccgagcg ggccgaactc accgccctgc ccgagtcgga gcgcccggac + 16801 gccttcgccc tgctgtggac ccgcaaggag gcctacctca agggactcgg caccgggctc + 16861 gcccggccgc tcgccgcgga ctacctgggc agcggcggcc tcgccgcccg cccgccggac + 16921 tggaccgtgc acaacaccgc cgcccgcccg gggcacgcgg cagccgccgc gctccgtaca + 16981 cccgcgaccg gatgacagcc gggcgcgtac gccaccactg ggggaaggga caccatggcg + 17041 acagccaccg aggacaccca ccacccgcgc gcactcgccg cggaactcgg cgcgcgcaag + 17101 gaggaggccc ggcagggtcc cgacccgcgg gccaccgaac gccagcacgc caagggcaag + 17161 ttgacggcgc gtgagcggat cgacctgctg ctcgacaaga acagcttcac cgaggtcgag + 17221 cagttgcgca ggcaccgggc gaccggcttc ggcctggagg cgaggaagcc gtacaccgac + 17281 ggggtggtga ccggctgggg cacggtcgag ggccggacgg tcttcgtcta cgcccacgac + 17341 ttccggatct tcgggggcgc cctcggcgag gcgcacgccg cgaagatcca caagatcatg + 17401 gacatggcgc tggccgccgg ggcgccgctg gtctcgctca acgacggcgc gggcgcccgg + 17461 atccaggagg gcgtctccgc gctcgcgggc tacggcggca tcttccagcg caacacccgc + 17521 gcctcgggcg tcatcccgca gatctcggtg atgctcggcc cctgcgcggg cggcgccgcc + 17581 tacagccccg cgctcaccga cttcgtcttc atggtccgcg acacctccca gatgttcatc + 17641 accgggcccg atgtcgtcca ggcggtcacc ggcgaggaga tcagccagaa cgggctcggc + 17701 ggcgccgagg 
tgcacgccgg tacctccggg gtggcccact tcgcctacga cgacgaggag + 17761 acctgcctcg ccgaggtccg ctacctgctg tccttcctgc cgtccaacaa ccgcagcatg + 17821 ccgccgcacc tgccgagcgc cgaccccgcc gaccggcccg gcgagcggct caccgaggtg + 17881 gtgccggccg acggcaaccg cgcctacgac gtccgggagg tgatcgagga ggtcgtcgac + 17941 gacggcgagt acctggaggt gcacgcctcc tgggcgccca atctggtctg cgccctggcc + 18001 cgcctcgacg ggcatgtggt cggcgtggtc gccaaccagc cgaacgcctt cgccggggtc + 18061 ctcgacatca gggcgagcga gaagggcgcc cgcttcgtgc agttctgcga ctccttcagc + 18121 atcccgctgg tgaccctggt cgacgtgccg ggcttcctgc cgggcgtgga ccaggagcac + 18181 gagggcatca tccggcgcgg cgccaagctc ctgtacgcct actgcaacgc caccgtgccc + 18241 cgggtctcgg tggtcctccg caaggcctac ggcggcgcct acatcgtgat ggactcgcgc + 18301 tccatcggcg ccgacatcgc gctcgcctgg ccgaccaacg agatcgccgt gatgggggcc + 18361 gagggcgccg ccaacgtggt cttccggcgc gagatcgccg ccgccgcgga ccccggggag + 18421 atgcgcgcgc agaagatcaa ggagtaccgg gaggagctgg tccaccccta ctacgcggcc + 18481 gaacgcggtc tcgtcgacga cgtcatcgac ccccgcgaga cccgcgcggt gctctgccgc + 18541 gcggtcacca tgctggccgc caaggacgcc gacctgcccc gccgcaaaca cggcaaccca + 18601 ccgcagtagc agggcggttg cccctgctca ccaggcggct gcccggctcg cggggcggtc + 18661 gccgcggctc gtacgggagc ggtcgcgcgg gcggaagcgg gcagcgcgta cggaatcggc + 18721 agcgcgtacg gaatcagcag agaggtgagg cgaatgtccg agcggaacac gggtgcggcc + 18781 ggggagccgg agagcggtga gggcggccgg gagaccccct gccgccagtt gctgagggtg + 18841 gtgcgcggca acccggcgcc ggaggaactc gccgtgctct ccgccctgtt gttcgcccgg + 18901 ctctcggcgc cggaggcaca ggcggccggt cccctggggc gggcggtggc cggctggcgg + 18961 cgccccgagc gcggctcgat gttcgacggc ccgcgcacct ggcgcggcac cggatccgcc + 19021 gcgcacccga ccggcgggcg gtagggcccg ggaggccggt ggcgggtgcc ggggtgagcc + 19081 ccgccgcccc gcgtgccccg cgacgcgcgg aggccgcgta cgcgccgggc gtacgcggcc + 19141 tccgcggccg ggagacgggc cgggggcggg gtctcaccgg ccgcccccgg ccgccggggt + 19201 caggcgtcga gggccgccac gatgccgtcc cagagggcga cccgggcgcg cagcgcggcg + 19261 gtcaccgtct cggcggcctc ctgccacttg gcctcgtcct cgccgcacag gtcggcgacc + 19321 atcgccatgg 
ccatcggggt gtgctcctcc ccgtcgacct cgatgtgccg ggccaggtac + 19381 tcgcggaagg tggcgagctt gccgccctgg tcgtcgacct tgatgacctg gtcgaacatc + 19441 tccgggatca ggtcctcgcg gccgaaggcg aaggccgcgg cccggcagtg cagcggggcc + 19501 ccctcgatga agtcgaaggt ggcgttcacg aaggtggcgg ccgccgccgg gaccgaggcg + 19561 ccgaccaggg cggtgcgcac gccctcgccg ccgcggatgc ggtccaggaa gttgttgatc + 19621 acggtgacgt cggcgcccgc ctcggccatg ccgttgacgt acagctcgaa gtggctgatg + 19681 aagccgtcgc cgagctcgtc gctctcctcg accaggacga tgtcgttgat cagccgccgg + 19741 ctctccgagc tgccctgcgg cacccagggc acgtccacgc aggtgaggct gcgctggagg + 19801 ctcttcagga gggacatgaa gtcccagacc gcgaagacat ggttctcgtt gaaggtgttg + 19861 acgtcttcga gcgttgcaag gcggtggtag atcgggtgct tcaccacttc gaggcgggcg + 19921 tcgtcgatga ctttccgcag tttctcgatg gaagcgttct ctttgcccca gtcgtagcgc + 19981 gacacagaaa tgtctcccgt ccaaagaatg ccgtgtgttc gatctgttcc agtgcgttcg + 20041 gcgagcacta tggccgcatc tcacagcgcc cggcaagggg atgtgaggac gggcaatcgg + 20101 ggtgaagcgg gcggctgacg cggtgtccca tggggttttc ccgcggcgcg ctgtgcgact + 20161 gcgggatttc cgcccttgca cgccggggtg ctcttcggcg cggtcggccg tgatcccgcg + 20221 gccgggttcc ggttctgccg ggctccgggc cgaacggctt gtcctggcag gtcagttggg + 20281 ctctgatggg ggagcggcgg tccggttccg cggcggcccg gtgtgaaagt tggaccgcgt + 20341 tgcgccccct ggccgatcgg gggaccatcg gtcgcacttc cctgcggacg gtgattgctg + 20401 tccgattacc gcgaatccag gcggcggtgt tctccgtacc gaatacggga acggcgttcc + 20461 tgcttgtccc cgaaatggga ttccgcatgc gcgcgccgac aggtcggcac accggctcgg + 20521 cgatttctgg tctcttgccg tggacgcgag agaagaagac acgaggggga cttcgaaatg + 20581 ccctgggaaa agaacgaggc ggccggcggg gagacgagcg gacgggacgc gcggatcgcc + 20641 gcacgcgccc gtgaggagaa ctggaagaag cccccgcggc gcatcgagtc cgccgagtgc + 20701 atcacctgcg acagctgcct gcgcggctgc cccgcggagt tcggcgccat cttcgaccgc + 20761 ggcctcgacg tcgtcatcat ccccgagctg tgctcgggct gcccggcctg cgtcctggag + 20821 tgccccgtcg actgcatcta cgtcgacgag gactgggcgc ccaccgacga gagcctgtgg + 20881 aagcacatcg agctgaccgc ggacggtgcc tgatgccctc accggccgaa cgcggcctga + 20941 gccgccgcga 
gatcaacgcg aggaagcggc agagccgcag acccagcagg cacggcagcg + 21001 ccgccggcgc ggcgcccggc cccgactatc cgcgcgagga cggcgtgggc ttccccgggc + 21061 tgctcgaccg cgcctggcgc gcggcgctcg ccgccgggga gctgcccgcc gcggtggacg + 21121 cgctgctcac cctcgacggg cacgtccccg gcgacatcca gctgcgcgcc ctgcgcaccg + 21181 ccgacgaggc cgccctgaag gtgctctgcg gcgcctcctg gcgcggggtg cgcgacggcg + 21241 gccaggcgtc cggcgcgtct gccgagcggg cccaagtccc gccgcaggac gcggtgttcg + 21301 acggggagat cgccctgtcc accaccggcc ggatcctggt ccgggtgccc tcgcagggcc + 21361 cgctcgcgga gagcgggaac ctggtcgccc ccgccctcca ggtgccctgg tccgcggcgg + 21421 atctcgccgc ctaccgcacc gagtcggcgc gggcggcggc ccgctactcc tcggcggtgg + 21481 tcgactgccg ccagtggctc gcggcgcaca gcacccaggc ccgcgaggaa ctgctcgacc + 21541 tgctcaagga cgccgccctg cgcaccgcgc ccttcgtgct ctaccaggag gaccggcagt + 21601 acaccaactt ccgggacccc aacaccctca ccggcaagac cctgtggccc gggcatccgg + 21661 actgcgcgct gagcagcctc gcggggctcc cgctcgacca gtggtcggac agcgaggccg + 21721 tcctggtggt ctgcctgacc ctgctggtgc gctccgcctc gtacgcgcgc atcgaggagg + 21781 ccaacggcac ccagctgacc ccggaccacg tcggccacct cctggagggg gtgcggcgca + 21841 actacaacgc gcactcccgg ggcgaggcgg tgccgcccgc cgcctcggcg cgggtggccg + 21901 acctcgacgc gctggccggg gcgctgcgcg cgcgccggac cgaggtgctc ggcgaggtgc + 21961 agctctaccg ggagatccac ggccccctga tgcacaagat cgagcggacc gccgcccccc + 22021 ggggcgcggc cgcccgccac cgcgaggccg aggtcaccgc ccgcctcacc gaggcgctgc + 22081 cgctcgcggg cgaggacctc ggcgcgctcg ccgcgcacct cgccgagtcc ccggcctggc + 22141 tgaccaagcc gcacggcgag ttccgcaccg ggctcgaggc gctggtgcac gcctcggtgg + 22201 ccgcctccac cgaggccttc gaggccgact tcgcgatgag ccgcggcatg cgctcgctcg + 22261 cggggctgcg ggaggcgctg cgggcgcagg cctgggcgga gatcaccgac tgggggatca + 22321 ccgacttctt ctgctgcgtg gtgcccgacc cggcggcccg ccgccacttc ggcgactcgg + 22381 tggaccggct ggccgacacc gcctgggcga tgtcctcccg gatgcagtac aactcctggc + 22441 acttcatcgc gggcaatctg ccgaaggtgc ccgcggtggt ggcccgggac cacttcgtcc + 22501 cgccgaccct gccggacatc gccttctact ccgaccagca ccaccacggg cacgtcgccg + 22561 ccaaggtccg 
cttcagcatc cgcagcccgc aggcggtgga gatcgacggg cgccgcttca + 22621 acggcttcat ggacctccgg ctgctgcgct gcgagggcac ccccttcggc gaacaggacc + 22681 tgctcgccgc ccaccgggtc tccgccttcg tcgccggggc caccggcctc gccgccgaac + 22741 tcgtcgccgc cggtgaggag atcgaggtca cctccttcga ctcggcctgg cacggggagt + 22801 ccgtccgcgc ggccgtgaag gcgcgcggct gagccggatg agcccgtccg aggccggatc + 22861 cgtccgcccc gtcaccagcg aggagaccca gttgaccgcc tacggcatcg ccgcgacccg + 22921 ggcgctgctc ggccgcgggg agcgcaccgc caccgagcac ctcgccgccc acctcgccgc + 22981 gatcgaggaa cgcgaccccg gcctcggcgc cttcgtcgcg gtcgcgggcg agggggcgct + 23041 gcgggccgcc gcggccgccg acgcccggct gcgcgcgctc ggcccggccg ccttccagga + 23101 ccagccgctg ctcggcgtcc cggtctcggt caaggacctc atccagaccg gtgaactccc + 23161 cacccgccgc ggctccttgc tgcccaaccg ccgcccggcc gcggacgccc ccgcggtcgc + 23221 ccggctgaag gccgccgggg cgatcgtcgt cggcaagacc accacctccg agtacggctg + 23281 gagcgccagt accgtcagcc gggtctcgcc gcccacccgc aacccctggg acccggcgta + 23341 ctcggcgggc ggctccagcg ggggagcggc ggcctcggtg gcggccggac tgtgcaccgc + 23401 cgcgctcggc accgacggcg ccggatcgat ccgcatcccg gccgccttct gcggggtggt + 23461 cggctacaag ccctccttcg ggcgggtccc ctacgtcccc gcgggcgccg accggctctc + 23521 ccacctcggc ccgctggccc gcagcgtcga ggacgtgatg gagatcgccg cggtgctgcc + 23581 gggcccgcac cgccaggacc cggactccgg tctcggcgcc ctggagtcgc gtcccgagcg + 23641 gcgcggcctc cgggtcggct ggatcgagtt cccgggcact gcgcccgagg tgcgccgggt + 23701 cagcgaacgc gccctggagg ccctggccgc cctcgggcac caccccgagc gcatcgaggt + 23761 gcccttccgc gacccgtatc cggcgctcct ggacatcctc gccgccgccg aggccgccgg + 23821 tgccgcgccc ggcgacgagg cggacggcga ccccgggcgg ctggcggtgg tacgccacgg + 23881 ccgcgggctc gacggggccg cggtgatgcg cgccgaggag gtccggatgg agctgcgcac + 23941 ccgcctcgcc gcggtgatgg agcgccatga cctcctcgcg atggccaccg tcccggtgga + 24001 gcccttcgcc ccggaggcga tcggtcccga ctgggcgagc gaccccgaga gcctgctctg + 24061 gctcgcctgg agcccggcca cctacccctt caacatgacc ggccagcccg ccgtctcgct + 24121 gcccgcgggc ctcagccgcg ccgggctgcc ggtcggggtc cagctggtgg gccccgtcgg + 24181 cgcggacgcc 
ctggtcctcg acaccgcgcg ggacctggag gcgggactcg gtccgctgcc + 24241 cgaagtaccc cagcgcgtct ccgaaaggat gctctagcga tgtacacccg caagtggtcc + 24301 cggcccgccg ccgaggacgg agtcggccgc agcgacttcg tcgccgagca cggtctgtgg + 24361 gacgagcggc agcgcgccgc ggccgcggag atcgaggccc acctcggcga agtcgacctc + 24421 atacggctgg tgttcggcga tccgcacggg ctcgcccggt ccaagacgct caccgtggag + 24481 gccttccgcg cggccctgcg cggcgggatg gactacagcc cgggcccctt cctcttcgac + 24541 accggccacg cggtcgccgt cgacttcctc tccgacccgg gcgtggacgt ccccgaactc + 24601 ctcggcgcgg gcaacttcgt ggtcgtcccc gacccggtga ccttccagct gctgcccggc + 24661 ggcgaggccc gtaccgcctg ggtgatcggc gaggagtacc tgcccgacgg aaggccgcac + 24721 ccgctctcct cccggcacgt cctgcgcaag gtgatcgcgg cctacgcggc ccaggagtac + 24781 accccggtcc tcggtctgga ggtggagtgg tacctcaccc gcaggctgga gggcccggtg + 24841 gggaacgcgg gcaacggctt cggcctccag ggggaggcac cccgggtggc ggccatgaac + 24901 ccgggctacc agttcaactc cgacaacgcc ttcgcctcgg tggccgcctt cgcccatccg + 24961 ctgagcgcgc tccttcgcca actcggcctg ccgctgcggt cgatggagca cgagtcgggt + 25021 ccggggcaga tcgagaccac cttcgcgccg atgcacgccc tggacaccgc cgacgccatg + 25081 ctgctcttcc gcaccctggt caagcagcgg gccgcgcagg gcggttacca cgccaccttc + 25141 atgtcgctgc cgcgtatcga cggcttcgac ccgagcggct ggcatgtgca ccagtcggtc + 25201 gtcgacaccc gtaccggacg caacctcttc gcccccgacg accccgcggc cccgctctcc + 25261 gccgccggac tcgcctacgc ggagggcctg ttgcggcgcg cccgcgagct gtgcctgctc + 25321 tcggtgccga cggtcaacgg ccaccggcgc ctcggctccg gcttctcgct ctcgcccacc + 25381 cggatcggct ggagcccgga ggaccgcacc gcgatggtcc gggtggtcgg cgcgggcggc + 25441 tcccggcacc tggagaaccg caccggcgaa ccctgcgcca acccctatct cgccctggcc + 25501 gcccagctgt tcgccggtct ggagggcatg aacagcgact ccctcgtgcc gcgccccgcc + 25561 ctcggcccgg acgccgcggg cgccgagacg ctgccgggct ccctcgagga gtccctggcc + 25621 gctttccgcc agggcagccc cgccgatctg ctcggcaccc cgctcgcccg ctgcctggcc + 25681 aagctcaagc agagcgagct ggaccgcttc cgcacctggg ccgagaagga gcagccgccg + 25741 gagggcgagg tcaccgagtg ggagcagcgc gagtacttcg aggccttctg acccggactt + 25801 gggggctcaa 
ctcccttaca cacacggcca gttcgtccac cgactgaggg gcagccaccg + 25861 atgattcccc gctacacccg gcccgagatg gcggaactct tctcggacca ggcacgctac + 25921 gagacctggg tgcgggtgga gatcctcgcc accgaggccc aggtgcggct cggcgccgta + 25981 cccggcagcg cccttgcgga catgcggcgc gcgcccgtgc cgctcgcctc ccgggtcgcc + 26041 gagatcgaga aggagcgcga ccacgaggtg ctctccttcc tcgccgccta ctgcgaggag + 26101 atccccgagg agtcggcccg ctgggtccac ctcggcatga ccagctacga cctggtcgac + 26161 accgcgctcg gccacaccct cgcccgcggc accgacctgc tgctcgacgc ggcccgcgcc + 26221 ctgcgccgga tcctcgccga gcgggccgtg gagcactggg acaccgtctg cgtcggccgc + 26281 acccacgggg tgcacgccga gcccaccacc ttcgggcaca agctcgccgg gtacgccttc + 26341 gcggtggacc gctcgctgac ccggctgcgg gcggcacgcg aggcggtcgc ggtgggcacg + 26401 gtctccggct cggtgggtac gtacgcgctg atcgacccgg cggtggagcg gcacgtcctc + 26461 accgcgctcg gcctcgcggc ggagccggcg ccgagccagg tggtggcgcg cgaccggcac + 26521 gcccagctgg tgcaggcggt ggccgcgctc ggcgccgtgg tcgagcaagt cgccctggag + 26581 atgcggctgt tgcagcgcac cgaggtccgc gaggtggagg agcggcgcac cggcgcctac + 26641 cagggctcca gcgcgatgcc gcacaagcgc aacccgacca ccagcgaacg cctggtcggc + 26701 ctcgcgcggc tgctgcgcgg gcacgccggc accgccctgg agaacgtcgc gctctggcac + 26761 gagcgcgacc tcgcccacca gtccgtggag cgggtgatcc tcccggacag cctgagcgtg + 26821 ggccacttcc aggtgaccat ggccaccgaa ctgctcaccc atctcgccgt cttccccgag + 26881 cggatgcgcg cgcacctgga gcagaccggc gggctcgtct acagctccgc cgtcctcgcc + 26941 gaactgctcg ccacgggcac cgaacgcgag aaggcctacc ggggtgtgca ggcggcggcg + 27001 aaccgcaccc tggcgggcgg cgcggacttc gccgccgcgc tcgccgagga ggggatcgac + 27061 ctcgggccac tgggccccga gcgcttcctc ggccaccatg atgtgatccg cgagcgattg + 27121 gagcagctac gtgacctgga agattgagcg ggtaccgggg gacggcctgg acctggacga + 27181 agtcctcacc gtctaccggg agtcggggct cggcgagcgc cgcccgatcg aggaccggga + 27241 gcgcttcgcg gcgatgctgc gcggggcgaa tctggtggtc gtctgccgta ccgaggaggg + 27301 gcggctgatc ggcatcgccc gcagcgtctc cgacttcagc tatgtcacct acctctccga + 27361 catcgcggtc agcgccgact tccagcgcgc gggcatcggg cgggccctga tcgcggggac + 27421 ccaggccgag 
acccccgggg tgaagatcgt gctcctctcg gcgccggcgg cggtcgacta + 27481 ctacccgcac ctcggcttca cccggcacga gagcgcctgg gtgctccagc cctgaacccc + 27541 cgaggaatcg ggagcaagca gagcgcggcc gtctccccgg ggaggcggcc gagcggtctt + 27601 ccctctttct ctacggtggc tcaggcgctg cccagtttga atccgacgcc gcgcaccgtg + 27661 atgatccatc cgctgtcgcc gagtttgctg cgcagactgc ttacgtgggt atcgacggtt + 27721 cggcgcgacc aggaatctcc ccatacctgc tgcagtaaac gtttgcgggg aatcacggtg + 27781 tcgggattcg aggcgagcag gtgcagaaga tcgaattctt tcctggtgag tccgacctcg + 27841 cgtccgtcca ggctcacttc ccgggagctg gcatcgatct tgaggggccc gtgctggatt + 27901 tcccgtaccc gctgcggctg ttgatggacg cgccgcatca cggcgtcgat ccgggcgagg + 27961 agttcgcgga atccataggg tttgacgagg aaatcgtccg ccccggcctg gagtccgagg + 28021 acccggtcca gctcggtccc gcgggcggtc acgatgatca ccggcaggca gctgacggag + 28081 cggatcgccc cgcatacctc cagtccgtcc aggtccggca gctccagatc gagcaggacg + 28141 agatcgatgt cctccaggga ctgcaaggcg gtgccgccct gctggacgcg cgtagtctca + 28201 tgcccgtggc ggcgcagtcg gcagaccagc gcctcggcgt agtcgctgtc gttgtccacc + 28261 acgaggatcc gctggccggt gggcagtccc gcgaccttgc gggtggtggg gccgaagccc + 28321 tcgtcctccg cgaaccgggg cgagggcatg gcacgctgaa agggaatacc agattccagt + 28381 acggcctcgg tcgagctttg tgccatgtct gtcccccgtg agtcatgagc cccgttcggt + 28441 gaactgatgg gaatccgaag cgaaacggag cgcttacctg caagacgagc ggcatcggaa + 28501 tgcagaaaca cgagcgtcgt caggcactct gcgacgcctc ccgcgtggcg tcgcacggcc + 28561 cagaacacgg ggattcaccc cgcagggcgg acgttacctg attccgtgag acttgcggag + 28621 gggaaacgga cagaagttgt caggcggaga gaatggctac atcgagaccg gcgagacggg + 28681 tggggtccgc gatgatgttc attgcggtga tgcgtccctc ggaaacggtg aagtccatga + 28741 ccacggagag ttgcctgggc gccgccgtgg ccaggccgag acgcccgtcg accagcgccg + 28801 tccgcgccag atgcgcacgt cccgagtaga gaccggcctg cgccgccacg ggctgggcac + 28861 cgacgatctc catgggggcg ccggcggggg tggcggccgc gtccacccgc agcacgacat + 28921 ccgggtcgag cagggcgagc agcgcctcga actccccgcc gcgcgccgcc gcgaggaagg + 28981 cgtcgaccac cgcgcgctgg cgcggcaggt cggagtcggg cgaggtgtcc acggcctgca + 29041 cccggcggcg 
ggcgcggctg gcgagctgac gtgcggcgac gggggtgcgg ccgacgatcg + 29101 gcgcgatctc cccgaagggc acggagaaca tgtcgtgcag gacgaaggcg atccgctccg + 29161 ccgggtcgag ggtgtccagg acgacgagca gggcgagccc gacggagtcc accagctgcg + 29221 cctcgtgcgc cgggtcggtc ggcgcggcgg cctggtcgcg cgggccgtgc tcgggcaggt + 29281 ggtcgccgag cgggtcctcc cggcgcgagg agcgcgagcg cagcatgtcc aggcagatgc + 29341 ggccggccac ggtggtcagc cagccgccga ggttgccgat ctccccggcc tcgctccggc + 29401 tcagccgcag ccaggtctcc tggaccgcgt cgtccgcctc cgccacggaa ccgagcatcc + 29461 ggtaggccac cgcgcgcaga tggggccgct gggactcgaa cttctccgcc agcgccggcc + 29521 attcgccctt gtccaccggt cacatcctcc gctcggctcc cgtcatagcg ttgacggctg + 29581 tcactcagcg tatgtgaagg gaccccgccg cagcaggttc cgcgcgcaag ccgcccggcg + 29641 gggcctccgg gctgcccgcg gccgggcgga cgagccggtg cgcgcggccg gtcctgacct + 29701 cggtaaagtc aacgaggcat atccaccggg cagttggcga gtgctcgcgc cgcagatcac + 29761 ggtgccgggc ggtgtgcgcc cccgcttccc gggcccgctg tccgtgcgcg cggccccgcg + 29821 gcggtcgccg gtcgcccggg cccgccccgc cggaaccggc cgcaggttgg ccggaatccg + 29881 cccctgccca attacccctc ctgacacggc tgttgacacc gctgagcggg gtcccctcta + 29941 atgccgctac cggaactgga ttccgcttcc gcatcgctgt caggaggtgc accttgtctc + 30001 tggccgaaca gttgacctat ccggcagtcg atctcgacga gatcgagtcg tcggccatct + 30061 ggatcgaatc gcacccgatc acccgcgtac ggatcgactc cctcgtcttc gagggctccc + 30121 cgcgtctcgg cggcgaggac cacgaccacg tacgcgtgct cgccgaagcg ggggactccc + 30181 tgcccgcgat caccgtgcac cgccccaccc tgcgcgtcat cgacggcacc caccgggtcc + 30241 gcgcggccct gctcaacggc cgtaccgaga tcgcggcccg gatgctcgac tgcgacgagg + 30301 ccgcggcctt cgtcctgtcc gtcaaggcca acgtcaccca tggactgccg ctcagccgcc + 30361 aggagcgggc cgccgccgcg gcgcggatca tcatgaccca tccgcagtgg tcggaccggg + 30421 cggtcgccgc cgccaccggg atctccgaca agacggtctc ccggatccgc tcccagtcgg + 30481 gcgccgactc cgcgcagtcc gccacccgcc tgggccgcga cgggcggctg cgcccgctcg + 30541 acagcgggca gcgccgccgc cgcgccgccg cgatgttcct ggaccgcccc gacgcgggac + 30601 tgcgcgaggt ggccagggcc accggcctct ccccggcgac ggtacgggac gtgcgccagc + 30661 gcatcgaccg 
cggcgaggac ccggtacccg gccgctaccg cacggcggag agtcccggcg + 30721 gcgccaccgc ggcccggcag cgccccgccg ccggacgcct ggaccgcagg accgtggtgg + 30781 tggaccggca gcggctgctc gccaagctca gcgaggaccc ctcgctgcgc ctcaacgagg + 30841 cgggacggcg cgccctgcgc tggctgcacc actactccgt ggacggaaac ggcatcgaga + 30901 ccctcggcca ggggctgccc tgccactggg cccccgacgt cgccgacctg gcccgcagct + 30961 gcgccgccgc ctgggccgaa ctcgccgagc agctccagca gcgcgccgag taggcaggct + 31021 gccgcaactc ccttctccac ggctcgactt cgcagcggga gagggcaggg acaccgccgc + 31081 ccgcggcacc gtcccgcagc acctcggacc tcggtcgacc ggtccgcgca ccgccccacc + 31141 tcgtacgacc cggtcccgta ccggccggct ccaccccgca ccaccggact cccgggcgag + 31201 ccgccccgcg actcccgcac ctgagcacct cccggaccgc gcaccgcgcc tcccgcgccg + 31261 ccgccccgcc ggtcccgttc cgcgcaccgc cgctcgtgca ccgccgctcc gcgcaccgac + 31321 tgcgtcaact gccctccccg gcagcgcact tggcaccacc ggctccccgc accccgcagg + 31381 cgcgccacac ccgcaccgcg caccgccccg caccgcgtac cgccgcaccg cgcacctccc + 31441 gtaccgcgta ccacgtaccg ccgcaccgcg caccgccccg cacccacccg caccgccaga + 31501 gccccacacg ctcagcaccg ccctatccgc taccgggccc caccccggag ccgtcccagc + 31561 cgctccacgc tccaacgcct ctgcccaccc gggtggttga gcctctttcg gccacccgtc + 31621 ggcggtgccg aggggcggtg ggcgcggggc gggaaccgac gtcatccagg aggcatcccg + 31681 tgtcccagca ccccgagaag gccggtccgc ccggtgcccc tgcgagcggt cccggtaccg + 31741 gtgtgtggtt catcggggcc aggggctccg tcgccaccac cgcggtgacc ggcgcggcgg + 31801 cgctcgccgc cgggctccag ccgccgaccg gactggtcac cgaggcaccg gagttcgcgg + 31861 gcagcgggct gcccgcgctg tcctcgctcg tcttcggcgg gcacgacacc gccgactggc + 31921 cgctgcccaa gcgcgccgag gcgctggccg agggcggggt gctgccgcgc gggctcgccg + 31981 ccgcggtgca gcgcgaactc gccgccgccg acgaggagat ccgccccggc ggaccgctgc + 32041 ccggcgaccg gcgcggcgac gaggagctga tcgccgactt cgccgccgac atcgcggact + 32101 tcacccgccg caccggggtg gcccgcacgg tcgtggtcaa cctggcctcc accgagcccc + 32161 tgcccgaacc caacagcgcc cggctgcccg ccagttcgct gtacgcggcg gccgccctgc + 32221 gcgccggtgc ggcctacgtc aacttcaccc cctcggcggg gctgcaccac cccgcgctcg + 32281 ccgaggccgc 
ggccagcgcc cgggtcccgt acgcgggccg cgacgggaag accggccaga + 32341 ccctgctgcg ctcggtgctc gcgccgatgt tccggcagcg cgccctggac gtgcgggcct + 32401 ggtccgggac caatctgctg ggcggcggtg acggcgccgc cctcgccgac ccggccgccg + 32461 ccgaggcgaa gaacgcgggc aagaaccggg tcctggagga caccctcgga gcactgcccg + 32521 agggcgaggt gcacatcgac gaggtaccgg cgctcggcga gtggaagacc gcctgggacc + 32581 atgtcgcctt cgagggcttc ctcggctccc ggatgatcct gcagaccatc tggcagggct + 32641 gcgactcggc gctcgccgcc cccctggtcc tggacctggc ccggctcgcc gcccgcgccc + 32701 aggaggccgg gctcaccggg caactccccg cgctcggctt ctacttcaag gaccccgacg + 32761 gcggctcctc ggccctggcc gagcagtacg ccgcgctcct cgccttcgcc gcgcggctcg + 32821 gggcccgtcc tgcggaggcc tcgtgagcac cccccgcgac tgggccgaac tcctgcgcgt + 32881 ctccgccctg ctgtccgtgc ccggcgacgc cctcgcgggc gccgcggcca gccgccggcg + 32941 ccccaactcc cgtaccgcgc ttgccttgtg ctcctcgctc tgcctctacg aggcgggcat + 33001 ggcgctcaac gactgggcgg accgcgcgga ggacgccgag gagcgcccgc accgcccgct + 33061 gccctcgggc cgcatcgccc ccggcgccgc gctcgccgcg gcggccgggc tgaccgccgc + 33121 cgggctcggc ctcgccgccc gcgccggacg ccccgccgcg ctgtgcgcca ccgccctcgc + 33181 gggcgccgtc tgggcctacg acctgcgcct gaagcacact gcggccggtc ccgccgcgat + 33241 ggccgccgcg cgcgggctcg acctggtgct cggcgccctc gccaccgcgg gcccgcgctc + 33301 cggcgaggcg gccgggagcg tgctcggccg ggcgctgccg cccgccgcgg tgctcggcgc + 33361 ccacacctgg gcggtgaccg cggtctcccg cgccgagacc cagggcggct cggccggacg + 33421 gccgctcgcc gccctcggca cgacggccgc gctcggcacc ctcctcgccc ccgccggggc + 33481 ccggccgctg cgcctggagc gggcccgcag gctccccgag accccgcggg agctggccca + 33541 ggccgcgctg gccggggcct acgccgccac cgcggggcgg tcctatctgc acgccgcgct + 33601 gaacccctcg ccgccgctga cccagcgggc cgtcggcggc gggatccgcg cgatgatccc + 33661 gctgcaggcg gcgctcgccg cccgctccgg ggccctcgcc accgcggcct cgctcggcgc + 33721 gctggtcccg ctcgcccgca gcctcgcgag gaaggtcagc ccgacatgag catccgactc + 33781 ggctacggca ccaatggact caccgacctg cgcctgcgcg aggccctcac cctgctcgcc + 33841 gaactcggct accagggcgt cggcctgacg ctcgatcaca tgcatctgga cccgctggcg + 33901 cgcgggctga 
gcggccgggc caaggcgctc gcccgcaccc tcggcgcgct cggcctggac + 33961 gtcaccgtgg agaccggcgc ccgctatgtc ctcgacccgc gccgcaagca cgggccgagc + 34021 ctgctcgacc cggacccgga ggcgcgggtg gcccgcgagg cgctcctggt caccgcggtc + 34081 gaggtcgcgg cggaactcgg cgcccacgcc gtgcactgct tcagcggcgt ccggcccgag + 34141 ggcaccgacg agggcacggc ctggcagcgg ctcgccgact ccctcggccc ggtgctcgac + 34201 gcggcgcagc gcgacgggat cccgctcgcc ctggaacccg aacccggcca cctggtcgag + 34261 tcgctggccg acttccaccg gctgcgcgcg ctcctcggcg atcccgaact cctgggcctc + 34321 accctggaca tcgggcactg ccagtgcctg gagcccgcct cgcctgcgga gtgcgtgacc + 34381 gccgcggcgc cctggctgcg gcatgtgcag atcgaggaca tgcggcgcgg ggtgcacgag + 34441 catctgccct tcggcgaggg cgagatcgac ttcccgcccg tgctcgcggc cctggaggcc + 34501 agcggctacc ggggcctgac cgtggtcgaa ctgccgcgcc actcgcacgc cgggcccgaa + 34561 ctcgcccgcc ggtccatgga gttcctgcgc cccctggtcg ccgccgcggc ccgcgaggac + 34621 cgcgccgccg gggcgccgtc gccggtccgc gcccgtcccg taccactgct gaccgggccg + 34681 cccctgcggc aggaagcacc gtcccgtacc tgaggaagca ccatgccgat cactccgatc + 34741 acccctgagg aaccgcgccc cgccccggag cccgcggacg gcaccgaggc cgaactgcgc + 34801 cgagaggccg ccgagttgcg cgagcggctg agcgccgagg gcgccgactg gctggacggg + 34861 gcgctcgccg aggccgcccg ggcggcggcc gagcccgcac ccgcggagtc ccgtgcggtg + 34921 cccggctggg agctgcgctt cgcggcggcg ggccgcgcct gcgggaccga ggccgccgaa + 34981 tccgcccggg tactgctgct gcgcgccgcc cgccccggcc ccgccgccct cacccgcctc + 35041 taccggcacg gcaccggcga ggagcgccgc gccgtgctgc gggccctgcc gcggctgccg + 35101 ctcgcgccgg gggaggggct gccgctggtc gaggacgcgc tgcgcaccaa cgacacccgc + 35161 ctggtcgcgg ccgccgtcgg gccctacgcc gccgcccacc tggacgacca cgcctggcgg + 35221 cacgccgtcc tcaagtgcct gttcacccag gtccccgtgc gggccctggc ccggctgccc + 35281 gagcgggccc gcggcgacgc cgaactcgcc cgcatgctgc gggacttcgc cgccgaacgc + 35341 accgccgccg gacgcgccgt cccggccgac ctcgaccacg tactcgccct gaccgccaag + 35401 gacgcctgat gcgcatcttc gacccgcaca tccatatgac ctcgcgcacc accgacgact + 35461 acgaggcgat gtacgcggcc ggggtgcgcg ccctggtcga gcccgccttc tggctcggcc + 35521 agccccgcac 
ctccccggag agcttcttcg actacttcga cgcgctgctc ggctgggagc + 35581 ccttccgggc cgcgcagtac gggatcgcgc accactgcac cctcgcgctc aacccgaagg + 35641 aggcgaacga cccgcgctgc ctgcccgtcc tcgacgccct cccgcgctac ctggtcaagg + 35701 accatgtggt cgcggtcggc gagatcggct acgacgcgat gaccccggcc gaggacaccg + 35761 cgctcgccgc gcagctcgaa ctcgccgccg agcacggcct gcccgccctg gtgcacaccc + 35821 cgcaccgcga caagctcacc gggctgcgcc gcaccctcga cgtggtcgcc gagtcgaagc + 35881 tgcccaccga gcgggtcctg atcgaccacc tcaacgagac caccgtcaag gaggcccggg + 35941 agagcggcag ttggctcggc ttctccgtct acccggacac caagatggac gagcaccgca + 36001 tggtcgccct gctgaaggag tacggacccg aacgcgtcct ggtcaactcc gccgcggact + 36061 ggggcaagag cgacccgctg aagacccgca aggtcggcga ggccatgctc gccgcgggct + 36121 tcggcgagga cgaggtgcac cgggtgctgt gggagaaccc ggtcgccttc tacgggctca + 36181 gcggccgcct cgacctggag gtccccggca ccgaggccct gcacgagggc aactccctgc + 36241 tgcgcggggg cgaatgagcc gtgcgcttcc gccacccgga cggctccctc gtccacctcg + 36301 cctactgcac caatgtccac cccgccgagg acctggacgg ggtcctcgcc caactgggcg + 36361 cctactgcga gccggtgcgc agacgcctcg gcaccgaacg cctcggcatc ggcctgtggc + 36421 tggcccggga cgccgcccgc gccctgacca ccgaggcctc cgccctgcgc cgcctgcgca + 36481 ccgaactcga ccggcgcggc ctcgaagtgg tcaccctcaa cggcttcccc taccgcggct + 36541 tcggcgccga gaaggtcaag taccgcgtct accagcccga ttggcgggac gccgagcgcc + 36601 tggagtacac cgccgagctg gccgggctgc tcgccgaact gctgccgccg gatgtcaccg + 36661 agggcaccct ctccaccctg ccgctcgcct ggcgcagcga cttcgacgcg gccggtgccg + 36721 ccgcggccga gcggcagctc accgaactgg cccgccgcct ggacgacttg gaggagcgca + 36781 ccggccgctc catccgggtc gccctggagc cggagccggg ctgcgcggtg gagcggaccg + 36841 ccgacgccct cgccccgctc gccgcgctgc ccgcccaccg cttcgggctc tgcctggaca + 36901 cctgccacct ggccacctgc ttcgaggaac cggccgccgc cctcgccgcc ctggagcgcg + 36961 cgggcgccac cgtcccgaag gtgcagctct ccgccgccct gcacgccgag gacccggccg + 37021 acccggcggt acgggccgcg ctcgccgcct tcgacgagcc ccgcttcctg caccagaccc + 37081 gcgccctggc cgagggggtg ctgcacggca ccgacgacct gggcccggcg ctcgcgggcg + 37141 ggacgctgcc 
cgagaccgtg ccctggcgcg cccacttcca cgtaccgctg cacgcgccgc + 37201 ccgccccgcc gctcacctcc acgatggacg tcctgcgtgg ctccctcgat gtgctgctcg + 37261 gtcaagacgc cccgcgcagc cgccacttcg aggtggagac ctacacctgg caggccctgc + 37321 cgcccgaggc gcgaccggcc gacgcggcgc agctcgccga cggtatcgcc gccgaactcg + 37381 ccctcgcccg cggcctcttc cgcgacctcg gcctcaagga gctgccgtga ccgccacccc + 37441 gaccccgctg ctcgtgctcg acgtggtggg cctgacgccc gccctcctgg agcagatgcc + 37501 gcgcctgaag tcccttgccc gcaagggctc ttcggccgga ctcggcaccg tgctgcccgc + 37561 ggtgacctgc gccgcccagt ccaccttcct caccggagcg ccgcccgccg agcacgggat + 37621 cgtcggcaac ggctggtact tccgcgagct gggcgaggtg ctgctctggc gccagcacaa + 37681 cgggctcgtc gcgggcgaca agctctggga cgcggcccgc cgcgcccacc ccggctacac + 37741 ggtcgccaat gtctgctggt ggtacgcgat gggcgcggac accgactgga ccgtcacccc + 37801 gcggccggtg tactacgccg acggccgcaa ggagccggac tgctacaccc gccccgtcga + 37861 gctgcacgac gaactcaccg acgccctcgg caccttcccc ctcttccact tctggggacc + 37921 cggcgccgac ctggtctcca gccggtggat catcgacgcc acccggcacc tcaaccgcac + 37981 ccgccacccg gacctgaccc tctgctacct cccgcacctc gactacgacc tccagcgctt + 38041 cggcccccgc gacccgcgct cgctgcgcgc cgccgccgaa ctcgacgcgg cgctcggccc + 38101 cttgctggac gaggccgagg cggagggccg caccgtggtg gtgctgtccg agtacggcat + 38161 caccgaggtg tcccgccccg tcgacatcaa ccgcgccctg cgccgcgccg ggctcctgga + 38221 ggtgcacacc caggacggca tggagtacct ggacccgatg gcctcccgtg ccttcgcggt + 38281 cgccgaccac cagctcgccc atgtctacgt acggcgcccg gaggacctgg cccgggtgcg + 38341 ggaggtgctc gaagggctcg acggggtcgc cgaactcctc ggcgacgagg gcaagaaggc + 38401 gcacggcctc gaccacccgc gggccgggga actcgtcgcg ctcgcggcgc cggaggcctg + 38461 gttcacgtac tactactggc tggacgacga gcgggcgccg gacttcgcgc agctggtgga + 38521 gatccaccgc aagcccggct acgaccccgc cgaactcttc ctggacccgc tcgaccccta + 38581 tgtgaagctc cgggcggccg gtgcgctggc ccgcaagaag ctcgggatgc gctaccggat + 38641 ggcggtggtc ccgctcgacc cggcgccggt gcgcggcagc cacggcaggc tcccggcccg + 38701 ccccgaggac gggccggtgc tgctctgctc gcgccccggc gccctgccgg gggaggtcgc + 38761 cgccaccgag 
gtcaagtcgc tgctgctcgg gctcgcgggt ctcgccgagg tgcccgccac + 38821 ggggtgaggg ctcagaccgc ggcggcgccc ggccactcgg gggcgagcag cgaccagacc + 38881 tccttgtcgt gccggaagcc gcggttcggg aagtactccc gcagggtgcc gtcgagctgc + 38941 atgcccaccc gctgggcgac cgcgcggctg cgcgcgttgc gggtgctgct gaaccactcg + 39001 acgcggtgca tgccccgctc ggcgaaggcg tagtcgatca ggtgccgcac ggccgcggtg + 39061 atcaagccgt ggccctcgcc cgccggttcg gtccacaccc cgatctcgca gttgccgagc + 39121 cgggtgtcga agtgcacgaa catcaccccg ccgaccaggg tgcccgcccg ccagatcccg + 39181 tagaggcggc cggtgtcggc ggcctgcttg tccgcgtagt cctggagggt ggcccgggcc + 39241 gagtccaggt cggtggagcg ggaggcccag gggatccagg ggtcggtgtg cgggcgggcc + 39301 cggtccatgt gggcgaggaa ctcctcggcc tgccagggtt cgagcgggcg cagcgcggcg + 39361 tcctcggcga gcggtacggc gtacatggcg gtcctcagcg gtcggcgggg gcggacggcc + 39421 cgctccccgg tacataacaa acgttgggta tgtaccctac tcgtatgccg cccgcacgtg + 39481 gagaccatga agcccgccgg agagaggtct ccgaggcggt gtggcaggtg ctcgccgcgc + 39541 ggggcttcgg ggggctgacc ctgcgggccg tggccgcgca gatgggggcc accaccgggc + 39601 tgctcacgca ctacttcccc ggcaagcggg cgctgctcgc gcacgccctg gacgtactgg + 39661 accgccgctc ggccgagcgc ccgcgccccg ccgccgagga ggcgggggag gccgccggtc + 39721 tggtgatgct gcgggcgatg ctgctcgaca tcctgccgct ggacgccgcg agcgcggcca + 39781 gcaaccggat ctgggtcggc tcctgggacg cggcgctcac cgacccggag ctggccgagg + 39841 agcacgccgc ccgctaccgc cgcgcccgcg cgcggatgac cgggtacgtc gcggacgccc + 39901 agcggctcgg cgaactgccg gccggccccg cggccgagga gatcgcggcg gcggcgcaga + 39961 gcttcgtcct cggtcttgtc gtacaggcgc tcttcgcgcc cggggagttc ccgcccgagc + 40021 gccaagtcgc tttgctcgac gcccacttgg cgaaggccgc cgccggggcg gaccgggcgc + 40081 cggggacgcc gccggtcccg gcaggggagt cctgaccggg accggacggg cgcggggcgc + 40141 cgggtgcagt gcgcgcgggc tcagaccggg cgggcctcga tcaccgagat cggggcggcc + 40201 gtctcggtga tcttctccag gcggaagcca ccggcggcga gcacttccgc gtactgcttc + 40261 tcgctgcgct ccttgccgcc gacgagcagc atcagccaca ggtcgaccag cttggccggg + 40321 tgcggcttgt tcggcttgtc gtcgggggtc acgaactcca tgaggaggat ccggccgtcc + 40381 gggtcgatga 
ccttgcggac attgcgcagg atctcgatca cctgctcctc gggccagtcg + 40441 tgcacgatgt gcttgaggag ataggcgtcc ccgcccgcgg gggccgggtc gaagaggccg + 40501 cccttctcca gggtgcagcg gtcggccacg ccctgctcgc gcaggtagtc ggcggcgccg + 40561 ttggtgtcga tccgcgcgtc gaagaggacc ccgcgggcgt ccttcgcctg ctggagcgcg + 40621 gcggcgagca gaccgccgcg ccccgcgccg tagtcgacga tggtgcggaa ccggcggaag + 40681 tcgtaggcgg cgagcagcgg cagggtctcc gtctcggaca tcgcgcccat gcccgcggtg + 40741 aagatctccc cgtactccgg gttggcgtcg atgaactcga aggcgcccat gccgcgcagc + 40801 ttgggcaggc tggcctcgcc ggtgcgcacc gcgtcgacca ggtgcgccca ctcctcccag + 40861 tgggtcgggt gccccatcag caggacggtg gcgcgcatcg actgcggggt gtcggagcgc + 40921 agcgcctgcc ccatcggctt cagcttgaag ctgccgtcgg cgcgctcctc gaagaccgag + 40981 taggtggcga gcaggcgcag cagccggtgc agcgactcgg ggtcggcgcc gacccgctgg + 41041 gccagctggg cggcggtcag cggaccgtcc ttcagctcgt cggcgacctt caactcggcg + 41101 gccacgtaca gggcttgggt gaccatcgag ccctgggaga gttcgagcag cgcgaacggc + 41161 ggcggggcga gcagccgggt cagcttcacc aggccggcgc gcacaccctc cacggcgcgg + 41221 acgactttgg cgggggggag tttgggcatg cgtatcctcc gtggcggtgt cgcggaactc + 41281 gtgcctgcgg gacgtacgga ccgccgcgta cacgggggct gaactggagc cctggcgcag + 41341 gggaaagcct cgaacggagc cgttcgccgg gcggtgcccg ctcaccgaaa ccagcggtgt + 41401 cccgggccga ctgtaggggc gcctcttccc ttgcgccacc gtgtgcagaa agcccgggaa + 41461 ttgcgcaccg gcagttcggc ggagtttccg gtgagcggcc cggtgcgcct tctcgccgag + 41521 ttctcgaccg gggtgtgcaa ccgcgatatt tccgaggtcg cacacttgat ttccgaggtc + 41581 ggacacgtac cgccgcccaa atcccgggaa gagcaggcaa tttcacccgg gacggctgcg + 41641 gccgcgtacg tctatggtga cgccggtcga atgcacgccc cccattccgg gggtgtgcca + 41701 ggaaaaggga gagacatgtc aagagcacac aagccttggg cgggggccct ccttgcggca + 41761 gcggtggtgg cggggctcac ggccaccgcc gcacccagcc aggccgcgca ccgcgcgggc + 41821 cccgaggtcc tcgcgaccaa cctgaacaac ccgcgggaca tcacgctcca ggcggacggt + 41881 tcgatcctcg tcgccgagtc cggcagcggt cccgccacgg cctgtgcgcc gggcacctcc + 41941 tgcctcggct tcaccggctc gatctaccgg gtcaacggca gccagaaggg ccgcgtcgtc + 42001 accgggctgc 
cctccaagct ggaggtccgc gcggacggcg gcgcctcggt cgccggaccc + 42061 aaccaggtcg aggcccgcac cggcggctac accgtctcca gcagcttcgg cggcgacgcc + 42121 gcggaccgca aggcgctggg cgcgggcggc gagaccctcg gcaccctgca catagccaag + 42181 ggcaaggtgc tcggcgacct cgtcgaccac gagacccggc tcgacccgga cggcccgctc + 42241 ggcaacaacg acgtgcactc caacgcgtgg atgttcgccc accacggcaa ggactacctg + 42301 gtcaccgacg cgggcggcaa cgacctgatc cgggtgctcc cggacggcac caccaagacc + 42361 gagttcgtct tcccgaacaa cggcgagaac gagacggtgc ccaccgggat cgtggccgcc + 42421 cccgacggct ccttctacat ctccgacctc agcggccagg ccgcgggcaa gtcccgcatc + 42481 tggcgctacg ttcccggcag cgccccgaag gtcttcgcca ccggtctgac gaacgtcacc + 42541 gacctcgccc tggacggcaa gggcgggctg atcgccctca ccctcaccaa gggctacacg + 42601 gagaccggcc cgctgcccgg cgccctgaac cgcgtcgacc tgaagagcgg caaggcgacc + 42661 gagatcccga ccgccgaccg gctggtcaac tccctcggcc tcgccgtcgg caagggcggc + 42721 gagatctatg tgaccaacaa gacggtgggc accaccggcg aactcctgaa gttccccgcc + 42781 gcgcgccggt gagcaccggc cgccggaact gacaccggcc ggggcgcact tcggccccgg + 42841 ccgatgtcag gatttccccc gccgggtgaa atcccggcag gcccgtctcc ggttccgcac + 42901 agagaacgga caggtcttcc gcgacagcgg ccctcggccg gaaatccggg cgaccatgcg + 42961 gtagggatgt cgcctgcgga tgtcgtgcac ggacatcgtg cacggatgtc gcgtacgtca + 43021 tcgagtacgg cccggagtgc gtatcgccta cggctccgcg ttcggcctcg gagtccggcc + 43081 ggggaatccg cagtcgcaca gcaaaaggga atccggtggg cccgagtacg ctgtggccgc + 43141 tccggtgatc cgcgggaatc cggccttccc ccgcggaagg aagaagtccc ctcgcgcgcc + 43201 ctttccgctc gtattttggg cgtgcgcggc acgtgacacc gcacgcacca tttcgcgtct + 43261 ccgcttttac gccaccgcag gaactcacgc cagagaggga ctcatgacga agatcatcct + 43321 tcccgaggac cgccccgcag gccgccgcgg gttcgagatc gtcctgccca gctccttgac + 43381 cgacggggcc gcctcgctcg tcgaggcgca tgtctccgag gcgatgtccg ggccgccgct + 43441 gcacacccac gcggagtcgg acgagaccta cttcgtcctc ggcggcgcgc tcatcatgat + 43501 catcgacggc aagctcaccg agctgcgcgc cggtggcctc gcccacatca gcaaggacac + 43561 ctcgcacacc tgggccaccc gtcccgacga gggcgcccac ttcctcaccc tgcacctgcc + 43621 gggcggctac 
gagctgtacc acccgaccgc gctccacgcc gagcacgaga agggcggccc + 43681 cctggagcag aaggacctct tcgagctggc ggcccgcttc gactggcgcc tggccggccc + 43741 gcccgagccg caccgcctga ccccgaccgg cgtcctggtc cccgcgggca aggcggacgc + 43801 cgaggcggag gccaccaagg cactcgccac ggcggagtac gaacgcgccc tcgccgcgtc + 43861 catcgaggcc gccgactccg gctcctgagg cgcgagtcgg cggacgggca cggcggaggc + 43921 ggggagcgtc atgggggcgg caccgtgagc gggccggggt ccggcgggcc gggcaccgcc + 43981 gccgtaccgg gcgccgcccc gcccggtgcc gccggggcgc ccgacccccg gcgatggttc + 44041 gccctggtgg tgatcctggt cgccgggttc atggacctgc tcgatgtgac catcgtgaac + 44101 gtggtcctgc cgagcgtcct cgcggacctg gacgccgcct acacgcacgg ggagtggatc + 44161 gtcgccgggt acgtgctcgg cttcgccgcg ctgatgatca ccggcgggcg gctcggcgac + 44221 atcctcggcc gccgcaaggt cttcctcgcc ggggtggccg gattcaccgc ggcctcactg + 44281 ctctgcgggc tcgccgacgg gcccggggcg ctgatcgcgg cccgcttcct gcaaggcgcc + 44341 atggccgggc tgatggtgcc gcagatcctc gcgatcatcc atgtcacctt ccccgccgag + 44401 gagcgcggca aggtcctcgg catctggggc ggcgtactcg gcgccgcctc ggccgcgggc + 44461 ctggtcgccg ggggactgct cgccgaggcg gatccgtacg gactcggctg gcgcgcggtc + 44521 ttcctggtca atgtgccggt cggcgccgcg gccctgctcg ccgcctggtt cctcgtcccg + 44581 gactcccgcg ctcccgagcg gccccggctc gatccgctcg gcgcgctgct gtccgccgcg + 44641 ggcatcctgc tcctggtcta tccgctcacc gaggggcgcg gcctcggctg gccgccgtgg + 44701 accttcctgc tgatgggcgc cgcggtcctg gtgctcgggc tcttcgtgct ccagcagcgc + 44761 gggcgcaccc gggccgacaa ctccccgctg atgtcgctgc gtctgttccg ggcgcgcgcc + 44821 ttctcggcgg ggatggcggt gtgggcgctc ttctggatcg ccctcggcgg cttcttcttc + 44881 atctggaccc tgtacatgca agtggggctc ggctggccgc cgttgcgggc gggactgacc + 44941 agttccgcct tcgcggtggg ctgcgccgcc gggtccggga ccgccgtcga gttcttcacc + 45001 ccgcgcttcg gccgcaaggc cctgctcgcg ggcgccctcc tctgcggcac cggcttcctc + 45061 ggctacgtcc tggtcgccgc ccactacgga cccgccgtcg ccccctggca gatggtcgcc + 45121 ccgctcctcg tcgccggtat cggcttcggg ctggtggtgg cgccgatgat cgacgcggtg + 45181 ctcaccgagg tcccggtgcg cgaggcgggc tcggcctccg gggtcctcgg caccgtgcag + 45241 cagatcggca 
tcgcgctcgg caccgccctc gccggggtgc tcttcttcca gcagctcgac + 45301 cacgacgcgg cgcgtgccgt ggcgcgggcc gcccccgcgc tgcgccagga actcacccgg + 45361 gccgaggtgc ccgccgccga gcgcgagcgg atcctcgacg ccttcgccga ctgcctcgcg + 45421 gaccgcgccg cggcgaccga cccgaccgcc gaacccgcct cctgccgggg cccgttgccc + 45481 tctcccgagg tccgcgcgct ggtgatcggg gccgggcagc gggccaccgc cgacaacttc + 45541 tcccgcacct tcgcgctgac cctcagatgg ggcgcgggca gcatgggcct ggtcttcctc + 45601 ggcctcttcg ccctgccgcg gcgggtggag ttccgggggc tcgacggggg cggtccgggt + 45661 ccggggtccg gaccttccgt gccgggcgcc tcggagggtg gcgctgccgt cggtccgggc + 45721 gccggtccgg cctccggtcc cgggaaggag cgctccgccc ccgcgcggtc cggtggccag + 45781 gacgccggca ctcaccccgc cgggtgatcc ggccgcattc cgtttcccgc gagcccgggg + 45841 cacgccccga tgccgcgcgc cccctcgtcc ccgtaccgcc gcccgtgccg cgcccggtgg + 45901 ggcaaaggcg cgcaccgtac cgtaccggca ccagtcgtgc acacccggca gccggggcat + 45961 tcgccgggag tgggggaagt ctgtccttcg ccggaccatg tccggactgt tctctgacgt + 46021 ttctctgaat ttctgtcagc ggatttgtcc tgaccgacag ttgcccggca acagggcgcg + 46081 aagaattcac ctccggctcg ctgccgcggt ctgttcgcgg gccccgcgag gcggcaggct + 46141 ggggccgcct cgaccgcgta cggcgaggcg ccccacgtcc cccctcacct ccggaggtcc + 46201 ccatgcgccg ccgtcacgtc ctgccgctcg ccgccgccgc gctggcgatg cccgccgctc + 46261 tcctgtcgac cggttccgct tcggccgcac ccgccgacaa gccgcaggtg ctcagctcct + 46321 tcacgcagac cagcgcctcc agctacaacg cctggaacgc cgcccgcaac aaccaggggc + 46381 agtgggccgc ctacggcttc gactggtcca cggactactg cagcacctcg cccgacaacc + 46441 ccttcggctt ccccttcgaa accgcctgtg cgcgccacga cttcggctac cgcaactaca + 46501 aggcgatggg caccttcagc gccaacaagg cccggatcga ctccgccctc tacgaggacc + 46561 tgaagcgggt ctgcagccgc tactccggcg cgaccaagac ctcctgcgac gggctggcct + 46621 ggacctacta ccacgccgtc gacatcttcg gcatcaaggg cttcaagcag ctcgacaagg + 46681 ccgcctga +// diff --git a/tests/unit/data/bigscape/minimal_dataset/JK1_GCF_00/JCM_4504.region33.gbk b/tests/unit/data/bigscape/minimal_dataset/JK1_GCF_00/JCM_4504.region33.gbk new file mode 100755 index 000000000..2d779dfa5 --- 
/dev/null +++ b/tests/unit/data/bigscape/minimal_dataset/JK1_GCF_00/JCM_4504.region33.gbk @@ -0,0 +1,1730 @@ +LOCUS NZ_BMUJ01000032 33697 bp DNA linear CON 19-APR-2022 +DEFINITION Streptomyces plicatus strain JCM 4504 sequence032, whole genome + shotgun sequence. +ACCESSION NZ_BMUJ01000032 +VERSION NZ_BMUJ01000032 +KEYWORDS . +SOURCE Streptomyces plicatus + ORGANISM Streptomyces plicatus + Bacteria; Actinobacteria; Streptomycetales; Streptomycetaceae; + Streptomyces; Streptomyces rochei group. +COMMENT REFSEQ INFORMATION: The reference sequence is identical to + BMUJ01000032.1. + The annotation was added by the NCBI Prokaryotic Genome Annotation + Pipeline (PGAP). Information about PGAP can be found here: + https://www.ncbi.nlm.nih.gov/genome/annotation_prok/ + ##antiSMASH-Data-START## + Version :: 6.1.1 + Run date :: 2023-02-07 14:24:16 + Original ID :: NZ_BMUJ01000032.1 + NOTE: This is a single cluster extracted from a larger record! + Orig. start :: 0 + Orig. end :: 33697 + ##antiSMASH-Data-END## +FEATURES Location/Qualifiers + gene <1..508 + /locus_tag="IE211_RS35055" + /old_locus_tag="GCM10010301_70910" + /pseudo="" + source 1..33697 + /culture_collection="JCM:4504" + /db_xref="taxon:1922" + /mol_type="genomic DNA" + /organism="Streptomyces plicatus" + /strain="JCM 4504" + /submitter_seqid="sequence032" + /type_material="type strain of Streptomyces plicatus" + protocluster 1..33697 + /aStool="rule-based-clusters" + /category="PKS" + /contig_edge="True" + /core_location="[5971:21826]" + /cutoff="20000" + /detection_rule="(t2ks and t2clf)" + /neighbourhood="35000" + /product="T2PKS" + /protocluster_number="1" + /tool="antismash" + proto_core 5972..21826 + /aStool="rule-based-clusters" + /tool="antismash" + /cutoff="20000" + /detection_rule="(t2ks and t2clf)" + /neighbourhood="35000" + /product="T2PKS" + /protocluster_number="1" + cand_cluster 1..33697 + /candidate_cluster_number="1" + /contig_edge="True" + /detection_rules="(t2ks and t2clf)" + /kind="single" + 
/product="T2PKS" + /protoclusters="1" + /tool="antismash" + region 1..33697 + /candidate_cluster_numbers="1" + /contig_edge="True" + /product="T2PKS" + /region_number="1" + /rules="(t2ks and t2clf)" + /tool="antismash" + CDS <1..508 + /codon_start=2 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019058637.1" + /locus_tag="IE211_RS35055" + /note="incomplete; too short partial abutting assembly gap; + missing N-terminus; Derived by automated computational + analysis using gene prediction method: Protein Homology." + /old_locus_tag="GCM10010301_70910" + /product="methylmalonyl-CoA carboxyltransferase" + /pseudo="" + /transl_table=11 + /translation="MCDAFNIPLVTFLDVPGFLPGVDQEHGGIIRHGAKLLYAYCNATV + PRISLILRKAYGGAYIVMDSQSIGADLTYAWPTNEIAVMGAEGAANVIFRRQIAEAEDP + DAVRARMVKEYRAELMHPYYAAERGLVDDVIDPAETREVLIESLAMLRTKDADVPSRKH + GNPPQ" + gene 520..1152 + /locus_tag="IE211_RS35060" + /old_locus_tag="GCM10010301_70920" + CDS 520..1152 + /GO_function="GO:0003677 - DNA binding [Evidence IEA]" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_006344625.1" + /locus_tag="IE211_RS35060" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010301_70920" + /product="TetR family transcriptional regulator" + /protein_id="WP_019330965.1" + /transl_table=11 + /translation="MARQERAVRTREALIRSAAEIFHDEGFHAAALTTISSRAGVSNGA + LHFHFASKAALADAVEEAAADVLRAVVGRWDGGPPGVLQCLVNATHELACALQNDVVLR + AGFELSREAGRQPRTDLRLCWQNWVTDMVGRAGRGGELRESVAPESAVAAVVAATSGFE + VLGMRNQAWLSRSTVAQFWLLLLPALAPAPHAGLWQAEGSWTGTATG" + gene 1554..2369 + /locus_tag="IE211_RS35065" + /old_locus_tag="GCM10010301_70930" + CDS 1554..2369 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330964.1" + /locus_tag="IE211_RS35065" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010301_70930" + /product="AfsR/SARP family transcriptional regulator" + /protein_id="WP_031022565.1" + /transl_table=11 + /translation="MDIEVLGALSVREHGVSVVPTAPKPRQVLALLALNADQVVPVAAL + VDELWGENPPRSARTTLQTYVLQLRELMAQALAHGPDERCTAKDILATVPGGYRLQTRG + GHVDYREFDQRAGLGYRAMDAEDYAGAARRLADALALWNGQALTDIQAGLRIDTEVKRL + EEARLCALDQRIEADLRLGRHRELLSELTVLVNQYRMHESLHGQFMLALHRSGRRGEAL + NVYQRLRSTLVHELGLEPSAALSRLQRSILMARPETPAAAGGSGRLVTR" + gene complement(2385..3299) + /locus_tag="IE211_RS35070" + /old_locus_tag="GCM10010301_70940" + CDS complement(2385..3299) + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330963.1" + /locus_tag="IE211_RS35070" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010301_70940" + /product="AfsR/SARP family transcriptional regulator" + /protein_id="WP_246559116.1" + /transl_table=11 + /translation="MQIHDERFGVRIVPAGAKQRALLGALLVRAGQAVPAECLVEELWG + GHPPVNAANALQAHVARLRRLLPAPGPGGPRHVWLRTSPLGYTLSLGPAATDAQRFHRL + VGQGRELAATAPGRAVEVLREALALWRGPALQGSGQGPICSAEAALLEESRLRALEVLY + DVCLRADRCAEITGELEELVAVHPLRERFHEQLMTALHRCGRRAEALSTYDRARRRLAR + DLGIGPGQVLSRRREAILRSCEPAADSADRAGAGTAGQGGDELGVLREELVRLRGHVEL + LRRQQRELSEQVARLTAHHPCGP" + gene 4117..4938 + /locus_tag="IE211_RS35075" + /old_locus_tag="GCM10010301_70960" + CDS 4117..4938 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_007268976.1" + /locus_tag="IE211_RS35075" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010301_70960" + /product="AfsR/SARP family transcriptional regulator" + /protein_id="WP_031022570.1" + /transl_table=11 + /translation="MEIKVLGALNAEFEGISVVPSAGKPRQILALLALYPGRVVPVPTL + MEEIWGTDLPQSSMTTLQTYILQLRRLLGTAMGPDVPGSAKDVLATRYGGYLLQIPAEA + VDAFTYERLVTEGRQAYEDGEDERAATVLRRALDLWDGPALVDVRVGPVLEIEAMRLEQ + SRLVARERRIDADLRLGRHVELIAELTDLIARHPQHEGLHSQAMVALYRSGRQAAALDV + YRRLRQRLIDELGVEPSPQLQRLHQAMLAVDPRLDIVAGPRRTSTFDLYAA" + gene 5196..5975 + /locus_tag="IE211_RS35080" + /old_locus_tag="GCM10010301_70970" + CDS 5196..5975 + /NRPS_PKS="Domain: Thioesterase (15-242). E-value: 4.5e-38. + Score: 123.7. Matches aSDomain: + nrpspksdomains_IE211_RS35080_Thioesterase.1" + /NRPS_PKS="type: other" + /codon_start=1 + /inference="COORDINATES: protein motif:HMM:NF013166.2" + /locus_tag="IE211_RS35080" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010301_70970" + /product="alpha/beta fold hydrolase" + /protein_id="WP_046249271.1" + /transl_table=11 + /translation="MASRSRDREAGTARITLTCLAHAGAGVASYRGWAAAVGPGIDVAA + LPLPGRDSRRREPRLTERAGLLADFLPTLLQTARRGPYALYGHSMGALVGYTLTRALAD + SGLPPLFLAVGACPPPHTTTVLADAADLPDEDLLPLLDEIGSLPPGASASPGGLWRRTF + LPVLRDDLRLARSLRNAALDPVTGGPLDVPVLVFAGRDDPLAAPAALRHWQQWTTNLIE + LHTVAGGHFFASSSSLAQHVGRACRGHVTALPTGGGR" + aSDomain 5241..5921 + /aSDomain="Thioesterase" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE211_RS35080_Thioesterase.1" + /evalue="4.50E-38" + /label="IE211_RS35080_Thioesterase.1" + /locus_tag="IE211_RS35080" + /protein_end="242" + /protein_start="15" + /score="123.7" + /tool="antismash" + /translation="TLTCLAHAGAGVASYRGWAAAVGPGIDVAALPLPGRDSRRREPRL + TERAGLLADFLPTLLQTARRGPYALYGHSMGALVGYTLTRALADSGLPPLFLAVGACPP + PHTTTVLADAADLPDEDLLPLLDEIGSLPPGASASPGGLWRRTFLPVLRDDLRLARSLR + NAALDPVTGGPLDVPVLVFAGRDDPLAAPAALRHWQQWTTNLIELHTVAGGHFFASSSS + LAQHV" + CDS_motif 5433..5501 + 
/aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_IE211_RS35080_0001" + /evalue="3.80E-07" + /label="NRPS-te1" + /locus_tag="IE211_RS35080" + /protein_end="102" + /protein_start="79" + /score="22.6" + /tool="antismash" + /translation="RGPYALYGHSMGALVGYTLTRAL" + gene 5972..7243 + /locus_tag="IE211_RS35085" + /old_locus_tag="GCM10010301_70980" + CDS 5972..7243 + /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (3-396). E-value: + 1.7e-49. Score: 160.7. Matches aSDomain: + nrpspksdomains_IE211_RS35085_PKS_KS.1" + /NRPS_PKS="type: PKS/NRPS-like protein" + /codon_start=1 + /gene_functions="biosynthetic (rule-based-clusters) T2PKS: + t2ks" + /gene_kind="biosynthetic" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_005321633.1" + /locus_tag="IE211_RS35085" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010301_70980" + /product="beta-ketoacyl-[acyl-carrier-protein] synthase + family protein" + /protein_id="WP_192342468.1" + /sec_met_domain="t2ks (E-value: 2.2e-202, bitscore: 663.6, + seeds: 25, tool: rule-based-clusters)" + /transl_table=11 + /translation="MNRVVITGIGVVAPGAVGTADFWDLLTVGRTATRRVTLFDACGYR + SRVAAEVDFTPAAHGFDLADTERLDRAAQFALVAAREAVADSGVADRIGRNPLRTGVSL + GSAIGCTTSLATQYAILSDCGTTWTLDHTEAAESLYDYFVPSSLAATVARDRGAQGPVA + LVSSGCTSGLDAVGHGADLIREGSADIVVAGGTEAPIVPIAMACFDRLRLTSSRNDDPA + TASRPFDRTRDGFVLGEGAAVLVLEELEHARRRGARPYAELSAVTAHSSAHHMTGLRPG + ALEMADAIRAALDQARLNPADVDYISAHGAGTRHNDRHETHALKESLGGSAHRVPVSSI + KSMIGHALGAAGALDLAASALAIRHDTVPPTANLHEPDPTCDLDYTPLFAREQRTSTVL + TVASGFGGFHTAAVLTRPRLKEAA" + aSDomain 5981..7159 + /aSDomain="PKS_KS" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE211_RS35085_PKS_KS.1" + /domain_subtype="Iterative-KS" + /evalue="1.70E-49" + /label="IE211_RS35085_PKS_KS.1" + /locus_tag="IE211_RS35085" + /protein_end="396" + /protein_start="3" + 
/score="160.7" + /tool="antismash" + /translation="VVITGIGVVAPGAVGTADFWDLLTVGRTATRRVTLFDACGYRSRV + AAEVDFTPAAHGFDLADTERLDRAAQFALVAAREAVADSGVADRIGRNPLRTGVSLGSA + IGCTTSLATQYAILSDCGTTWTLDHTEAAESLYDYFVPSSLAATVARDRGAQGPVALVS + SGCTSGLDAVGHGADLIREGSADIVVAGGTEAPIVPIAMACFDRLRLTSSRNDDPATAS + RPFDRTRDGFVLGEGAAVLVLEELEHARRRGARPYAELSAVTAHSSAHHMTGLRPGALE + MADAIRAALDQARLNPADVDYISAHGAGTRHNDRHETHALKESLGGSAHRVPVSSIKSM + IGHALGAAGALDLAASALAIRHDTVPPTANLHEPDPTCDLDYTPLFAREQRTS" + gene 7240..8505 + /locus_tag="IE211_RS35090" + /old_locus_tag="GCM10010301_70990" + CDS 7240..8505 + /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (85-417). E-value: + 2.9e-25. Score: 80.8. Matches aSDomain: + nrpspksdomains_IE211_RS35090_PKS_KS.1" + /NRPS_PKS="type: PKS/NRPS-like protein" + /codon_start=1 + /gene_functions="biosynthetic (rule-based-clusters) T2PKS: + t2clf" + /gene_kind="biosynthetic" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_007269014.1" + /locus_tag="IE211_RS35090" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010301_70990" + /product="ketosynthase chain-length factor" + /protein_id="WP_193450422.1" + /sec_met_domain="t2clf (E-value: 2.7e-172, bitscore: 564.0, + seeds: 26, tool: rule-based-clusters)" + /transl_table=11 + /translation="MTKATQAPEPARPAGAEGPRQTLVTGIGVAAPNGLGTRAWWDAVL + CGRTGLGPITRFDASGYPVRIAGEIPGFVDEDHIPSRLLPSTDRGTRIALVAAEEALRD + ANVSPADLPAYGAGVITASSAGGAEFGERGLAALWSKGAQHVSAYQSFASFHAAAPAQI + SIRHRLRGHGSTVVSEQAGGIDALARARRRIRDGACLMVTGGIDSTLCAWGWAAHLADG + RLSPATEPARAYRPFAATADGHAVGEGGALLVLEDARAAARRGATGYGVIAGCAATFDG + PDRPTLRQAAELALADAGLAPEHVDVVFADGAAERRADLVESQALCALFGPYGVPVTVP + KTMTGRLGAGGSALDVAAALLALREKVVPPTTGTGRVADDCPLDLVTGAPRELPRLRVA + LVLARGRGGFNSAAVLQAPQTE" + aSDomain 7495..8490 + /aSDomain="PKS_KS" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE211_RS35090_PKS_KS.1" + /domain_subtype="Iterative-KS" + /evalue="2.90E-25" + /label="IE211_RS35090_PKS_KS.1" + /locus_tag="IE211_RS35090" + /protein_end="417" + /protein_start="85" + /score="80.8" + /tool="antismash" + /translation="STDRGTRIALVAAEEALRDANVSPADLPAYGAGVITASSAGGAEF + GERGLAALWSKGAQHVSAYQSFASFHAAAPAQISIRHRLRGHGSTVVSEQAGGIDALAR + ARRRIRDGACLMVTGGIDSTLCAWGWAAHLADGRLSPATEPARAYRPFAATADGHAVGE + GGALLVLEDARAAARRGATGYGVIAGCAATFDGPDRPTLRQAAELALADAGLAPEHVDV + VFADGAAERRADLVESQALCALFGPYGVPVTVPKTMTGRLGAGGSALDVAAALLALREK + VVPPTTGTGRVADDCPLDLVTGAPRELPRLRVALVLARGRGGFNSAAVLQA" + gene complement(8863..9099) + /locus_tag="IE211_RS35095" + /old_locus_tag="GCM10010301_71000" + CDS complement(8863..9099) + /codon_start=1 + /inference="COORDINATES: protein motif:HMM:NF039972.1" + /locus_tag="IE211_RS35095" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010301_71000" + /product="hypothetical protein" + /protein_id="WP_193450423.1" + /transl_table=11 + /translation="MRRFRPRRCIRGLWEGLVAYGRLCLAGETDRYDPPPHPRIRWHRP + PPGHPERVRDDMPLTDLERRLARELTDEDHDVR" + gene 9413..10297 + /locus_tag="IE211_RS35100" + /old_locus_tag="GCM10010301_71010" + CDS 9413..10297 + /NRPS_PKS="Domain: Polyketide_cyc (3-131). E-value: + 2.6e-13. Score: 42.2. Matches aSDomain: + nrpspksdomains_IE211_RS35100_Polyketide_cyc.1" + /NRPS_PKS="Domain: Polyketide_cyc2 (146-253). E-value: + 1e-07. Score: 24.3. Matches aSDomain: + nrpspksdomains_IE211_RS35100_Polyketide_cyc2.1" + /NRPS_PKS="type: other" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330954.1" + /locus_tag="IE211_RS35100" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010301_71010" + /product="SRPBCC family protein" + /protein_id="WP_193450424.1" + /transl_table=11 + /translation="MTAPAPSGVLYGLIADATVWPLFFPPSVHVEQLDFDGTRERLRMW + AVAGDRISSWVSHRRLDVGQRQVEFRQERPSAPVETMTGLWTVEPLGDGSRVTLEHAFT + VIGDAPADAAWTERVTRANSRAQLQRLAWLAERWTRLDDLVMSFEDTVRVNVPAELVFD + FLYRAGDWPDDLAGTRPLTVQEDTPGIQVLALDGRSATGGEAVRISFPAAGRLVHKHTR + TSGPLAAYTGEWTIEPQPGAGLDVTVRHDVLLNDDAALDQDAARRACDEVGRAGRRLLE + HAVRHASDAVRVL" + aSDomain 9422..9805 + /aSDomain="Polyketide_cyc" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE211_RS35100_Polyketide_cyc.1" + /domain_subtype="Polyketide_cyc" + /evalue="2.60E-13" + /label="IE211_RS35100_Polyketide_cyc.1" + /locus_tag="IE211_RS35100" + /protein_end="131" + /protein_start="3" + /score="42.2" + /tool="antismash" + /translation="PAPSGVLYGLIADATVWPLFFPPSVHVEQLDFDGTRERLRMWAVA + GDRISSWVSHRRLDVGQRQVEFRQERPSAPVETMTGLWTVEPLGDGSRVTLEHAFTVIG + DAPADAAWTERVTRANSRAQLQRL" + aSModule 9422..10171 + /domains="nrpspksdomains_IE211_RS35100_Polyketide_cyc.1" + 
/domains="nrpspksdomains_IE211_RS35100_Polyketide_cyc2.1" + /incomplete + /locus_tags="IE211_RS35100" + /tool="antismash" + /type="unknown" + aSDomain 9851..10171 + /aSDomain="Polyketide_cyc" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE211_RS35100_Polyketide_cyc2.1" + /domain_subtype="Polyketide_cyc2" + /evalue="1.00E-07" + /label="IE211_RS35100_Polyketide_cyc2.1" + /locus_tag="IE211_RS35100" + /protein_end="253" + /protein_start="146" + /score="24.3" + /tool="antismash" + /translation="SFEDTVRVNVPAELVFDFLYRAGDWPDDLAGTRPLTVQEDTPGIQ + VLALDGRSATGGEAVRISFPAAGRLVHKHTRTSGPLAAYTGEWTIEPQPGAGLDVTVRH + DVL" + gene 10294..12162 + /locus_tag="IE211_RS35105" + /old_locus_tag="GCM10010301_71020" + CDS 10294..12162 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330953.1" + /locus_tag="IE211_RS35105" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010301_71020" + /product="acyl-CoA dehydrogenase" + /protein_id="WP_193450425.1" + /transl_table=11 + /translation="MTAALDTAAGPTGQTPAPRSTTPTPEHTTPTPEPEHTTRAPAPES + QHTTPERECAARVPEPERAARLEAALGDPFDPANPHGHLALVRADDTREAPHATEALLT + EHGLSAEFVPHDLGGRLRDLEELARVLRPLFRRDLALGYGFGITSLFAASSVWTAGDPH + QRAALADVLLGGGRVAIVHREVAHANAILRREVRAQRPAGGGFLLNGSKDAVMNADRTD + TFVVYARTSAGSGSASHSVLLLPGPPASGEVRRLARVEMPGMRGARFHGLRLADVRLPD + SALVGSLGEGVTLALRSFQISHCLIPGTVLAGVDSVLRLAVRAATENRPDGRPARRWHK + ALSGVFADLLACDAMAVTGLRALSLVPQHAHLLAAAVKYTMPDLLREDLEELAAVLGAR + GYDRGPLYGGFQKLARDLPVAGLGHSGTAVCQAVLVPQLPALARTAWFRTAEPSAALFL + PGAPLPPLDHRRLTHSGTDDPLTATLIGAAERLAARTGTQPLHAALAALARALVEELRV + LRARCAALPAAGSTVFDPLACALADRYALLLCAAACLGVWEGQADGDGFLADPAWAVLV + LSRIGRRLGIAVPETPADAEQAVLAEALGRCRHGRSLDLYDTPLAG" + gene 12253..13062 + /locus_tag="IE211_RS35110" + /old_locus_tag="GCM10010301_71030" + CDS 12253..13062 + /GO_function="GO:0008897 - holo-[acyl-carrier-protein] + synthase activity [Evidence IEA]" + /NRPS_PKS="Domain: ACPS (134-195). E-value: 7e-12. Score: + 37.1. Matches aSDomain: + nrpspksdomains_IE211_RS35110_ACPS.1" + /NRPS_PKS="type: other" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_007389988.1" + /locus_tag="IE211_RS35110" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010301_71030" + /product="4'-phosphopantetheinyl transferase superfamily + protein" + /protein_id="WP_029394636.1" + /transl_table=11 + /translation="MERVTCAAPLHVPRPHGPWPAVREDLFRHGNALVCTTWSEWLPSV + LTTPRLRELLGDDWQRYRRTRDAAVRYRFAASRMLIKYTAAAALAVPPEYLDLAYRLGG + RPYLRGFDQIELSLSHTGDVMAVGLSRIGRIGVDVEPAERPVRLDLLETQVFTPAEARE + LAELPEGERTAHALRLWTLKEAYSKALGQGLRFGFKEFGFRQGRLSAPDGSRVTRDEWG + FATYPVMDRFLLSVACHNAGLSTAGDTSVGTMLDQGFLSAMTDTGQQ" + aSDomain 12655..12837 + /aSDomain="ACPS" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE211_RS35110_ACPS.1" + /evalue="7.00E-12" + /label="IE211_RS35110_ACPS.1" + /locus_tag="IE211_RS35110" + /protein_end="195" + /protein_start="134" + /score="37.1" + /tool="antismash" + /translation="IGVDVEPAERPVRLDLLETQVFTPAEARELAELPEGERTAHALRL + WTLKEAYSKALGQGLR" + gene 13267..14757 + /locus_tag="IE211_RS35115" + /old_locus_tag="GCM10010301_71040" + CDS 13267..14757 + /NRPS_PKS="Domain: Condensation_DCL (38-314). E-value: + 1.6e-48. Score: 157.2. Matches aSDomain: + nrpspksdomains_IE211_RS35115_Condensation_DCL.1" + /NRPS_PKS="type: NRPS-like protein" + /codon_start=1 + /gene_functions="biosynthetic-additional + (rule-based-clusters) Condensation" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: protein motif:HMM:NF012873.2" + /locus_tag="IE211_RS35115" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010301_71040" + /product="condensation domain-containing protein" + /protein_id="WP_051890455.1" + /sec_met_domain="Condensation (E-value: 3.4e-30, bitscore: + 96.2, seeds: 42, tool: rule-based-clusters)" + /transl_table=11 + /translation="MAWHSRPRALRGPGTARPPGVPALWPHLDLLGDFGGRRGAGRHVE + QLVWRWHGPLDTERFTAAWQSVVDRESVLRAALAPGPRPHLVLHEHAHGDVVRHRAGGA + GWDRLLERDRRRGLDPSRPCPLRVTLVERTDDPAGAGPVTRVVLTFHHALLDAWSVCLL + MQELCRAYLAGGELPGGERRPDLRDWAGWLQRQDPAGARDFWRGTVPDGPVAVLPARPG + PRTRQRGRGRTEVRLSPAEAERLHRWAALRAVPDSSALETVWALLLYRAAGPGGAATVG + FGVTVSGRGITLDCAERLPGPLRNCLPMVVRVDPGETVGRLLTALRDRALDMAAYEWVS + TRRIHRWTGRCPDGELLQSVVSVDRLPRPPGNLRNELADAGIALEPEPAHGACPDLPVA + LLVRPGGDGRLTFCVDHDRNRISDADARLLAGHCARLLRHLPGTDEATTNGAVLDVLAG + EALPRIAPRPSRPRPAGSWLRPRSTSSGAAVDRAASHP" + aSDomain 13381..14208 + /aSDomain="Condensation" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE211_RS35115_Condensation_DCL.1 + " + /domain_subtype="Condensation_DCL" + /evalue="1.60E-48" + /label="IE211_RS35115_Condensation_DCL.1" + /locus_tag="IE211_RS35115" + /protein_end="314" + /protein_start="38" + /score="157.2" + /tool="antismash" + /translation="GAGRHVEQLVWRWHGPLDTERFTAAWQSVVDRESVLRAALAPGPR + PHLVLHEHAHGDVVRHRAGGAGWDRLLERDRRRGLDPSRPCPLRVTLVERTDDPAGAGP + VTRVVLTFHHALLDAWSVCLLMQELCRAYLAGGELPGGERRPDLRDWAGWLQRQDPAGA + RDFWRGTVPDGPVAVLPARPGPRTRQRGRGRTEVRLSPAEAERLHRWAALRAVPDSSAL + ETVWALLLYRAAGPGGAATVGFGVTVSGRGITLDCAERLPGPLRNCLPMVVRVD" + CDS_motif 13396..13497 + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_IE211_RS35115_0001" + /evalue="4.80E-10" + /label="C2_DCL_024-062" + /locus_tag="IE211_RS35115" + /protein_end="77" + /protein_start="43" + /score="31.7" + /tool="antismash" + /translation="VEQLVWRWHGPLDTERFTAAWQSVVDRESVLRAA" + CDS_motif 13714..13779 + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + 
/domain_id="nrpspksmotif_IE211_RS35115_0002" + /evalue="4.90E-08" + /label="C3_DCL_135-156" + /locus_tag="IE211_RS35115" + /protein_end="171" + /protein_start="149" + /score="25.5" + /tool="antismash" + /translation="FHHALLDAWSVCLLMQELCRAY" + CDS_motif 14107..14193 + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_IE211_RS35115_0003" + /evalue="6.10E-06" + /label="C5_DCL_263-294" + /locus_tag="IE211_RS35115" + /protein_end="309" + /protein_start="280" + /score="18.7" + /tool="antismash" + /translation="GFGVTVSGRGITLDCAERLPGPLRNCLPM" + CDS_motif 14185..14244 + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_IE211_RS35115_0004" + /evalue="3.90E+01" + /label="C2_LCL_024-062" + /locus_tag="IE211_RS35115" + /protein_end="326" + /protein_start="306" + /score="-3.2" + /tool="antismash" + /translation="LPMVVRVDPGETVGRLLTAL" + gene 14792..14938 + /locus_tag="IE211_RS35120" + /old_locus_tag="GCM10010301_71050" + CDS 14792..14938 + /codon_start=1 + /inference="COORDINATES: ab initio prediction:GeneMarkS-2+" + /locus_tag="IE211_RS35120" + /note="Derived by automated computational analysis using + gene prediction method: GeneMarkS-2+." + /old_locus_tag="GCM10010301_71050" + /product="hypothetical protein" + /protein_id="WP_019330950.1" + /transl_table=11 + /translation="MHEGDDERHEGDTARCARAVHGGPPPLRLAGAEEREDEDGRVIVR + SID" + gene 15232..15648 + /locus_tag="IE211_RS35125" + /old_locus_tag="GCM10010301_71060" + CDS 15232..15648 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330949.1" + /locus_tag="IE211_RS35125" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010301_71060" + /product="pyridoxamine 5'-phosphate oxidase family protein" + /protein_id="WP_193450426.1" + /transl_table=11 + /translation="MPSMPRPDAVTVPDSVQAFLTGTALVAAFTTMRPDGTPHVAPVRF + TWDSDAQLARVMTVRSSRKARNLLATPGAPVALCQVDGFRWVTLEGTGTVVTDPERVAL + GARLYAKRYWSAPPTPSDRVVIEIAVDRVLSLNA" + gene complement(15887..16369) + /locus_tag="IE211_RS35130" + /old_locus_tag="GCM10010301_71070" + CDS complement(15887..16369) + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_007389987.1" + /locus_tag="IE211_RS35130" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010301_71070" + /product="nuclear transport factor 2 family protein" + /protein_id="WP_052731589.1" + /transl_table=11 + /translation="MTSSLTTDQSASVSAAESSAQVAGLLHRYLVSLDDERLDDAWTAG + LFTEDAVVAFPVSRHEGADGMAEYHRSALSAFAATQHLGSPAVVDVDGDRAVFRANLIS + THVHHPHHTPPEGDLPPLFATGTFVNGEARRTARGWRLSLLAFRLLWADGSPPPAR" + gene 16536..18008 + /locus_tag="IE211_RS35135" + /old_locus_tag="GCM10010301_71080" + CDS 16536..18008 + /GO_function="GO:0071949 - FAD binding [Evidence IEA]" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_007385270.1" + /locus_tag="IE211_RS35135" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010301_71080" + /product="FAD-dependent monooxygenase" + /protein_id="WP_029394635.1" + /transl_table=11 + /translation="MEFYDSDVIVVGAGPTGLMLAGELRLAGVSVVVLDKLSEPIQESR + ALGFSARTIEEFAQRGLMDRFGEVGVIPVGHFGGVPLDYRVIEGGSYGARGIPQARTEG + VLGGWARELGADIRRGCEVTGIEQTDASVTVTAAGADGPFSLRARHVVGCDGARSIVRK + LAGIGFPGTEPAIELRFADLAGVALRPRFSGERVAGGMVMVIPMGPDRCRVIYFDSSEP + LRTSPDPITFDEVAQTWQRLTGEDVSGATPLWVSSTTDVSRQADRYRHGRVFLAGDAAH + IHLPIGAQGMSAGVQDAVNLGWKLALDIKGQAPEGLLDTYHAERHPVGARILTNTLAQR + ILYLGGDEITPMREVLAELMGAHESVQRHLAGMVTGLDIRHDVGEGDHPLLGRRLPDRE + LVVDGEKTPFYALLRTARPVLLELGGDHGLRTAAAGWADRVDLVAAEFDGCEAPVDGIL + VRPDGYVAWVAGLGAGPDGLTAALGRWFGPTA" + gene 18065..18763 + /locus_tag="IE211_RS35140" + /old_locus_tag="GCM10010301_71090" + CDS 18065..18763 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018383121.1" + /locus_tag="IE211_RS35140" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010301_71090" + /product="antibiotic biosynthesis monooxygenase" + /protein_id="WP_019330946.1" + /transl_table=11 + /translation="MPIISAEDKHLTVLNLFTTDTPEKQAKLIEEMTKIVNAAAYEGWM + SSTVHSGVDGYGTLNFIQWRSGEDLEKRYAGEEFKHRTLPVFGEITTSIRLMQNEVAHT + LTSDALGGKIEIGPDRDDYTVFTLFPVTPEGQDEAVDALGPGQAFLADVPGFRAHVVLK + GLRARGLEGSFVISYSQWDSKEAFEVYRDQAPEEQADARKAAVARVRAVVTGEPYLNTY + RVVHTRSAGE" + gene 19021..19350 + /locus_tag="IE211_RS35145" + /old_locus_tag="GCM10010301_71100" + CDS 19021..19350 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019767153.1" + /locus_tag="IE211_RS35145" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010301_71100" + /product="TcmI family type II polyketide cyclase" + /protein_id="WP_019330945.1" + /transl_table=11 + /translation="MHSTLIVARMAATSSNDVAQLFADFDATEMPHRMGTRRRQLFSYR + GLYFHLQDFDEDNGGELIEAAKADPRFVRISEDLKPFIEAYDPTTWRSPADAMATRFYS + WEASR" + gene 19347..20618 + /locus_tag="IE211_RS35150" + /old_locus_tag="GCM10010301_71110" + CDS 19347..20618 + /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (5-395). E-value: + 3.7e-53. Score: 172.7. Matches aSDomain: + nrpspksdomains_IE211_RS35150_PKS_KS.1" + /NRPS_PKS="type: PKS/NRPS-like protein" + /codon_start=1 + /gene_functions="biosynthetic (rule-based-clusters) T2PKS: + t2ks" + /gene_kind="biosynthetic" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_007385254.1" + /locus_tag="IE211_RS35150" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010301_71110" + /product="beta-ketoacyl-[acyl-carrier-protein] synthase + family protein" + /protein_id="WP_029394634.1" + /sec_met_domain="t2ks (E-value: 2.3e-248, bitscore: 815.1, + seeds: 25, tool: rule-based-clusters)" + /transl_table=11 + /translation="MSGRRVVITGIEVIAPGGVGRENFWNLLSNGRTATRGITFFDPAP + FRSRVAAEADFDPYEHGLTPQEVRRLDRAAQFAVVASRGAVADSGLDIPSLDPHRVGVT + VGSAVGATMGLDQEYRVVSDGGRLDTVDHTYAVPHLYDYMVPSSFAAEVAWAVGAEGPS + TVVSTGCTSGIDSVGYAVELVREGSADVVIAGSSDAPISPITMACFDAIKATTPRHDEP + ECASRPFDKTRNGFVLGEGTAFFVLEELDSARKRGAHIYAEIAGYATRSNAYHMTGLRP + DGVEMAEAIDLALGEARLNPQSIDYINAHGSGTKQNDRHETAAFKRSLGDHAYRTPVSS + IKSMVGHSLGAIGSIEIAASALAMEYDVVPPTANLHTPDPECDLDYVPLVARDQLIDAV + LTVGSGFGGFQSAMVLATPERSLV" + aSDomain 19362..20531 + /aSDomain="PKS_KS" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE211_RS35150_PKS_KS.1" + /domain_subtype="Iterative-KS" + /evalue="3.70E-53" + /label="IE211_RS35150_PKS_KS.1" + /locus_tag="IE211_RS35150" + /protein_end="395" + /protein_start="5" + /score="172.7" + /tool="antismash" + 
/translation="VVITGIEVIAPGGVGRENFWNLLSNGRTATRGITFFDPAPFRSRV + AAEADFDPYEHGLTPQEVRRLDRAAQFAVVASRGAVADSGLDIPSLDPHRVGVTVGSAV + GATMGLDQEYRVVSDGGRLDTVDHTYAVPHLYDYMVPSSFAAEVAWAVGAEGPSTVVST + GCTSGIDSVGYAVELVREGSADVVIAGSSDAPISPITMACFDAIKATTPRHDEPECASR + PFDKTRNGFVLGEGTAFFVLEELDSARKRGAHIYAEIAGYATRSNAYHMTGLRPDGVEM + AEAIDLALGEARLNPQSIDYINAHGSGTKQNDRHETAAFKRSLGDHAYRTPVSSIKSMV + GHSLGAIGSIEIAASALAMEYDVVPPTANLHTPDPECDLDYVPLVARDQL" + gene 20615..21826 + /locus_tag="IE211_RS35155" + /old_locus_tag="GCM10010301_71120" + CDS 20615..21826 + /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (48-401). E-value: + 9.4e-31. Score: 98.9. Matches aSDomain: + nrpspksdomains_IE211_RS35155_PKS_KS.1" + /NRPS_PKS="type: PKS/NRPS-like protein" + /codon_start=1 + /gene_functions="biosynthetic (rule-based-clusters) T2PKS: + t2clf" + /gene_kind="biosynthetic" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330943.1" + /locus_tag="IE211_RS35155" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010301_71120" + /product="ketosynthase chain-length factor" + /protein_id="WP_030970827.1" + /sec_met_domain="t2clf (E-value: 2e-209, bitscore: 686.3, + seeds: 26, tool: rule-based-clusters)" + /transl_table=11 + /translation="MTASVVVTGLGVVSPNGMGVKDYWAATLGGKHGIGRITRFDPTGY + PARLAGQIEDFDAEELLPSRLLPQTDRVTRLALVAADWALADAGADPAHLPEFDMGVIT + ASAAGGFEFGQGELQALWSQGSQYVSAYQSFAWFYAVNSGQISIRNGMKGPSGVVVSEG + AGGLDAVAQARRQIRRGTPLIVTGGVDASICPWGWVAQLACGRLTTSDEPDHAYLPFDR + DANGYVPGEGGAILIAEDADAARARGVRPYGEIAGYGATIDPRPGSGREPNLAKAIETA + LADADVNAADIDVVFADGAGDPAGDLAEARAVSTVFGDRGVPVTVPKTMTGRLYSGGAP + LDLAAAFLALRDGVIPPTVHIDPCADYPLDLVLGEPRPAELRTALVLARGAGGFNSAMV + VRAA" + aSDomain 20759..21817 + /aSDomain="PKS_KS" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE211_RS35155_PKS_KS.1" + /domain_subtype="Iterative-KS" + /evalue="9.40E-31" + /label="IE211_RS35155_PKS_KS.1" + /locus_tag="IE211_RS35155" + /protein_end="401" + /protein_start="48" + /score="98.9" + /tool="antismash" + /translation="LAGQIEDFDAEELLPSRLLPQTDRVTRLALVAADWALADAGADPA + HLPEFDMGVITASAAGGFEFGQGELQALWSQGSQYVSAYQSFAWFYAVNSGQISIRNGM + KGPSGVVVSEGAGGLDAVAQARRQIRRGTPLIVTGGVDASICPWGWVAQLACGRLTTSD + EPDHAYLPFDRDANGYVPGEGGAILIAEDADAARARGVRPYGEIAGYGATIDPRPGSGR + EPNLAKAIETALADADVNAADIDVVFADGAGDPAGDLAEARAVSTVFGDRGVPVTVPKT + MTGRLYSGGAPLDLAAAFLALRDGVIPPTVHIDPCADYPLDLVLGEPRPAELRTALVLA + RGAGGFNSAMVVR" + CDS_motif 21080..21103 + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_IE211_RS35155_0001" + /evalue="9.90E+01" + /label="PKSI-KS_m4" + /locus_tag="IE211_RS35155" + /protein_end="163" + /protein_start="155" + /score="-2.9" + /tool="antismash" + /translation="SGVVVSEG" + CDS_motif 21272..21310 + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_IE211_RS35155_0002" + /evalue="1.20E-04" + /label="PKSI-KS_m4" + /locus_tag="IE211_RS35155" + 
/protein_end="232" + /protein_start="219" + /score="15.0" + /tool="antismash" + /translation="FDRDANGYVPGEG" + gene 21895..22164 + /locus_tag="IE211_RS35160" + /old_locus_tag="GCM10010301_71130" + CDS 21895..22164 + /NRPS_PKS="Domain: ACP (12-83). E-value: 9.1e-13. Score: + 40.2. Matches aSDomain: nrpspksdomains_IE211_RS35160_ACP.1" + /NRPS_PKS="type: other" + /codon_start=1 + /gene_functions="biosynthetic-additional + (rule-based-clusters) PP-binding" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_015037163.1" + /locus_tag="IE211_RS35160" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010301_71130" + /product="acyl carrier protein" + /protein_id="WP_019330942.1" + /sec_met_domain="PP-binding (E-value: 1.7e-08, bitscore: + 26.1, seeds: 164, tool: rule-based-clusters)" + /transl_table=11 + /translation="MASKSFTLDDLKRTLREAAGVAEGVDLDGDILDTEFEVIGYESLA + LLEAGSLIEREYGISLDEEAVGEANTPRSFIEVVNAQLAPAKAA" + aSDomain 21931..22143 + /aSDomain="ACP" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE211_RS35160_ACP.1" + /evalue="9.10E-13" + /label="IE211_RS35160_ACP.1" + /locus_tag="IE211_RS35160" + /protein_end="83" + /protein_start="12" + /score="40.2" + /tool="antismash" + /translation="RTLREAAGVAEGVDLDGDILDTEFEVIGYESLALLEAGSLIEREY + GISLDEEAVGEANTPRSFIEVVNAQL" + gene 22177..22965 + /gene="fabG" + /locus_tag="IE211_RS35165" + /old_locus_tag="GCM10010301_71140" + CDS 22177..22965 + /EC_number="1.1.1.100" + /GO_function="GO:0016491 - oxidoreductase activity + [Evidence IEA]" + /NRPS_PKS="Domain: PKS_KR (8-164). E-value: 7.1e-11. Score: + 34.2. 
Matches aSDomain: + nrpspksdomains_IE211_RS35165_PKS_KR.1" + /NRPS_PKS="type: other" + /codon_start=1 + /gene="fabG" + /gene_functions="biosynthetic-additional + (rule-based-clusters) adh_short" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330941.1" + /locus_tag="IE211_RS35165" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010301_71140" + /product="3-oxoacyl-ACP reductase FabG" + /protein_id="WP_030970829.1" + /sec_met_domain="adh_short (E-value: 6.5e-36, bitscore: + 115.1, seeds: 230, tool: rule-based-clusters)" + /transl_table=11 + /translation="MTDTTTQRVAVVTGATSGIGLASARLLGRQGHQVFIGARNAENVA + ATVKELQGEGIDADGTVVDVRDTESVNAWIQAAVDRFGSVDVVVNNAGRSGGGPTADIA + DELWDDVIDTNLNSVFRVTRAALTIGGLRAKDRGRIINVASTAGKQGVVLGAPYSASKH + GVVGFTKALGNELAPTGITVNAVCPGYVETPMAQRVRQGYAAAYDTSEDAILEKFQAKI + PLGRYSTPEEVAGLVGYLASDTAASITSQALNVCGGLGNF" + aSDomain 22201..22668 + /aSDomain="PKS_KR" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE211_RS35165_PKS_KR.1" + /evalue="7.10E-11" + /label="IE211_RS35165_PKS_KR.1" + /locus_tag="IE211_RS35165" + /protein_end="164" + /protein_start="8" + /score="34.2" + /tool="antismash" + /translation="VAVVTGATSGIGLASARLLGRQGHQVFIGARNAENVAATVKELQG + EGIDADGTVVDVRDTESVNAWIQAAVDRFGSVDVVVNNAGRSGGGPTADIADELWDDVI + DTNLNSVFRVTRAALTIGGLRAKDRGRIINVASTAGKQGVVLGAPYSASKHG" + CDS_motif 22207..22269 + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_IE211_RS35165_0001" + /evalue="6.00E-05" + /label="PKSI-KR_m1" + /locus_tag="IE211_RS35165" + /protein_end="31" + /protein_start="10" + /score="15.7" + /tool="antismash" + /translation="VVTGATSGIGLASARLLGRQG" + gene 23006..23947 + /locus_tag="IE211_RS35170" + /old_locus_tag="GCM10010301_71150" + CDS 23006..23947 + /NRPS_PKS="Domain: Polyketide_cyc2 (4-146). 
E-value: + 2.8e-16. Score: 52.0. Matches aSDomain: + nrpspksdomains_IE211_RS35170_Polyketide_cyc2.1" + /NRPS_PKS="Domain: Polyketide_cyc2 (156-309). E-value: + 1.8e-08. Score: 26.7. Matches aSDomain: + nrpspksdomains_IE211_RS35170_Polyketide_cyc2.2" + /NRPS_PKS="type: other" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330940.1" + /locus_tag="IE211_RS35170" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010301_71150" + /product="aromatase/cyclase" + /protein_id="WP_193450427.1" + /transl_table=11 + /translation="MTTREVEHEITIGAPADAVYQLLADVTNWPRIFPPTIHVDRTEAD + GDHERIHIWATANGQAKEWTSHRTLDRENLTITFRQEIPAAPVKHMGGTWIIEPLADDR + SRVRLLHDYSAIGDDPHDLLWIEQAVDKNSTSELAALKVNVEAAHAAAEELTFSFADTV + QIDGAAKDVFDFINEAQLWAERLPHVAVVRLSEDTPGLQELEMDTRAKDGSVHTTKSYR + VVFPHHKIAYKQVTLPALMTLHTGEWTFTEGDEATTASSQHTVTLNTANIARILGQEAT + VADARAYVHTALSTNSRATLAHAKAYAEQKKG" + aSDomain 23018..23443 + /aSDomain="Polyketide_cyc" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE211_RS35170_Polyketide_cyc2.1" + /domain_subtype="Polyketide_cyc2" + /evalue="2.80E-16" + /label="IE211_RS35170_Polyketide_cyc2.1" + /locus_tag="IE211_RS35170" + /protein_end="146" + /protein_start="4" + /score="52.0" + /tool="antismash" + /translation="EVEHEITIGAPADAVYQLLADVTNWPRIFPPTIHVDRTEADGDHE + RIHIWATANGQAKEWTSHRTLDRENLTITFRQEIPAAPVKHMGGTWIIEPLADDRSRVR + LLHDYSAIGDDPHDLLWIEQAVDKNSTSELAALKVNVE" + aSModule 23018..23932 + /domains="nrpspksdomains_IE211_RS35170_Polyketide_cyc2.1" + /domains="nrpspksdomains_IE211_RS35170_Polyketide_cyc2.2" + /incomplete + /locus_tags="IE211_RS35170" + /tool="antismash" + /type="unknown" + aSDomain 23474..23932 + /aSDomain="Polyketide_cyc" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE211_RS35170_Polyketide_cyc2.2" + /domain_subtype="Polyketide_cyc2" 
+ /evalue="1.80E-08" + /label="IE211_RS35170_Polyketide_cyc2.2" + /locus_tag="IE211_RS35170" + /protein_end="309" + /protein_start="156" + /score="26.7" + /tool="antismash" + /translation="FSFADTVQIDGAAKDVFDFINEAQLWAERLPHVAVVRLSEDTPGL + QELEMDTRAKDGSVHTTKSYRVVFPHHKIAYKQVTLPALMTLHTGEWTFTEGDEATTAS + SQHTVTLNTANIARILGQEATVADARAYVHTALSTNSRATLAHAKAYAE" + gene 24008..25426 + /locus_tag="IE211_RS35175" + /old_locus_tag="GCM10010301_71160" + CDS 24008..25426 + /GO_function="GO:0071949 - FAD binding [Evidence IEA]" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018511397.1" + /locus_tag="IE211_RS35175" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010301_71160" + /product="FAD-dependent monooxygenase" + /protein_id="WP_051890464.1" + /transl_table=11 + /translation="MMLAGELAHGGVGVVVVEKRRAPSTESRASTLHARTMEILDSRSL + LPEFGDPPNEPRGHFGGIPLDLTLPSSHPGQWKVPQTRTEVILGEWALSLGAELQCKHE + LTALDDSGDLVEAEAAGPDGRTLRLRCRYLVACDGEESTVRRLIGADFPGRDATRELLR + ADVAGIDIPGRRFERLEHGLAIAARRPDGVTRVMVHEFGSAARARPHGDASFEEITAVW + KRVTGEDISGGTPLWANAFGDASRQLTRYRHGRVLFAGDAAHRQMPVGGQALNLGMQDA + FNLGWKLALVVRGKAPQTLLDSYHDERHEVGRQVLANIRAQSLLLLGGPEVEPLRDLLT + ELIGQEDVRRRLAGMISGLDVRYDVGGPAHPLLGARLPCTEVRARRRLLTTTHLVRSGG + GVLLDLTGRPGRPPAVLDGWADRVTALDAQPSPGSSLQGTDRVLVRPDGHVAWAGPGTD + GLAEALTRWFGPPR" + gene 25529..27043 + /locus_tag="IE211_RS35180" + /old_locus_tag="GCM10010301_71170" + CDS 25529..27043 + /GO_function="GO:0071949 - FAD binding [Evidence IEA]" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330938.1" + /locus_tag="IE211_RS35180" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010301_71170" + /product="FAD-dependent monooxygenase" + /protein_id="WP_193450428.1" + /transl_table=11 + /translation="MEGTAADTDVIVVGAGPTGLMLAGELRLGGARVVVIEKLAAPTGQ + SRGLGFTARAMETFDERGLLPRFGQGETLATSPVGHFGGAQFDFTVLEDAHFGARGIPQ + GDTEAVLEGWAGELGADIRRGWEFVSLTDGFLDGDGVEITVRTPQGEERTLRASYLAGC + DGGSSRVRRAAGFDFPGTDATQGMYLADITGVELTPRFLGERLNNGMVMAAPLSQGVWR + IIVCPDGRPAHDRERTVTFEEVAAAWQDITGEDISHGGASWVSSFTNATRQASEYRRGR + VFLAGDAAHIHLPAGGQGLSTGVQDAANLGWKLASVIRGDAPRELLDTYHAERHPVGAR + LLMNTRAQGIVFLGGAESDPLRELMAELVRYDDVKRHLAGIVSHLDIRYDLADTATGPT + HPLLGRRMPPRLLVGADGETRIARLLHAGHGVLLDLADDETVRATAAGHADRVDVVTAV + AKPTDGPDALAGATAVLIRPDGYVAWTGTCAQGLETALERWCGPPR" + gene complement(27262..28224) + /locus_tag="IE211_RS35185" + /old_locus_tag="GCM10010301_71180" + CDS complement(27262..28224) + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330937.1" + /locus_tag="IE211_RS35185" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010301_71180" + /product="acetylserotonin O-methyltransferase" + /protein_id="WP_234311021.1" + /transl_table=11 + /translation="MVTRAVHVAAELKVAEALAEGPLSADELAGRVGADADALGRVLRL + LASNGVFATRPDGAFELTPMADALRADHPMSMRGIALLMGHPIHWEDWSGFPETVVTGE + PALPKLRGMHAFEFLTKNAEYGQVFFQGMGSMSASETEPILAAYDFSQFGTVVDFCGGQ + GALLAGILGAAPGCEGVLFDPRVEENGAAEFLAAQGVADRTKRVAGDLFDVPPGGADAY + VLKHIVHDWPEEQALRILRNVRAAIKPGGKLLIAEMVIPEQGDQPHSGKLVDLWLMLLV + GGRERTPGQYADLLARAGFRLERVVETAAAISLVEAVPV" + gene 28591..29706 + /locus_tag="IE211_RS35190" + /old_locus_tag="GCM10010301_71190" + CDS 28591..29706 + /codon_start=1 + /inference="COORDINATES: protein motif:HMM:NF033206.1" + /locus_tag="IE211_RS35190" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010301_71190" + /product="ScyD/ScyE family protein" + /protein_id="WP_193450429.1" + /transl_table=11 + /translation="MANSRNSWTKILLAAGAAGAVAVPLTAGPVQAQPQAHRHGHTHTR + TEATVTVVASQLNNPRGVTALGDGGVLVAEAGAGLADCPVDQTCVGTTGSVYKVKGSFQ + GRVATGLASTAKGVAPGAPISANGPSDVVPDRFGGYVVVSGLGGTTESRAALGEGAQTL + GTVFRTRDHKVLADLTDHETRLNPDGGDVHANPWRLARSGSGYLATDAGANTVVRGNAD + GTTATEYLLPKNELPTGAAETVPTGIAKAADGTVYVADMSGGRVGASRVWKIAPGRQPE + ILATGMTNLIDLDLDRDGDLIALSYSAAALAGPPQPGALFEIDADSGAVTEIPTGDQLK + QPTGVAVDPCGKVYVTNNTLGTNGQLVRVNR" + gene 29956..31071 + /locus_tag="IE211_RS35195" + /old_locus_tag="GCM10010301_71200" + CDS 29956..31071 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_003962403.1" + /locus_tag="IE211_RS35195" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010301_71200" + /product="inositol-3-phosphate synthase" + /protein_id="WP_127437809.1" + /transl_table=11 + /translation="MTSADETRTGVWLVGARGSVATTAVSGCAALAAGLLPPTGMVTET + PPFADCGLPALASLVFGGHDTATTPLPKRAEELAAQGVLPPWLPTAVQGELAAADEHIR + PGGPVPGDRRATEELIADFATDLRTFARTTGVARTVVVNVASTEPDPAHGAWPASSLYA + AAALRAGCPYVNFTPSTGLSHPQLAGAARASGLPYAGRDGKTGQTLLRSVLGPMFAQRA + LAVRAWSGTNLLGGGDGAALADPAAAAAKNAGKERVLTDTLGTRVEGEVHIDDVPALGD + WKTAWDHVAFDGFLGTRMVLQTIWQGCDSALAAPLVLDLARLLARAHERGLSGPLGELG + FYFKDPDAEGSALAEQYTRLLTLADRLGGTR" + gene 31068..32021 + /locus_tag="IE211_RS35200" + /old_locus_tag="GCM10010301_71210" + CDS 31068..32021 + /GO_component="GO:0016021 - integral component of membrane + [Evidence IEA]" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330933.1" + /locus_tag="IE211_RS35200" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010301_71210" + /product="UbiA family prenyltransferase" + /protein_id="WP_193450430.1" + /transl_table=11 + /translation="MSAQRPAHGPARDGHLHAWAELLRAPAALTVPGDVLAGTAAAGTR + PTGRTALAAGASLCLYEAGMALNDWADREEDATARPHRPLPSGRVRPGAALAAAGLLSA + AGLALAACAGRRALAVAGPLAATVWAYDLGLKHTPAGPAAMAAARSLDLLLGAAAGPGA + VRRAIVPAAFLGSHTLAVSLVSRRETEGGSSTAPLTALAAAGALTTVLAGRPTAHPAPD + ASTGAPTPATPADKATRAVRAALAASYAATFARPLAHAALNPSPELTQRAVGAGVRATI + ALQSGLMARAGAPGTGVLTAALAPLAAHLARKVSTT" + gene 32018..32863 + /locus_tag="IE211_RS35205" + /old_locus_tag="GCM10010301_71220" + CDS 32018..32863 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018384637.1" + /locus_tag="IE211_RS35205" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010301_71220" + /product="sugar phosphate isomerase/epimerase" + /protein_id="WP_019330932.1" + /transl_table=11 + /translation="MSPLRLGYGTNGLTDLRLEDALRLLADLGYDGVGLTLDHMHLDPL + APDLAARTRHVARQLHRLGLAVTVETGARYVLDPRRKHGPSLLDDDPDARWARVRLLIR + SVRVAADLGAHAVHCFSGPRPAGLDQDTAWKRLADALGPVLDAAEDTGVPLAVEPEPGH + LLATLTDFHRLRTELGDPEPLGLTLDIGHCQCLEPLPPADCVRAAAPWLRHVQIEDMRR + GVHEHLPFGDGEIDFPPVLDALAATGYQGLTVVELPRHSHAGPELAAQSMRFLRNGGTR + " + gene 32860..33459 + /locus_tag="IE211_RS35210" + /old_locus_tag="GCM10010301_71230" + CDS 32860..33459 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019890542.1" + /locus_tag="IE211_RS35210" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010301_71230" + /product="EboA domain-containing protein" + /protein_id="WP_079126814.1" + /transl_table=11 + /translation="MTVVHTPPDADLPGEFAGLGTDARRWLTAARASATARDTDWELRF + AEAGRRCGTEHADAARVLLLTAARPDAETVTLLYHRGTAAERRAVLLALDGLDTEPAHA + LPLVEDALRANDTTLLAAALGPYAARHLDAHQWRHAVLKCLFTGVPVATVANLAARARA + DAELARMLRAYAAERTAAHRDIPADLDRVLALTQEQ" + gene 33461..>33697 + /locus_tag="IE211_RS35215" + /pseudo="" + CDS 33461..>33697 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_016327783.1" + /locus_tag="IE211_RS35215" + /note="incomplete; too short partial abutting assembly gap; + missing C-terminus; Derived by automated computational + analysis using gene prediction method: Protein Homology." + /product="hydrolase TatD" + /pseudo="" + /transl_table=11 + /translation="LRIFDPHIHMTSRTTDDYEAMHAAGVRAVVEPAFWLGQPRTSPAS + FRDYFDALLGWEPFRAAQYGIAHHCTIALNPKEA" +ORIGIN + 1 gatgtgcgac gccttcaaca tccccctcgt caccttcctg gacgtccccg gcttcctgcc + 61 gggtgtggac caggagcacg gcgggatcat ccgtcacggg gccaagctgc tgtacgcgta + 121 ctgcaacgcg accgtcccgc ggatctcgct gatcctgcgc aaggcctacg gcggcgccta + 181 catcgtgatg gactcccagt ccatcggcgc cgacctcacc tacgcctggc cgaccaacga + 241 gatcgcggtg atgggcgcgg agggcgccgc caacgtcatc ttccgccggc agatcgccga + 301 ggccgaggac cccgacgcgg tgcgcgcccg catggtcaag gagtacaggg ccgagctgat + 361 gcacccctac tacgcggccg aacgcggcct ggtcgacgac gtcatcgacc ccgccgagac + 421 ccgcgaggtg ctgatcgagt ccctggcgat gctgcgcacc aaggacgccg acgtgccctc + 481 ccgcaagcac ggcaaccccc cgcagtgacg gagtgatcga tggccagaca ggaacgtgcg + 541 gtgcgtacgc gggaagccct gatcaggtct gcggccgaga tcttccacga cgagggcttc + 601 cacgccgccg cgctcaccac gatcagctcc agggcggggg tgagcaacgg cgcactgcac + 661 ttccacttcg ccagcaaggc ggcgctggcg gacgcggtgg aggaagcggc cgcagacgtg + 721 ctgcgggccg tcgtcggccg gtgggacggg ggaccgcccg gggttctgca gtgcctggtg + 781 aacgccaccc atgagctggc ctgcgccctg cagaacgacg tggtgctgcg ggcgggtttc + 841 gagctgagcc gggaggccgg ccggcagccg cggaccgacc tgcggctgtg ctggcagaac + 901 
tgggtcaccg acatggtcgg ccgggccggg cgcggcggcg agctgcgcga gagcgtggcg + 961 ccggagagcg ccgtggccgc cgtggtcgcc gccaccagcg gcttcgaggt gctcggcatg + 1021 cgcaaccagg cgtggctgtc ccgcagtacg gtcgcccagt tctggctgct gctcctgccc + 1081 gcgctcgcgc cggcgccgca cgccgggctc tggcaggccg agggctcctg gaccgggacc + 1141 gccaccggat aattaaagac cgtacggtct cctttggggg cgccgaccgg acgcccgaat + 1201 cgggcattcg ggaaacggcg ccccttttcc ctgtgcgggg cttccccgtc ccgcgcgatc + 1261 cgcgccgatg gtttccagtc aatcgctccg gtgctggaca gggcgcggtt tcgcgcaaca + 1321 ctggcgaatc atgggcgggt tgagtgatga agggcctgtt cggagccggg ttgtgggcag + 1381 atgttcgatc agggtttgac tggatctggg cgatgccggg gcggcgcgtc gagtccacat + 1441 tgacaaaccg actgagctgt ttttttatcg ggactgcagc cgcgccgggt cccggtcagc + 1501 gggagacgcg caggccggcc accggcctgc ggccttgaaa acatggggga aacgtggaca + 1561 tcgaagtgct gggtgcgctg tcggtgcgcg agcacggggt gtcggtcgtg ccgaccgcac + 1621 ccaagccgcg ccaggtcctg gccctgctcg cgctcaacgc cgaccaggtg gtcccggtgg + 1681 ccgcgctcgt cgacgaactg tggggggaga acccgccgcg cagcgcgcgg accaccctgc + 1741 agacctacgt cctgcagctg cgcgagctga tggcccaggc gctggcccac ggccccgacg + 1801 aacgctgcac cgccaaggac atcctcgcca cggttcccgg cggctaccgc ctgcagacac + 1861 gcggcggcca cgtcgactac cgcgagttcg accagcgcgc cggcctcggc taccgggcca + 1921 tggacgccga ggactacgcc ggcgcggccc gccggctggc cgacgcgctc gcgctgtgga + 1981 acgggcaggc cctgaccgac atccaggccg gcctgcgcat cgacacggag gtcaagcggc + 2041 tggaggaggc ccggctgtgc gcgctcgacc agcgcatcga ggccgacctg cggctcggac + 2101 gccaccggga actgctgtcg gaactgacgg tcctggtcaa ccagtaccgc atgcacgaga + 2161 gcctgcacgg ccagttcatg ctggccctgc accgctcggg ccggcgcggt gaggccctca + 2221 acgtctacca gcggctgcgc agcacactcg tgcacgaact gggcctggaa ccctccgccg + 2281 cgctcagccg cctgcagcgc tccatcctca tggcccgccc cgagacgccc gccgccgccg + 2341 gcggcagcgg ccgcctcgtc acccgctgac ccggccgccg ttcctcacgg gccgcacgga + 2401 tggtgtgccg tgagccgggc gacctgctcg gacagctccc gctgctgccg gcgcagcagc + 2461 tccacgtggc cgcgcagccg caccagctcc tcccggagca ccccgagttc gtccccgccc + 2521 tgcccggccg tcccggcccc 
cgcccggtcg gcggagtccg ccgccggctc acaagagcgc + 2581 agaatcgctt ctctgcgacg gctgagcacc tggcccggcc cgatacccag atcacgggcc + 2641 agccgccggc gcgccctgtc gtaggtgctc agcgcctcgg cccggcggcc gcagcggtgc + 2701 agcgccgtca tcagctgctc gtggaaccgc tcacgcagcg ggtgcacggc gaccagctcc + 2761 tccagctcac cggtgatctc cgcacagcgg tccgcccgca gacagacgtc gtagagcacc + 2821 tccagggcac gcagccggct ctcctccagc agcgccgcct cggccgaaca gatgggcccc + 2881 tggccgctgc cctgcagagc gggcccgcgc cacagcgcca gagcctcacg cagcacctcc + 2941 accgcccggc ccggggcggt ggcggccagc tcgcgcccct ggcccaccag acggtggaag + 3001 cgctgcgcgt ccgtcgccgc cggccccagg ctcagggtgt agcccagcgg ggaggtccgc + 3061 agccacacat ggcgcggccc gcccgggccc ggggccggca gcagccgccg cagccgggcc + 3121 acatgggcct gcagcgcgtt ggcggcgttg accggagggt gcccgcccca cagctcctcc + 3181 acgaggcact cggcgggcac cgcctgcccg gcccgcacca gcagcgcgcc cagcagcgca + 3241 cgctgcttcg cacccgcggg aacgatccgt acgccgaaac gctcgtcgtg gatctgcacg + 3301 gaaccaagaa tccggaactc catctcgccc ttgcccggga agcacccgat tccgcatccg + 3361 ccggcccgga tcacggcccc ggtattccct cacgaatagc aggtgcactt ccttccgcac + 3421 ggactctatc cgcccatggt ttccggcacg ctattctcca gccggccccg taccggcgtg + 3481 ggcgattcct cgagagttct tcagcccccg cggccctggc ccgcccgaaa aggacaggac + 3541 accgcgaccg aaaagcccgc cccgcccgga cagccggtga cacccacccg ccgcccgcca + 3601 ggacaggaaa cccggtaccg cccgccagga caggaaaccc tccgccggcg gccggaacag + 3661 ggaaccctcc gccaccggcc gggacagggg acccggcgcc gccgcccggg acagggcatc + 3721 ctccgccgcc ggacggccgg ccgcgaccgt ccccggacgg ccggcaccgc tccccggccc + 3781 ccgcacgcgc cgggcgacgc cgtcaccgcg gccctcgccg cggctctcgc cgtggccgga + 3841 aaaacaaccg aaacgaatac gcccccgacc gtaccgggcg caaaatcacc acccgtgagc + 3901 ggtaacccgg cgacagtccg gacaaagccg cagcctcctg tcttccaggg gcgggtcaag + 3961 cataactaga gccgccctcg cgcgccgatc agagaaccgt ccggttcctc ttgccgcgga + 4021 gtggcgggaa tgacgcggac aggcgcaagg aggcagtatc aagtagctcc gtcaacggct + 4081 cagaaccagt cgccccgaaa cattgcggag ggaattatgg aaataaaagt cctgggtgcg + 4141 ttgaacgccg aattcgaggg aatctcggtc gtccccagtg 
cgggcaagcc ccggcagatc + 4201 ctggcgctgc tcgccctgta ccccggccgg gtggtgccgg tgcccaccct catggaggag + 4261 atctggggca ccgacctgcc gcagagttcg atgaccacgc tgcagacgta catcctccag + 4321 ctgcgccgcc tgctgggcac ggccatgggc cccgacgtgc cgggctcggc caaggacgtc + 4381 ctggccaccc gctacggcgg gtacctgctg cagatacccg ccgaggcggt cgacgcgttc + 4441 acctacgagc ggctcgtgac cgaaggacga caggcctacg aggacggcga ggacgagcgg + 4501 gcggccacgg tgctgcgccg ggcgctcgac ctgtgggacg gccccgccct ggtcgacgtg + 4561 cgggtcgggc ccgtcctgga gatcgaggcg atgcgcctgg agcagagccg gctggtggcc + 4621 cgcgagcgcc gcatcgacgc cgacctgcgg ctgggccggc acgtcgaact catcgccgaa + 4681 ctcaccgacc tgatcgcccg ccacccccag cacgaagggc tgcactccca ggccatggtg + 4741 gcgctctacc gctccggcag gcaggccgcc gccctcgacg tctaccgcag gctccgccag + 4801 cggctcatcg acgaactcgg cgtcgaaccc tccccgcaac tgcagcggct gcaccaggcg + 4861 atgctcgccg tcgacccgcg cctggacatc gtggcgggcc cccggcgcac ctccacgttc + 4921 gacctgtacg cggcatgagg cgccggtgcc ctcgccgccc ggccggaccc ggcaggccgg + 4981 cccccgcggg gtcggcggcc gccgcggccg ccggccgggg ccgccgcccg cctcgccgcg + 5041 gggttgagcg ccgcacgagc cgcgcgggcg acgctcggtg cgcaggggca cccacccccc + 5101 ggaccggcgc cgggacggca ccgcgtggca cgcgccacgc cggcggcgcc cgcccggatg + 5161 gggccggacc ggaccgttca caaggagggc gacgcatggc ttcccgctcc agggaccgtg + 5221 aggcgggcac cgcacggatc acactcacct gcctcgccca cgccggagcg ggcgtggcga + 5281 gctaccgcgg ctgggccgcg gcggtcggac ccggcatcga cgtggccgcc ctgccgctcc + 5341 cgggccgcga cagccgccgc cgcgaaccac gcctgaccga acgcgccggc ctgctcgccg + 5401 acttcctgcc gaccctgctt cagacggcac gccgcggccc ctacgcgctc tacggacaca + 5461 gcatgggagc cctcgtcggc tacacgctca cccgggccct ggccgactcc ggcctgcccc + 5521 cgctgttcct ggccgtcggc gcctgcccgc ccccgcacac caccaccgtc ctggcggacg + 5581 cggcggacct gcccgacgag gacctgctgc cgctgctcga cgagatcggc tccctgccgc + 5641 cgggcgcctc cgcctccccc ggcggactgt ggcggcgcac cttcctgccc gtcctgcgcg + 5701 acgacctgcg cctggcccga tcgctgcgca acgccgccct ggacccggtc accggagggc + 5761 cgctggacgt gcccgtcctg gtcttcgcgg gccgcgacga cccgctcgcc gcacccgccg + 5821 
ccctgcgcca ctggcagcag tggaccacca acctgatcga actgcacacc gtcgccgggg + 5881 gacacttctt cgcaagctcc tcgagcctgg cccagcacgt cggccgggcc tgccgcggcc + 5941 acgtgaccgc gctgcccaca ggaggcggcc ggtgaaccgc gtcgtgatca ccgggatcgg + 6001 cgtcgtcgcc cccggcgcgg tgggcaccgc cgacttctgg gacctgctca ccgtcggccg + 6061 caccgccacc cgccgcgtca ccctcttcga cgcctgcggc taccgctccc gcgtcgccgc + 6121 cgaggtcgac ttcacccccg ccgcccacgg attcgacctc gccgacaccg aacgcctgga + 6181 ccgcgcggca cagttcgcgc tggtcgccgc acgcgaagcc gtcgccgaca gcggcgtcgc + 6241 ggaccgcatc ggccgcaacc ccctgcgcac cggcgtcagc ctgggcagcg ccatcggctg + 6301 caccacgagc ctggccaccc agtacgccat cctcagcgac tgcggcacca cctggaccct + 6361 cgaccacacc gaggccgccg aatccctcta cgactacttc gtccccagct ccctggccgc + 6421 caccgtcgcc cgcgaccggg gcgcacaggg ccccgtcgcc ctcgtctcca gcggctgcac + 6481 ctccggcctg gacgccgtcg gccacggcgc cgacctgatc cgggaaggca gcgccgacat + 6541 cgtcgtcgcc ggcggaacgg aagcacccat cgtgcccatc gccatggcct gcttcgaccg + 6601 cctgcgcctc accagctccc gcaacgacga ccccgccacc gccagccgcc ccttcgaccg + 6661 cacccgcgac ggattcgtgc tcggcgaggg cgccgccgta ctggtcctgg aagaactcga + 6721 acacgcccgc cgccgaggcg cccgccccta cgcggaactg tccgccgtca ccgcccacag + 6781 cagcgcccac cacatgacgg gactgcgccc cggggcactg gagatggccg acgccatccg + 6841 cgccgccctc gaccaggcac ggctgaaccc cgccgacgtc gactacatca gcgcccacgg + 6901 cgcgggaacc cggcacaacg accggcacga gacacacgcc ctcaaggaaa gcctgggcgg + 6961 cagcgcccac cgcgtgcccg tcagctccat caagtcgatg atcgggcacg ccctgggcgc + 7021 cgccggcgcc ctggacctgg ccgccagcgc cctggccatc cggcacgaca ccgtcccgcc + 7081 caccgccaac ctgcacgaac ccgaccccac ctgcgacctc gactacaccc ccctgttcgc + 7141 ccgggaacag cgcaccagca ccgtcctcac cgtcgccagc ggcttcggcg gcttccacac + 7201 ggccgccgtc ctcacccggc cccggctcaa ggaggcggca tgaccaaggc gacccaggcc + 7261 cccgaaccgg cccggcccgc cggcgccgag ggcccccgcc agaccctggt caccggcatc + 7321 ggagtcgccg cacccaacgg cctgggcacc agagcctggt gggacgccgt gctgtgcggg + 7381 cgcaccggac tgggtcccat cacccgcttc gacgcctccg gctaccccgt acgcatcgcc + 7441 ggcgagatcc ccggcttcgt 
cgacgaggac cacatcccca gcagactgct gccctccacc + 7501 gaccgcggca cccgcatcgc cctggtcgcg gccgaagaag cactgcgcga cgcgaacgtg + 7561 agcccggccg acctgcccgc atacggcgcc ggcgtgatca ccgccagctc cgcgggcggc + 7621 gccgaattcg gcgaacgggg actggccgcg ctgtggagca aaggcgccca gcacgtcagc + 7681 gcctaccagt ccttcgcgtc cttccacgcg gcagcccccg cacagatctc catccggcac + 7741 cggctgcgcg gccacggctc gaccgtcgtc agcgaacagg ccggcggcat cgacgcactc + 7801 gcccgcgccc ggcggcggat ccgcgacggg gcatgcctca tggtcaccgg cgggatcgac + 7861 tccacactgt gcgcatgggg ctgggccgcg cacctggcgg acggccggct cagccccgcc + 7921 accgaacccg cccgggccta ccggcccttc gcggccacgg ccgacggcca cgcggtcggc + 7981 gagggcggcg ccctactggt cctggaggac gcccgggccg ccgcccgccg gggcgccacc + 8041 ggctacggcg tcatcgccgg ctgcgccgcc accttcgacg gccccgaccg ccccacactg + 8101 cgccaggccg cggaactcgc cctggccgac gccggcctgg cccccgaaca cgtggacgtg + 8161 gtcttcgccg acggcgccgc cgagcggcgc gccgacctcg tcgagagcca ggcgctgtgc + 8221 gcgctgttcg gaccctacgg agtaccggtc accgtgccga agacgatgac cgggcggctg + 8281 ggcgcgggcg gctcggccct ggacgtggca gccgcgctgc tcgccctgcg cgagaaggtc + 8341 gtacccccga ccaccggaac cggacgcgtc gccgacgact gcccgctgga cctggtcacc + 8401 ggggccccac gggaactgcc ccggctgcga gtggcgctgg tactggcccg cggacggggc + 8461 ggcttcaact ccgccgcagt gctccaggcc cctcagacgg agtgacggcc cgcccctaat + 8521 gagacggagc ggaacacacc ggcggccagg aacggcccgc ggccccgcgg accgcgcaaa + 8581 gggaaacacc cccggcgccg actccccggc cctcctggct ccccggcccg cccgggctcc + 8641 cggccttccg gctcctggcc tcctggcctt ccggcctccc ggccttccga gctcccggcc + 8701 ctcccgggct cccggcctcc cgggctcccg gcctcccggg tccctggcct tccggccttc + 8761 ccggtctctt ggcctcccgg ctcccggccc ccggccgttc gtctctgccg gctgcccggc + 8821 gttccgccgc cccgctcggg gcacgcgtgg tggcgtcctg gcctagcgga cgtcgtggtc + 8881 ctcgtcggtc agttcgcggg ccaggcgccg ctccaggtcg gtcagaggca tgtcgtcgcg + 8941 cacccgttcc gggtgtcccg gcggcggccg gtgccaccgg atgcgcgggt gcggaggggg + 9001 gtcgtaccgg tccgtctcgc cggccaggca gagccgcccg taggcgacca ggccctccca + 9061 caggccgcgg atgcatcggc gcgggcggaa gcgtctcatc 
cctgccacct cccggatcgc + 9121 ttctggggcc gcaggccacc gtcggtcacc gggctcgagg acccgacggt tcccgctgga + 9181 gcgcgtgccc ctgggcgccg ctccagcggg acacgagcgc gctaccggca catccctagc + 9241 ggttccggac agggtcgaga aaagccgcag tacgacgggc ccggccgcac cggcccgccc + 9301 cggtggaccc ggcacgcgtg cggcccagcg gggaccggcc cggcggcgac gccttggacg + 9361 acggagggtg tggacgatgc cggatgcgcg agtgcaccgt actgcctgtg agatgacggc + 9421 cccggccccg agcggagtgc tctacggcct gatcgcggac gccaccgtgt ggccgctgtt + 9481 cttccctccc agcgtccacg tggaacaact ggacttcgac gggacacggg aacggctgcg + 9541 catgtgggcc gtggcgggcg accggatcag ctcctgggtc tcccaccgcc gcctggacgt + 9601 cggacagcgg caggtggagt tccgccagga acggccctcc gccccggtcg agacgatgac + 9661 cggcctgtgg accgtcgagc ccctgggcga cggctcccgg gtgaccctgg aacacgcctt + 9721 caccgtcatc ggcgacgctc cggccgacgc ggcctggacc gagcgggtca cccgcgccaa + 9781 cagccgcgcc cagctccagc gcctggcctg gctcgccgag cgctggaccc ggctggacga + 9841 cctcgtgatg tccttcgagg acaccgtccg ggtcaacgtg cccgccgagc tggtcttcga + 9901 cttcctctac cgggccggcg actggcccga cgacctcgcc ggcacccgcc ccctgacggt + 9961 gcaggaggac acccccggca tccaggtcct cgccctggac ggccggtcgg ccaccggcgg + 10021 cgaggcggtg cgcatcagct tccccgccgc cggccgcctc gtgcacaaac acacccgcac + 10081 atccggaccg ctggccgcgt acaccggcga gtggaccatc gagccccagc ccggagccgg + 10141 cctcgacgtc accgtgcggc acgacgtgct gctcaacgac gacgccgcac tggaccagga + 10201 cgccgcccgg cgggcgtgcg acgaggtcgg ccgggccggc cgccgcctgc tggagcacgc + 10261 cgtgcgccac gcctccgacg cggtgcgggt cctgtgaccg ccgccctcga cacggccgcc + 10321 gggccgacgg ggcagacccc cgccccgcgc agcaccaccc ccacacccga acacaccacc + 10381 cccacacccg aacccgaaca caccacccgc gcacccgccc ccgaatccca acacaccacc + 10441 cccgaacgcg agtgcgccgc ccgcgtaccc gaacccgagc gcgccgcccg gctggaggcc + 10501 gcgctcggcg accccttcga cccggccaac ccgcacggac acctcgccct ggtccgggcc + 10561 gacgacaccc gcgaggcacc acacgccacc gaggcgctcc tgaccgagca cggcctgtcc + 10621 gccgagttcg tcccccacga cctcggcgga cgcctgaggg acctcgaaga gctggcccgc + 10681 gtgctgcgcc cgctcttccg ccgcgacctg gccctcggct acggcttcgg 
catcacctcg + 10741 ctgttcgccg cgtcctcggt gtggaccgcg ggcgaccccc accagcgcgc ggccctcgcg + 10801 gacgtcctgc tcggcggagg ccgggtcgcg atcgtgcacc gggaggtggc acacgccaac + 10861 gccatcctgc gccgcgaggt ccgcgcacaa cgccctgcgg gcggcggctt cctgctcaac + 10921 ggcagcaagg acgccgtcat gaacgccgac cgcaccgaca ccttcgtcgt ctacgcccgc + 10981 acctccgccg gctccggctc cgccagccac tcggtgctcc tgctgcccgg accacccgcc + 11041 tccggagaag tgcgccggct ggcgcgggtg gagatgcccg gcatgcgcgg ggcccgcttc + 11101 cacggactgc gcctggccga cgtacgactg cccgacagcg ccctggtcgg ctcgctcggc + 11161 gagggcgtca ccctggccct gcgcagcttc cagatcagcc actgcctcat cccgggcacg + 11221 gtgctcgcgg gcgtggacag cgtcctgcgg ctcgcggtgc gcgccgccac cgagaaccgg + 11281 cccgacggac ggcccgcccg ccgctggcac aaggcactca gcggggtctt cgcggacctg + 11341 ctcgcctgcg acgccatggc cgtcacggga ctgcgggcgc tcagcctcgt accccagcac + 11401 gcccatctgc tcgcggcggc ggtcaaatac accatgccgg acctgctgcg cgaggacctg + 11461 gaagaactcg ccgccgtgct cggcgcccgc ggctacgacc gcggcccgct gtacggcggc + 11521 ttccagaaac tcgcccgcga cctgcccgtg gccggactcg gccactcggg aacggccgtc + 11581 tgccaggcgg tgctcgtacc ccagctgccg gccctggcac gcacggcatg gttccggacc + 11641 gccgaaccga gcgccgcact gttcctgccg ggcgcgccgc tgccaccgct cgaccaccgc + 11701 aggctgacgc actccgggac cgacgacccg ctcacggcca ccctgatcgg ggccgccgaa + 11761 cggctggccg cacggacggg gacacaacca ctgcacgccg ccctcgccgc gctggcccgc + 11821 gccctggtgg aggagctgcg ggtgctgcgc gcgcgctgcg cggccctgcc ggccgccggg + 11881 agcaccgtgt tcgacccgct ggcctgcgcc ctggccgacc ggtacgccct gctgctgtgc + 11941 gccgccgcct gcctcggggt ctgggaggga caggcggacg gtgacggctt cctcgccgac + 12001 ccggcctggg cggtgctcgt cctcagccgc atcggccgca gactcggcat cgccgtaccc + 12061 gagacaccgg cggacgcgga acaggcggtc ctggccgagg cgctgggacg ctgccggcac + 12121 ggccgcagtc tcgacctgta cgacacccca ctggccggct gaccgagacg gcacggcaag + 12181 acgcccccca cctcggcccg ccccccccaa agggggagcg ggccggcgag aaccacacgc + 12241 agggagacga cgatggagcg ggtcacatgt gccgcgcccc ttcacgtgcc gcggccccac + 12301 ggcccctggc ccgcggtgcg cgaggacctc ttccggcacg gcaacgcact 
ggtctgcacg + 12361 acgtggagcg aatggctgcc cagcgtgctg accaccccgc ggctgcggga actgctcggc + 12421 gacgactggc agcgctaccg gcgtacccgc gacgccgcgg tgcgctaccg gttcgccgcc + 12481 tcccgcatgc tgatcaagta cacggcggcc gccgccctgg ccgtcccgcc cgagtacctg + 12541 gacctggcct accggctggg cggccggccc tacctgcgcg gcttcgacca gatcgaactg + 12601 agcctgagcc acaccgggga cgtcatggcc gtcggcctga gccgcatcgg ccggatcggg + 12661 gtggacgtgg aaccggccga gcggcccgta cggctggacc tgctcgagac ccaggtcttc + 12721 acaccggccg aggcccggga actggccgag ctgcccgaag gcgagcggac cgcccacgca + 12781 ctgcgcctgt ggaccctgaa ggaggcctac agcaaggccc tcgggcaggg actgcggttc + 12841 ggcttcaagg agttcggctt ccggcagggc cggctgagcg cacccgacgg cagccgggtc + 12901 acccgcgacg agtggggctt cgccacctac cccgtcatgg accgcttcct gctcagcgtg + 12961 gcctgccaca acgccggact gagcaccgcc ggggacacct ccgtggggac catgctggac + 13021 caggggttcc tgtcggcgat gacggacacg ggacagcagt agcgggcgtt ccggtacggc + 13081 cccaccgctg cagaagcgtt tctccgcccg gtcgcgagca gcgtcagcgg gccgtcaggc + 13141 ccatggcagc caccggtgcc acgatgccgg gggagtaccg cgccccctca acgggcccgc + 13201 cgctccccga gaaccgtgcg cacggccggc ccgtgcggga ggaggcagcg acgaggaggg + 13261 cgtcccatgg cgtggcacag ccgcccgcgt gccctgcggg gccccggcac ggcccgtccg + 13321 ccgggcgtac cggccctgtg gccccacctc gacctgctgg gcgacttcgg cgggcgccgt + 13381 ggcgccgggc gccacgtcga gcagctcgtc tggcgctggc acggcccgct ggacaccgag + 13441 cggttcaccg cggcctggca gtcggtcgtc gaccgcgaga gcgtgctgcg ggccgccctg + 13501 gcccccgggc cccggccgca cctggtcctg cacgagcacg cccacggcga cgtcgtgcgc + 13561 caccgtgcgg gcggcgccgg atgggaccgg ctgctggagc gggaccgccg gcgcggcctc + 13621 gaccccagcc gcccctgccc gctgcgcgtc accctcgtgg agcgcaccga cgacccggcc + 13681 ggtgccgggc cggtgacccg ggtggtcctc accttccacc acgcgctgct ggacgcgtgg + 13741 agcgtgtgcc tgctgatgca ggagctgtgc cgggcctacc tcgccggcgg cgagctgccc + 13801 ggcggcgagc gccgccccga cctgcgcgac tgggcgggct ggctccagcg gcaggacccc + 13861 gccggagccc gggacttctg gcggggcacc gtgcccgacg gaccggtcgc cgtgctgccc + 13921 gcccggcccg gcccgcgcac ccgccagcgg ggccggggca ggaccgaggt 
acggctgagc + 13981 cccgccgagg ccgaacggct ccaccgctgg gccgccctgc gcgccgtacc cgactccagc + 14041 gccctggaga cggtctgggc gctgctgctg taccgcgcgg ccgggcccgg cggggccgcg + 14101 acggtgggct tcggcgtcac cgtctccggc cgcggcatca ccctggactg cgccgagcgg + 14161 ctgcccgggc cgctgcgcaa ctgcctgccg atggtggtcc gcgtggaccc cggcgagacg + 14221 gtcggccggc tgctgacggc cctgcgggac cgggcgctgg acatggccgc ctacgaatgg + 14281 gtctccaccc gccggatcca ccgctggacg ggccgctgcc ccgacgggga actgctgcag + 14341 agcgtggtct cggtggacag acttccgcgc ccgccgggca acctgaggaa cgaactcgcc + 14401 gacgccggca tcgcgctgga gccggaaccg gcgcacggcg cctgccccga cctgcccgtc + 14461 gccctgctgg tccgtcccgg cggcgacggc cgcctcacct tctgcgtcga ccacgaccgc + 14521 aaccggatct ccgacgccga cgcccgcctg ctggccgggc actgcgcccg gctgctgcgg + 14581 cacctgcccg gcaccgacga ggccaccacc aacggggccg tgctggacgt gctcgccggt + 14641 gaggcactgc cgcgcatcgc gccgcggccc tcaaggccgc gaccggccgg gtcctggctc + 14701 cggccgcgct ccacttcctc cggggcggcc gtcgaccggg ccgcgagcca cccttgacac + 14761 tctgggccga ccgatcaccg aggaggtgcc catgcacgaa ggcgacgacg aacggcacga + 14821 gggtgacacg gcccgatgcg ccagggcggt ccacggcggc ccgccgcccc tgcggctggc + 14881 gggcgcggag gagcgcgagg acgaggacgg acgcgtcatc gtccgcagca tcgactagcc + 14941 cggacacccg aaacgacgca cgacgcacag cgcacgaccc acgggcgcac agcgcacagc + 15001 gcacgaccca cgggcgcaca gcgcacggcg cacagcgcac ggcgcacagc gcacggcgca + 15061 cggcggaggc gggcggcggg ccgggcgggg ggagccgggt ccagcgaggg tcgagcggcc + 15121 cccggcaagc tggccccgga cccacggccg cccccgacgc ccgcgcgaca gccgcccgga + 15181 gcacgggaag cgcccacgca cgcagcaccc tctggaagcg aggacccgcc catgccgtcg + 15241 atgccgcgcc cggacgccgt gacggtgccc gactccgtcc aggcgttcct gaccggtacg + 15301 gcgctcgtcg ccgcgttcac gacgatgcgg ccggacggca caccgcacgt ggcccccgtg + 15361 cgcttcacct gggactcgga cgcccagctc gcgcgggtga tgacggtgcg ctcctcccgc + 15421 aaggcccgca acctgctggc cacgcccggc gccccggtgg cgctctgcca ggtggacggc + 15481 ttccgctggg tcacgctgga ggggaccggc acggtcgtga ccgaccccga acgggtggcg + 15541 ctcggagcac ggctgtacgc caagcggtac tggtccgccc cgccgacccc 
gtccgaccgg + 15601 gtggtcatcg agatcgcggt cgaccgcgtc ctcagcctga acgcctgaac gcctgaacgc + 15661 ctgccccgcc ggctccgcac caccaccccc accacccacc acccatcacc gcccccatcg + 15721 ccccccaccg cccccgccgc cccggaccgc gtccggggcg gcacgcgcgt gtaccgcggc + 15781 gcggcgccgc cggacgtccc ggcgccgccg caccacggcc gcggtcaccc caccgcgccc + 15841 gcggtcgccc caccgcggct cggggtcacc gcaccgcggc ccggggtcac cgggccgggg + 15901 gaggggagcc gtccgcccac agcagccgga aggccagcag gctcagccgc cagccccgcg + 15961 cggtgcggcg cgcctcgccg ttcacgaacg tgcccgtcgc gaagagcggg ggcaggtccc + 16021 cctcgggagg cgtgtgatgc gggtggtgca catgggtgga gatcaggttc gcccggaaca + 16081 cggcccggtc cccgtccacg tcgaccacgg ccggagaacc gaggtgctgg gtggccgcga + 16141 acgccgacag cgccgaccgg tggtactcgg ccatgccgtc ggcgccctcg tgccggctga + 16201 ccgggaacgc gacgaccgcg tcctcggtga acaggccggc ggtccaggcg tcgtcgagcc + 16261 gctcgtcgtc gagcgagacc agataccggt gcagcagacc ggcgacctgt gcgctcgact + 16321 cggcggcgga cacggatgcg gattgatcgg tcgtcagact ggaggtcatg ccagagaatg + 16381 ccgtcacccc acgcgcccgg ggcaagaccg cttgtcgaag ctctgacgta ccagacgttt + 16441 ttctggcatt gactgcacaa gacctgtaac aacgcctatt tacagccctc gtaagccctc + 16501 gcactattga tggaacacca gtgagaagag ggcagatgga attctacgat tcagatgtca + 16561 ttgtcgtggg agccggtccc accggtctta tgctcgcagg tgaattgagg ctcgctggag + 16621 tctcggtggt ggttctcgac aaactttccg agccgattca ggaatcccgc gccctgggtt + 16681 tctcggcgcg gaccatcgag gaattcgcgc agcgcgggct gatggaccgg ttcggcgagg + 16741 tcggagtcat cccggtcggc cacttcggcg gcgtcccgct cgactaccgg gtgatcgagg + 16801 gcggttcgta cggggcgcgc ggcatcccgc aggcccgcac cgagggcgtc ctgggcggct + 16861 gggcgcgcga gctgggcgcc gacatccgcc gcgggtgcga ggtcacgggc atcgagcaga + 16921 ccgacgcctc ggtgaccgtc accgccgcgg gcgccgacgg ccccttctcc ctgcgcgccc + 16981 gccacgtggt gggctgcgac ggtgcccgca gcatcgtgcg caagctcgcg ggcatcggct + 17041 tccccggcac cgagccggcc atcgagctgc gcttcgccga cctggccgga gtggcgctgc + 17101 ggccccggtt cagcggggag cgcgtcgccg gcggcatggt catggtcatc ccgatgggcc + 17161 cggaccgctg ccgcgtcatc tacttcgaca gctccgagcc gctgcgcacc 
agcccggacc + 17221 cgatcacctt cgacgaggtc gcccagacct ggcagcgcct gaccggcgag gacgtcagcg + 17281 gcgccacccc gctgtgggtc agctccacca cggacgtcag ccgccaggcc gaccggtacc + 17341 gccacggccg cgtcttcctg gccggcgacg ccgcgcacat ccacctgccg atcggcgcgc + 17401 agggcatgag cgcgggcgtg caggacgccg tgaacctcgg ctggaagctc gccctcgaca + 17461 tcaagggcca ggcgcccgaa gggctgctcg acacctacca cgccgagcgc caccccgtcg + 17521 gggcccgcat cctgaccaac accctcgccc agcgcatcct ctacctcggc ggcgacgaga + 17581 tcacgccgat gcgcgaggtg ctcgccgagc tgatgggcgc ccacgaatcc gtccagcgcc + 17641 acctggccgg catggtcacc ggcctggaca tccggcacga cgtcggcgaa ggcgaccacc + 17701 ccctgctcgg ccggcgcctg ccggaccggg aactggtcgt cgacggtgag aagaccccgt + 17761 tctacgcgct gctgcgcacc gcacgccccg tgctcctgga actcgggggc gaccacggcc + 17821 tgcgcaccgc ggccgccggc tgggccgacc gggtcgacct cgtcgcggcc gagttcgacg + 17881 gctgcgaggc ccccgtggac ggcatcctcg tccgccccga cggctacgtc gcctgggtcg + 17941 ccggcctcgg cgccgggccg gacggtctca ccgccgccct cggccgctgg ttcggcccca + 18001 ccgcctgacc gtcgcgggcc gcgcagcgac acccaccgca cccaccaagg aaagcgaagg + 18061 acccatgccc atcatctccg ccgaggacaa gcacctcacc gtcctgaacc tgttcaccac + 18121 ggacactccc gagaagcagg ccaagctgat cgaggagatg acgaagatcg tcaacgcggc + 18181 cgcgtacgag ggctggatgt cctccaccgt ccactcgggc gtcgacggct acggcaccct + 18241 caacttcatc cagtggcgca gcggcgagga cctcgagaag cgctacgcgg gcgaggagtt + 18301 caagcaccgc acgctcccgg tcttcggcga gatcaccacc tcgatccggc tgatgcagaa + 18361 cgaggtcgcc cacacgctga cctcggacgc cctcggcggc aagatcgaga tcggaccgga + 18421 ccgcgacgac tacaccgtct tcaccctctt cccggtcacc cccgaggggc aggacgaggc + 18481 cgtcgacgcc ctcggccccg gccaggcctt cctcgccgac gtgcccggct tccgcgccca + 18541 cgtcgtgctc aagggcctgc gcgcccgcgg cctggaggga tccttcgtca tctcctactc + 18601 ccagtgggac agcaaggagg ccttcgaggt ctaccgcgac caggcccccg aggagcaggc + 18661 cgacgcccgc aaggccgccg tggcccgcgt ccgcgccgtc gtcaccggcg agccctacct + 18721 caacacctac cgggtcgtgc acacgcgctc tgccggcgag tgagcccggc gcgccggacg + 18781 gcgcacggga cccgcacgcc ttcggacctc gtccccggca cccgggggcg 
caggcccgaa + 18841 ggcgtgctcg tgtgcacccg ccgcttcggc tcaggcggga ctcaggcagg ccccgtgcgg + 18901 ggcgctaccg ccaggccgca ccgtcgaagg cggtggcgcc gcagcccccc gggccgccgg + 18961 gccgggccgg tccgcccgct tcgagaaccc ttccgcgcaa ccgccgagga gctaatccct + 19021 atgcacagca cgctgatcgt cgcccggatg gcggccacct cgagcaacga cgtggcccag + 19081 ttgttcgccg acttcgacgc caccgagatg ccgcaccgca tgggcacacg gcgccgccag + 19141 ctcttctcct accggggcct gtacttccac ctccaggact tcgacgagga caacggcggt + 19201 gaactgatcg aggccgccaa ggccgacccg cgcttcgtgc ggatcagcga ggacctcaag + 19261 cccttcatcg aggcctacga ccccacgacc tggcgctcgc cggccgacgc gatggccacg + 19321 cgcttctaca gctgggaggc ctcccgttga gcgggcgacg cgttgtgatc accgggatcg + 19381 aggtgatcgc ccccggcggt gtcggcaggg agaacttctg gaacctgctg agcaacggcc + 19441 gcaccgcgac acggggcatc accttcttcg accccgcccc cttccgctcc cgggtggccg + 19501 ccgaagcgga cttcgacccc tacgagcacg gcctgacccc gcaggaggtc cgccgcctgg + 19561 accgggccgc gcagttcgcc gtcgtcgcct cacgcggcgc cgtcgccgac agcggcctcg + 19621 acatcccctc cctggacccg caccgcgtgg gcgtcaccgt cggcagcgcc gtcggcgcca + 19681 cgatgggcct ggaccaggag taccgggtgg tcagcgacgg gggacggctg gacacggtcg + 19741 accacaccta cgcggtcccg cacctgtacg actacatggt gcccagctcc ttcgccgccg + 19801 aggtcgcctg ggcggtgggg gccgaaggcc ccagcaccgt ggtctccacc ggctgcacct + 19861 ccggcatcga ctccgtcggc tacgccgtcg aactggtccg cgagggatcg gccgacgtcg + 19921 tgatcgccgg ctcctccgac gcgccgatct caccgatcac catggcctgc ttcgacgcga + 19981 tcaaggcgac caccccgcgc cacgacgaac ccgagtgcgc ctcccggccg ttcgacaaga + 20041 cccgcaacgg attcgtcctc ggcgagggaa ccgccttctt cgtcctggag gaactcgaca + 20101 gcgcccgcaa gcgcggcgcc cacatctacg ccgagatcgc cggctacgcc acccgctcca + 20161 acgcctacca catgacgggc ctgcgccccg acggcgtgga gatggccgag gcgatcgacc + 20221 tggccctggg cgaggcccgg ctgaacccgc agtccatcga ctacatcaac gcccacggct + 20281 cgggcaccaa gcagaacgac cggcacgaga cggccgcgtt caagcgcagc ctcggcgacc + 20341 acgcctaccg caccccggtc agctccatca agtcgatggt cgggcactcg ctcggcgcga + 20401 tcggctccat cgagatcgcc gcctcggcac tcgccatgga gtacgacgtc 
gtcccgccca + 20461 ccgccaacct gcacaccccc gaccccgagt gcgacctcga ctacgtgccc ctggtcgccc + 20521 gcgaccagct gatcgacgcg gtcctcacgg tcggcagcgg attcggcggc ttccagagcg + 20581 ccatggtgct cgccaccccc gaaaggagcc tcgtatgacc gcctccgtgg tggtgaccgg + 20641 cctgggcgtc gtctcaccca acggcatggg ggtgaaggac tactgggcgg ccaccctggg + 20701 cggcaagcac ggcatcggcc gcatcacccg cttcgacccc accggctacc cggcccgtct + 20761 ggccgggcag atcgaggact tcgacgccga ggaactgctg cccagccggc tgctgccgca + 20821 gaccgaccgc gtcacccggc tggccctggt ggccgccgac tgggcactcg cggacgccgg + 20881 cgccgacccc gcgcacctgc ccgagttcga catgggcgtc atcacggcct ccgccgcggg + 20941 cggcttcgag ttcggccagg gcgaactgca ggccctgtgg agccagggca gccagtacgt + 21001 ctccgcctac cagtccttcg cctggttcta cgccgtcaac agcggccaga tctccatccg + 21061 caacggcatg aagggcccct ccggcgtcgt cgtcagcgaa ggcgcgggcg gcctggacgc + 21121 cgtcgcgcag gcccgccggc agatccgccg gggcaccccg ctgatcgtca ccggcggcgt + 21181 cgacgcctcc atctgcccct ggggctgggt ggcccagctg gcctgcggcc ggctcaccac + 21241 cagcgacgaa cccgaccacg cctacctgcc cttcgaccgc gacgcgaacg gctacgtccc + 21301 cggagagggc ggcgcgatcc tcatcgccga ggacgccgac gccgcacgcg cccgcggcgt + 21361 ccgcccctac ggcgagatcg ccggctacgg agccaccatc gacccccggc ccggcagcgg + 21421 acgcgaaccc aacctggcca aggccatcga gacggcactg gccgacgccg acgtgaacgc + 21481 cgccgacatc gacgtggtct tcgccgacgg cgccggcgac ccggccggcg acctcgccga + 21541 ggcccgcgcc gtcagcacgg tcttcggcga ccggggcgtg ccggtgacgg tgcccaagac + 21601 catgaccggg cgcctgtact ccggcggcgc gcccctggac ctggcggccg cgttcctcgc + 21661 cctgcgcgac ggcgtcatcc cgcccaccgt gcacatcgac ccgtgcgccg actaccccct + 21721 cgacctggtc ctgggcgaac cccgcccggc cgagctgcgc accgccctgg tcctggcccg + 21781 gggagccggc ggcttcaact ccgccatggt cgtgcgcgcc gcctgaggac ccccgcgcac + 21841 cgcacccgac cgacgcaccg caaccgccac cacgtactga cgaaaggacc caccatggcc + 21901 agcaagtcct tcaccctcga cgacctcaag cgcaccctgc gggaggccgc gggcgtcgcc + 21961 gagggcgtgg acctggacgg cgacatcctc gacaccgagt tcgaggtgat cggctacgag + 22021 tccctcgccc tgctggaggc cggcagcctc atcgagcgcg agtacggcat 
ctccctggac + 22081 gaggaggccg tcggcgaggc caacacgccg cgcagcttca tcgaggtcgt caacgcgcag + 22141 ctcgcgcccg ccaaggccgc ctgaaggagc cccaccatga ccgacaccac cacccagcgc + 22201 gtcgccgtcg tcaccggcgc caccagcggc atcggcctgg cctccgcccg gctcctcggc + 22261 cggcagggcc accaagtctt catcggcgcc cgcaacgccg agaacgtcgc cgccaccgtc + 22321 aaggaactcc agggcgaggg catcgacgcg gacggcacgg tcgtcgacgt ccgcgacacc + 22381 gagtccgtca acgcctggat ccaggccgcc gtcgaccgct tcggcagcgt cgacgtcgtc + 22441 gtcaacaacg ccggccgctc cggcggcggc cccaccgccg acatcgcgga cgagctgtgg + 22501 gacgacgtga tcgacaccaa cctcaacagc gtcttccgcg tcacccgcgc cgccctgacc + 22561 atcggcggcc tgcgcgccaa ggaccgcggc cggatcatca acgtcgcctc caccgcgggc + 22621 aagcagggcg tcgtcctggg cgccccgtac tcggcgtcca agcacggcgt cgtcggcttc + 22681 accaaggcac tgggcaacga gctggccccc accggcatca ccgtcaacgc ggtctgcccc + 22741 ggctacgtcg agaccccgat ggcccagcgc gtgcgccagg gatacgccgc cgcctacgac + 22801 acctccgagg acgccatcct cgagaagttc caggcgaaga tccccctcgg ccgctactcc + 22861 acccccgagg aggtcgccgg cctcgtcggc tacctggcct ccgacaccgc cgcgtccatc + 22921 acctcgcagg ccctcaacgt ctgcggcggc ctcggcaact tctgacgcac ccggcacccg + 22981 acccctttcc cgaggagtga gcctcatgac cacacgtgag gtcgagcacg agatcacgat + 23041 cggcgcaccg gccgacgccg tctaccagct gctcgcggac gtgaccaact ggccgcgcat + 23101 cttcccgccc accatccacg tggaccgcac cgaggccgac ggcgaccacg aacgcatcca + 23161 catctgggcg accgccaacg gccaggccaa ggagtggacc tcgcaccgca cgctcgaccg + 23221 cgagaacctg accatcacct tccgccagga gatccccgcc gccccggtca agcacatggg + 23281 cggcacctgg atcatcgagc cgctcgccga cgaccggtcg cgggtgcggc tcctgcacga + 23341 ctacagcgcc atcggcgacg acccgcacga cctgctgtgg atcgagcagg ccgtggacaa + 23401 gaacagcacc tccgagctgg ccgccctgaa ggtcaacgtc gaggccgcgc acgccgccgc + 23461 cgaggagctg acgttctcct tcgccgacac cgtgcagatc gacggcgccg ccaaggacgt + 23521 cttcgacttc atcaacgagg cccagctgtg ggccgaacgg ctcccgcacg tcgccgtggt + 23581 gcgcctgagc gaggacaccc ccggcctgca ggagctggag atggacaccc gcgccaagga + 23641 cggctcggtg cacaccacca agtcctaccg ggtcgtcttc ccccaccaca 
agatcgccta + 23701 caagcaggtc accctgcccg cgctgatgac cctgcacacc ggcgaatgga ccttcaccga + 23761 gggcgacgag gcgaccaccg cctcctccca gcacaccgtc accctcaaca ccgccaacat + 23821 cgcccgcatc ctcggccagg aagccaccgt cgccgacgcc cgcgcctacg tccacacggc + 23881 cctgtccacc aacagccgcg ccaccctcgc ccacgccaag gcctacgccg agcagaagaa + 23941 gggctgaacc gtggcagcgg acgccctgac caccgacgtc gtcgtcgtcg gagccggccc + 24001 cgtcgggatg atgctcgccg gggaactggc ccacggcggc gtcggcgtgg tggtcgtgga + 24061 gaagcgacgc gctcccagca ccgagtcccg ggcctccacc ctgcacgccc gcacgatgga + 24121 gatcctcgac agccggagcc tgctgcccga gttcggcgac ccgccgaacg agccgcgcgg + 24181 ccacttcggg ggcatcccgc tggatctgac gctgccctcc tcccaccccg gccagtggaa + 24241 ggtgccgcag accaggaccg aggtgatcct gggggagtgg gcgctgtcac tgggcgccga + 24301 actgcagtgc aagcacgaac tgaccgcgct cgacgacagc ggcgacctgg tggaggccga + 24361 agccgccggc ccggacggac ggacgctgcg gctgcgctgc cgctacctgg tcgcctgcga + 24421 cggcgaggag agcaccgtac gccgcctgat cggcgccgac ttccccggca gggacgcgac + 24481 gcgggaactg ctgcgcgccg acgtcgccgg catcgacatc ccgggccggc gcttcgaacg + 24541 cctggagcac ggcctggcga tcgccgcccg ccgccccgac ggggtgaccc gggtgatggt + 24601 ccacgagttc ggctccgccg cgcgggcccg cccgcacggc gacgcctcct tcgaggagat + 24661 caccgcggtg tggaagcggg tcaccggcga ggacatcagc ggcggcaccc ccctgtgggc + 24721 caacgccttc ggcgacgcct cccgccagct gacccgctac cggcacggcc gcgtcctctt + 24781 cgcgggcgac gccgcccacc ggcagatgcc ggtcggcggc caggccctca acctcggcat + 24841 gcaggacgcc ttcaacctgg gctggaaact ggccctggtg gtacgcggca aggcaccgca + 24901 gaccctcctc gacagctacc acgacgaacg tcacgaggtc ggccggcagg tcctggccaa + 24961 catccgcgcc cagtcgctgc tgctgctcgg cggaccggag gtagagccgc tgcgcgacct + 25021 gctgacggag ttgatcgggc aggaggacgt acgccgtcgc ctggccggca tgatcagcgg + 25081 cctggacgtg cgctacgacg tcggcggccc cgcccacccg ctgctcgggg cccggctgcc + 25141 gtgcaccgag gtgcgggcac gccgacgcct gctcaccacc acccacctgg tgcgctcggg + 25201 cggcggcgtc ctgctggacc tgaccggccg gcccggccgg ccgccggcag tcctcgacgg + 25261 ctgggcggac cgcgtcaccg cactggacgc ccagccctcg ccgggcagtt 
cactgcaggg + 25321 caccgaccgt gtcctggtcc gccccgacgg ccacgtggcc tgggccggcc cgggcaccga + 25381 cggcctcgcc gaggcactca cccgctggtt cggacctccc cgctgacctg ccgtgcgccc + 25441 cggcccggcg gggacgaccg gcaccgcacg acgcgccgcc ccccaccgcc gggccccgaa + 25501 ccgaccccac tgccaggaag gaccacccat ggaagggaca gcggcggaca ccgacgtgat + 25561 cgtcgtcggt gccggcccga ccggactgat gctcgcgggc gaactgcgcc tgggcggggc + 25621 ccgtgtcgtc gtcatcgaga agctggccgc ccccaccggg cagtcccgcg gcctgggctt + 25681 caccgcccgc gccatggaga cgttcgacga acgcgggctg ctgccccggt tcggccaggg + 25741 agagaccctg gccaccagcc ccgtaggaca cttcggcggc gcccagttcg acttcaccgt + 25801 cctcgaggac gcccacttcg gggcccgggg catcccccag ggcgacaccg aggcggtcct + 25861 ggagggctgg gcgggcgaac tcggcgcgga catccggcgc ggctgggagt tcgtctccct + 25921 caccgacggc ttcctggacg gcgacggcgt cgagatcacc gtacgcaccc cgcagggcga + 25981 ggaacgcacc ctgcgcgcct cctacctggc gggctgcgac ggcggctcca gccgggtccg + 26041 cagggcggcc ggcttcgact tccccggaac cgacgccacc cagggcatgt acctggcgga + 26101 catcaccggt gtggagctga ccccgcgctt cctcggagag cgcctgaaca acggcatggt + 26161 gatggcggca ccgctctccc agggcgtgtg gcgcatcatc gtctgccccg acggccgccc + 26221 cgcgcacgac cgtgagcgga ccgtcacctt cgaggaggtc gccgccgcct ggcaggacat + 26281 caccggcgag gacatcagcc acggcggcgc gagctgggtc agctccttca ccaacgccac + 26341 ccggcaggcc tccgagtacc ggcgcggccg cgtcttcctg gcgggcgacg ccgcccacat + 26401 ccacctgccg gccggcggcc agggcctgag caccggcgtg caggacgccg ccaacctcgg + 26461 ctggaagctg gcctcggtga tccgcggcga cgccccccgg gaactgctgg acacctacca + 26521 cgccgaacgc cacccggtcg gcgcccggct gctgatgaac acccgcgccc agggcatcgt + 26581 cttcctcggc ggcgccgagt ccgacccact gcgcgagctg atggccgagc tggtccgcta + 26641 cgacgacgtc aaacgccacc tggccggcat cgtcagccac ctggacatcc gctacgacct + 26701 cgccgacacc gcgaccggcc ccacccaccc gctgctggga cgccggatgc cgccgcggct + 26761 gctcgtcggc gcggacggcg aaacccgcat cgcccgcctc ctgcacgccg ggcacggcgt + 26821 gctgctcgac ctcgccgacg acgagacggt acgcgcgacc gcggccggcc acgcggaccg + 26881 ggtggacgtg gtcaccgccg tcgccaagcc caccgacggc ccggacgccc 
tcgccggcgc + 26941 caccgccgtg ctgatccgcc ccgacggcta cgtcgcctgg acgggcacct gcgcgcaggg + 27001 cctggaaacg gccctggaac ggtggtgcgg cccgccccgc tgacccacac cccccccaac + 27061 ggcccccggc gtgcgcgcac gccgggggcc ttcgtccgcc gcccggcacc ccccgccgcc + 27121 cggcaccccc cgccgcccgg cgctccccgc gggcctgccc gccggcgccc ccgcccaccc + 27181 ggccgccgct gcccggccgc acacaccgga gggccccgcc gcgttccctc atcacgcgac + 27241 ggggccctcc ctccacggtg gtcacacggg gacggcctcc acgagggaga tcgccgccgc + 27301 cgtctccacg acccgctcca gacggaaccc ggcacgggcc aggagatcgg cgtactggcc + 27361 gggagtacgc tcacggccac cgaccaggag catcagccac aggtcgacca gcttcccgga + 27421 gtgcggctgg tcaccctgct ccggtatcac catctcggcg atcagcagct tgccgcccgg + 27481 cttgatcgcc gcccgcacgt tgcgcaggat ccgcagggcc tgctcctcgg gccagtcgtg + 27541 cacgatgtgc ttgaggacgt aggcgtcggc gccgcccggc ggcacgtcga acaggtcgcc + 27601 ggccacccgc ttcgtccggt cggccacacc ctgcgcggcc aggaactccg cagccccgtt + 27661 ctcctcgacc cgcgggtcga acagaacgcc ctcgcacccg ggcgccgcac ccaggatgcc + 27721 cgcgagcaac gcgccctggc cgccgcagaa gtccaccacc gtcccgaact gcgagaagtc + 27781 gtacgccgcc aggatcggct ccgtctccga ggcggacatg ctgcccatgc cctggaagaa + 27841 cacctggccg tactccgcgt tcttcgtcag gaactcgaag gcgtgcatac cgcgcagctt + 27901 cggcagcgcc ggctcgccgg tgaccaccgt ctccgggaag ccgctccagt cctcccagtg + 27961 gatcgggtgg cccatcagca gcgcgatgcc ccgcatcgac atcggatggt cggcgcgcag + 28021 cgcgtccgcc atcggcgtca gctcgaaggc accgtccggg cgcgtggcga acacaccgtt + 28081 gctcgccagc aggcgcagca cccggccgag cgcgtcggcg tccgcaccga cccgcccggc + 28141 gagctcgtcg gcggacagcg gaccctcggc gagcgcctcg gccaccttca gttcggcggc + 28201 gacgtgcacc gcacgcgtga ccatgacacc catgatcaat tccagcagag cgaacggcgg + 28261 aggcgcgagt tcccggctct gccgctgcag atccgctcgt gctttctccg cttcccgtac + 28321 gacgtgcgga ggcggcaatt cgggcatgag tttcctccat ggcaggagcg caaaagtctg + 28381 tcccaaccgc cggaagggac cgggactaca acgatatgga aaaaggtcga cgcctcctgg + 28441 agggagactc gaataccgct ggttcacggg tgcacccact ttttcctgcg gaaaatttga + 28501 cgcaataaaa ccggcgactg ccctagggtg gcgctgattt cgcatccgct 
ctccgggaaa + 28561 aggggggagc attggaaacc gaggagagaa atggcgaact cgcgtaactc ctggacgaag + 28621 atacttctgg cggcgggcgc ggccggcgcc gtcgccgtcc cgctgaccgc cggccccgtc + 28681 caggcccagc cccaggccca ccgccacggt cacacccaca cccgtaccga ggcgaccgtg + 28741 accgtcgtgg cctcccagct gaacaacccg cgcggcgtca ccgcgctggg cgacggcggc + 28801 gtgctggtcg ccgaggccgg cgccggactg gccgactgcc cggtcgacca gacgtgcgtg + 28861 ggcaccaccg gctccgtcta caaggtcaag ggcagcttcc agggccgcgt cgccaccggc + 28921 ctcgcctcca cggccaaggg cgtcgccccg ggcgccccga tctccgccaa cggccccagc + 28981 gacgtcgtgc ccgaccggtt cggcggctac gtcgtcgtca gcggcctcgg cggcaccacc + 29041 gagtcgcgcg ccgcgctggg cgagggcgcc cagaccctgg gcacggtctt ccgcacccgc + 29101 gaccacaagg tgctcgccga cctcaccgac cacgagacgc ggctgaaccc cgacggcggc + 29161 gacgtgcacg ccaacccgtg gcggctcgcg cgcagcggca gcggctacct ggccaccgac + 29221 gcgggcgcca acaccgtcgt acgcggcaac gccgacggca ccaccgccac cgagtacctc + 29281 ctgcccaaga acgaactgcc caccggcgcc gccgagaccg tacccaccgg catcgccaag + 29341 gccgccgacg gcaccgtgta cgtcgccgac atgagcggcg gccgggtcgg cgcctcccgc + 29401 gtctggaaga tcgccccggg ccggcagccc gagatcctcg ccaccggcat gaccaacctc + 29461 atcgacctgg acctggaccg ggacggcgac ctgatcgccc tgtcctacag cgccgccgcg + 29521 ctggccggcc cgccgcagcc gggcgccctg ttcgagatcg acgccgacag cggcgcggtc + 29581 accgagatcc ccaccggcga ccagctcaag cagcccaccg gcgtcgccgt cgacccctgc + 29641 ggcaaggtgt acgtcaccaa caacacgctc ggcaccaacg gccagctggt ccgcgtcaac + 29701 cgctgacccc cgcaggaggg tgcgccgcgc acacccccct gccaggcccc gccggtcccg + 29761 cacccctgcg accggcgggg cctcgctgtg cccggcgccg gacgcccgcg gccgatggga + 29821 atccgctcgg cggccgctcg acagccgacg gagggcgacg cccccgcaca gcccggctcg + 29881 gcatcctggc cgggcatcca cttgccggac aacacattcg acgctcaggg aggctgcccc + 29941 gtgacgcaag atgccatgac ctcggccgac gagacccgga ccggcgtgtg gctcgtcgga + 30001 gcccgcggtt cggtcgccac gacggcggtg tcgggctgcg cggcgctggc ggcaggactg + 30061 ctgccaccca ccggcatggt caccgagacg ccccccttcg ccgactgcgg cctgccggcc + 30121 ctggcctccc tcgtcttcgg cggccacgac acggcgacca cccccctgcc 
caaacgcgcc + 30181 gaggaactgg ccgcccaagg agtactgccg ccctggctgc cgaccgccgt ccagggggaa + 30241 ctggccgccg cggacgaaca catccgcccc ggaggaccgg tacccggcga ccgtcgcgcc + 30301 accgaagagc tgatagccga cttcgccacc gacctgcgca ccttcgcccg caccaccggc + 30361 gtcgcccgca cggtcgtcgt caacgtcgcc tccaccgaac cggaccccgc acacggcgcg + 30421 tggccggcca gctccctgta cgccgcggcg gccctgcggg cgggctgccc ctacgtcaac + 30481 ttcacgccgt cgaccgggct gagccacccc cagctggcgg gcgcggcccg cgcctcgggc + 30541 ctgccgtacg cgggccgcga cggcaagacc gggcagaccc tgctgcgttc ggtgctgggg + 30601 ccgatgttcg cccagcgggc actggcggta cgggcctggt ccggcacgaa cctgctgggc + 30661 ggcggcgacg gcgccgccct cgccgacccc gccgccgccg cggcgaagaa cgccggcaag + 30721 gaacgcgtcc tcaccgacac cctcggcacc cgggtcgaag gcgaagtgca catcgacgac + 30781 gtccccgccc tcggggactg gaagaccgcc tgggaccacg tcgccttcga cggcttcctc + 30841 ggcacccgca tggtcctgca gaccatctgg cagggctgcg actccgccct cgccgcaccg + 30901 ctcgtcctcg acctggcccg cctgctcgcc cgcgcccacg agcggggcct gtccggcccg + 30961 ctgggcgaac tcggcttcta cttcaaggac cccgacgccg aaggctccgc cctggccgag + 31021 cagtacaccc gactgctcac cctcgccgac cggctcggag gaaccaggtg agcgctcagc + 31081 ggcccgccca cggcccggcc cgcgacgggc acctccacgc ctgggccgaa ctgctgcgcg + 31141 cccccgccgc gctcaccgtc cccggtgacg tcctcgccgg caccgcggcc gccggcacac + 31201 ggcccaccgg acgcaccgcc ctcgcggccg gcgcctcact gtgcctgtac gaggcgggca + 31261 tggcactcaa cgactgggcg gaccgcgagg aggacgccac cgcccggccc caccgccccc + 31321 tgccgtccgg ccgcgtccgg cccggcgccg ccctcgccgc cgcgggcctc ctctccgccg + 31381 cgggcctggc cctcgccgca tgcgcgggac gacgggccct cgcggtcgcc ggccccctgg + 31441 ccgccaccgt atgggcctac gacctgggcc tgaaacacac cccggcggga cccgcggcga + 31501 tggccgccgc ccgctccctg gacctgctgc tgggcgcggc cgccggcccg ggcgccgtgc + 31561 gacgggcgat cgtcccggcg gcgttcctcg gcagccacac cctggccgtc tccctcgtct + 31621 cccgccgcga gaccgagggc ggctccagca ccgcccccct cacggccctc gccgccgcgg + 31681 gcgccctcac caccgtcctc gccggccgcc ccaccgccca ccccgcgccc gacgccagca + 31741 ccggcgcacc gacccccgcg acaccggccg acaaggccac ccgcgccgta 
cgcgccgccc + 31801 tggccgcttc ctacgccgcc accttcgccc gccccctggc ccacgccgcg ctcaacccct + 31861 ccccggaact gacacagcgg gccgtcggcg ccggcgtccg cgccacgatc gccctgcaga + 31921 gcggactgat ggcccgggcc ggcgcacccg gcaccggcgt cctcaccgcc gccctggcac + 31981 ccctcgccgc gcacctggcc cggaaagtga gcaccacatg agcccgctgc gcctcggcta + 32041 cggcaccaac gggctgaccg acctgcgcct ggaggacgcc ctgcgcctgc tggccgacct + 32101 cggctacgac ggcgtcggac tcaccctcga ccacatgcac ctcgacccgc tcgcccccga + 32161 cctcgcggcc cgcacccgcc acgtcgcccg gcaactgcac cgcctcggcc tcgcggtcac + 32221 cgtcgagacc ggcgcccgct acgtcctcga cccgcgccgc aagcacggac ccagcctgct + 32281 cgacgacgac ccggacgccc gctgggcacg cgtacgcctg ctgatccgct cggtacgcgt + 32341 cgccgccgac ctcggcgcgc acgccgtgca ctgcttcagc ggcccacggc ccgcgggcct + 32401 ggaccaggac accgcctgga aacgcctggc cgacgccctc ggccccgtcc tggacgccgc + 32461 ggaggacacc ggcgtccccc tggcggtcga acccgagccc ggccacctgc tggccacact + 32521 gaccgacttc caccgcctgc gcaccgaact gggcgacccc gaaccactgg gactgaccct + 32581 cgacatcggg cactgccagt gcctggagcc cctgccgccc gccgactgcg tacgggccgc + 32641 cgcgccctgg ctgcggcacg tgcagatcga ggacatgcgc cgcggcgtcc acgaacacct + 32701 ccccttcggg gacggcgaga tcgacttccc gcccgtactc gacgccctcg ccgccaccgg + 32761 ctaccagggc ctgaccgtcg tcgaactgcc ccggcactcc cacgccggac ccgaactggc + 32821 cgcacagtcg atgcggttcc tgcgcaacgg agggacgaga tgaccgtcgt acacaccccg + 32881 ccggacgcgg acctgcccgg cgagttcgcc ggcctcggca ccgacgcacg ccgctggctc + 32941 accgccgccc gcgcctcggc aaccgcccgg gacaccgact gggaactgcg cttcgccgag + 33001 gcgggccgcc gctgcggcac cgaacacgcc gacgccgccc gcgtactgct gctcacggcg + 33061 gcacgccccg acgcggagac cgtgaccctg ctgtaccacc gggggacagc cgccgaacgg + 33121 cgtgcggtcc tgctcgccct ggacggactc gacaccgaac ccgcccacgc cctgccgctg + 33181 gtcgaagacg ccctgcgcgc caacgacacc accctgctcg ccgccgccct cggcccctac + 33241 gcggcccggc acctggacgc ccaccaatgg cggcacgccg tactcaagtg cctgttcacc + 33301 ggcgtgcccg tggccaccgt ggcaaacctg gcggcccgcg cccgcgcaga cgcggaactg + 33361 gccagaatgc tgcgcgccta cgccgccgag cgcaccgccg cccaccgaga 
catcccggcc + 33421 gacctcgacc gcgtgctcgc cctgacccag gagcagtgac ttgcgcatct tcgaccccca + 33481 catccacatg acgtcccgga ccaccgacga ctacgaagcc atgcatgccg cgggtgtccg + 33541 tgccgtggtc gagcccgcct tctggctggg gcagccccgc acttctccgg cctccttccg + 33601 tgactacttc gacgcgttgc tgggctggga gcccttccgt gcggcgcagt acgggatcgc + 33661 ccatcactgc acgatcgcgt tgaacccgaa ggaggcg +// diff --git a/tests/unit/data/bigscape/minimal_dataset/JK1_GCF_01/JCM_4529.region35.gbk b/tests/unit/data/bigscape/minimal_dataset/JK1_GCF_01/JCM_4529.region35.gbk new file mode 100755 index 000000000..8e7c3b14b --- /dev/null +++ b/tests/unit/data/bigscape/minimal_dataset/JK1_GCF_01/JCM_4529.region35.gbk @@ -0,0 +1,1627 @@ +LOCUS NZ_BMUN01000045 30675 bp DNA linear CON 19-APR-2022 +DEFINITION Streptomyces vinaceusdrappus strain JCM 4529 sequence45, whole + genome shotgun sequence. +ACCESSION NZ_BMUN01000045 +VERSION NZ_BMUN01000045 +KEYWORDS . +SOURCE Streptomyces vinaceusdrappus + ORGANISM Streptomyces vinaceusdrappus + Bacteria; Actinobacteria; Streptomycetales; Streptomycetaceae; + Streptomyces; Streptomyces rochei group. +COMMENT REFSEQ INFORMATION: The reference sequence is identical to + BMUN01000045.1. + The annotation was added by the NCBI Prokaryotic Genome Annotation + Pipeline (PGAP). Information about PGAP can be found here: + https://www.ncbi.nlm.nih.gov/genome/annotation_prok/ + ##antiSMASH-Data-START## + Version :: 6.1.1 + Run date :: 2023-02-07 14:34:49 + Original ID :: NZ_BMUN01000045.1 + NOTE: This is a single cluster extracted from a larger record! + Orig. start :: 0 + Orig. end :: 30675 + ##antiSMASH-Data-END## +FEATURES Location/Qualifiers + gene complement(<1..260) + /locus_tag="IE238_RS36835" + CDS complement(<1..260) + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_011031019.1" + /locus_tag="IE238_RS36835" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /product="alkaline phosphatase family protein" + /protein_id="WP_193517002.1" + /transl_table=11 + /translation="MTPTTSSGGPVPLLVLDVVGLTPRLLDHMPHLKRLGQSGSRAPLG + TVLPAVTCAAQSTFLTGTYPSEHGIVGNGWYFRELGDVLLWR" + source 1..30675 + /culture_collection="JCM:4529" + /db_xref="taxon:67376" + /mol_type="genomic DNA" + /organism="Streptomyces vinaceusdrappus" + /strain="JCM 4529" + /submitter_seqid="sequence45" + /type_material="type strain of Streptomyces + vinaceusdrappus" + protocluster 1..30675 + /aStool="rule-based-clusters" + /category="PKS" + /contig_edge="True" + /core_location="[13949:29716]" + /cutoff="20000" + /detection_rule="(t2ks and t2clf)" + /neighbourhood="35000" + /product="T2PKS" + /protocluster_number="1" + /tool="antismash" + proto_core 13950..29716 + /aStool="rule-based-clusters" + /tool="antismash" + /cutoff="20000" + /detection_rule="(t2ks and t2clf)" + /neighbourhood="35000" + /product="T2PKS" + /protocluster_number="1" + cand_cluster 1..30675 + /candidate_cluster_number="1" + /contig_edge="True" + /detection_rules="(t2ks and t2clf)" + /kind="single" + /product="T2PKS" + /protoclusters="1" + /tool="antismash" + region 1..30675 + /candidate_cluster_numbers="1" + /contig_edge="True" + /product="T2PKS" + /region_number="1" + /rules="(t2ks and t2clf)" + /tool="antismash" + gene complement(257..1432) + /gene="eboE" + /locus_tag="IE238_RS36840" + /old_locus_tag="GCM10010308_74000" + CDS complement(257..1432) + /codon_start=1 + /gene="eboE" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_003994192.1" + /locus_tag="IE238_RS36840" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010308_74000" + /product="metabolite traffic protein EboE" + /protein_id="WP_193517003.1" + /transl_table=11 + /translation="MRFRHPDGSTVHLAYCTNVHPAETLDGVLAQLRDHCEPVRRRLGR + DRLGIGLWLAKDAAHALATDPSALRGLRTELDRRGLEVVTLNGFPYQGFGAEEVKYRVY + KPDWAHPERLEHTTALARVLAGLLPDDVSEGSVSTLPLAWRTAWDETRADKARTALATL + GERLDTLHELTGRSIRIGLEPEPGCIVETTRDAIAPLGAIGHDRIGVCVDTCHLATSFE + DPEEALDALEAAGIRIVKSQLSAALHAEHPSRLEVRDALAAFAEPRFLHQTRTTTATGG + LRGTDDLDEALAAGGPLPDSAPWRAHFHVPLHADPAAPLTSTLPVLKSALSRLVGGARP + LTRHLEVETYTWQALPAQLRPRGRAQLTDGIAAELMLARDLLTDLGLKELP" + gene complement(1436..2311) + /locus_tag="IE238_RS36845" + /old_locus_tag="GCM10010308_74010" + CDS complement(1436..2311) + /GO_function="GO:0016788 - hydrolase activity, acting on + ester bonds [Evidence IEA]" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_004980911.1" + /locus_tag="IE238_RS36845" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010308_74010" + /product="TatD family hydrolase" + /protein_id="WP_127438561.1" + /transl_table=11 + /translation="MRIFDPHIHMTSRTTDDYEAMYAAGVRAVVEPAFWLGQPRTSAAS + FCDYFDALLGWEPFRAAQYGIAHHCTIALNPKEANDPRCTPVLAELPRYLVKDRVVAVG + EIGYDSMTPAEDTALAAQLQLAADHGLPALVHTPHRDKLAGLRRTLDVVRESALPTDRV + LVDHLNETTVKEAKDSGAWLGFSVYPDTKMDEARMVALLREYGPEKVLVNSAADWGRSD + PLKTRKVGDLMLEEGFGEDDVDRVLWRNPVAFYGLSGRLDLDVTATAPTHEGNSVLRGA + PAAEPLPTGA" + gene complement(2313..2912) + /locus_tag="IE238_RS36850" + /old_locus_tag="GCM10010308_74020" + CDS complement(2313..2912) + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019890542.1" + /locus_tag="IE238_RS36850" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010308_74020" + /product="EboA domain-containing protein" + /protein_id="WP_127438562.1" + /transl_table=11 + /translation="MTVVHTPPDADLPGEFAGLGTDARRWLTAARASATARDTDWELRF + AEAGRRCGTEHADAARVLLLAAARPDAETVTLLYHRGTAAERRAVLLALDGLDTEPAHA + LPLVEDALRANDTTLLAAALGPYAARHLDAHQWRHAVLKCLFTGVPVATVANLAARARA + DAELARMLRAYAAERTAAHRDIPADLDRVLALTQEQ" + gene complement(2909..3754) + /locus_tag="IE238_RS36855" + /old_locus_tag="GCM10010308_74030" + CDS complement(2909..3754) + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330932.1" + /locus_tag="IE238_RS36855" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010308_74030" + /product="sugar phosphate isomerase/epimerase" + /protein_id="WP_193517004.1" + /transl_table=11 + /translation="MSPLRLGYGTNGLTDLRLEDALRLLADLGYDGVGLTLDHMHLDPL + APDLAARTRHVARQLHRLGLAVTVETGARYVLDPRRKHGPSLLDDDPDARWARIRLLIR + SVRVAADLGAHAVHCFSGPRPAGLDQDTAWKRLADALGPVLDAAEDTGVPLAVEPEPGH + LLATLTDFHRLRTELGDPEPLGLTLDIGHCQCLEPLPPADCVRAAAPWLRHVQIEDMRR + GVHEHLPFGDGEIDFPPVLDALAATGYQGLTVVELPRHSHAGPELAAQSMRFLRNGGTR + " + gene complement(3751..4707) + /locus_tag="IE238_RS36860" + /old_locus_tag="GCM10010308_74040" + CDS complement(3751..4707) + /GO_component="GO:0016021 - integral component of membrane + [Evidence IEA]" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330933.1" + /locus_tag="IE238_RS36860" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010308_74040" + /product="UbiA family prenyltransferase" + /protein_id="WP_193517005.1" + /transl_table=11 + /translation="MSAQRPAHGPARDGHLHAWAELLRAPAALTVPGDVLAGTAAAGTR + PTGRTALAAGASLCLYEAGMALNDWADREEDATARPHRPLPSGRVRPGAALAAAGLLSA + AGLALAACAGRRALAVAGPLAATVWAYDLGLKHTPAGPAAMAAARSLDLLLGAAAGPGA + VRRAIVPAAFLGSHTLAVSLVSRRETEGGSSTAPLTALAAAGALTTVLAGRPTAHPAPD + ASTGAPTPATPPADKATRAVRAALAASYAATFARPLAHAALNPSPELTQRAVGAGVRAT + IALQSGLMARAGAPGTGVLTAALAPLAAHLARKVSTT" + gene complement(4704..5819) + /locus_tag="IE238_RS36865" + /old_locus_tag="GCM10010308_74050" + CDS complement(4704..5819) + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_003962403.1" + /locus_tag="IE238_RS36865" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010308_74050" + /product="inositol-3-phosphate synthase" + /protein_id="WP_127437809.1" + /transl_table=11 + /translation="MTSADETRTGVWLVGARGSVATTAVSGCAALAAGLLPPTGMVTET + PPFADCGLPALASLVFGGHDTATTPLPKRAEELAAQGVLPPWLPTAVQGELAAADEHIR + PGGPVPGDRRATEELIADFATDLRTFARTTGVARTVVVNVASTEPDPAHGAWPASSLYA + AAALRAGCPYVNFTPSTGLSHPQLAGAARASGLPYAGRDGKTGQTLLRSVLGPMFAQRA + LAVRAWSGTNLLGGGDGAALADPAAAAAKNAGKERVLTDTLGTRVEGEVHIDDVPALGD + WKTAWDHVAFDGFLGTRMVLQTIWQGCDSALAAPLVLDLARLLARAHERGLSGPLGELG + FYFKDPDAEGSALAEQYTRLLTLADRLGGTR" + gene complement(6069..7184) + /locus_tag="IE238_RS36870" + /old_locus_tag="GCM10010308_74060" + CDS complement(6069..7184) + /codon_start=1 + /inference="COORDINATES: protein motif:HMM:NF033206.1" + /locus_tag="IE238_RS36870" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010308_74060" + /product="ScyD/ScyE family protein" + /protein_id="WP_193450429.1" + /transl_table=11 + /translation="MANSRNSWTKILLAAGAAGAVAVPLTAGPVQAQPQAHRHGHTHTR + TEATVTVVASQLNNPRGVTALGDGGVLVAEAGAGLADCPVDQTCVGTTGSVYKVKGSFQ + GRVATGLASTAKGVAPGAPISANGPSDVVPDRFGGYVVVSGLGGTTESRAALGEGAQTL + GTVFRTRDHKVLADLTDHETRLNPDGGDVHANPWRLARSGSGYLATDAGANTVVRGNAD + GTTATEYLLPKNELPTGAAETVPTGIAKAADGTVYVADMSGGRVGASRVWKIAPGRQPE + ILATGMTNLIDLDLDRDGDLIALSYSAAALAGPPQPGALFEIDADSGAVTEIPTGDQLK + QPTGVAVDPCGKVYVTNNTLGTNGQLVRVNR" + gene 7551..8513 + /locus_tag="IE238_RS36875" + /old_locus_tag="GCM10010308_74070" + CDS 7551..8513 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330937.1" + /locus_tag="IE238_RS36875" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010308_74070" + /product="acetylserotonin O-methyltransferase" + /protein_id="WP_234311021.1" + /transl_table=11 + /translation="MVTRAVHVAAELKVAEALAEGPLSADELAGRVGADADALGRVLRL + LASNGVFATRPDGAFELTPMADALRADHPMSMRGIALLMGHPIHWEDWSGFPETVVTGE + PALPKLRGMHAFEFLTKNAEYGQVFFQGMGSMSASETEPILAAYDFSQFGTVVDFCGGQ + GALLAGILGAAPGCEGVLFDPRVEENGAAEFLAAQGVADRTKRVAGDLFDVPPGGADAY + VLKHIVHDWPEEQALRILRNVRAAIKPGGKLLIAEMVIPEQGDQPHSGKLVDLWLMLLV + GGRERTPGQYADLLARAGFRLERVVETAAAISLVEAVPV" + gene complement(8732..10246) + /locus_tag="IE238_RS36880" + /old_locus_tag="GCM10010308_74080" + CDS complement(8732..10246) + /GO_function="GO:0071949 - FAD binding [Evidence IEA]" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330938.1" + /locus_tag="IE238_RS36880" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010308_74080" + /product="FAD-dependent monooxygenase" + /protein_id="WP_193517006.1" + /transl_table=11 + /translation="MEGTAADTDVIVVGAGPTGLMLAGELRLGGARVVVIEKLAAPTGQ + SRGLGFTARAMETFDERGLLPRFGQGETLATSPVGHFGGAQFDFTVLEDAHFGARGIPQ + GDTEAVLEGWAGELGADIRRGWEFVSLTDGFLDGDGVEITVRTPQGEERTLRASYLAGC + DGGSSRVRRAAGFDFPGTDATQGMYLADITGVELTPRFLGERLNNGMVMAAPLSQGVWR + IIVCPDGRPAHDRERTVTFEEVAAAWQDITGEDISHGGASWVSSFTNATRQASEYRRGR + VFLAGDAAHIHLPAGGQGLSTGVQDAANLGWKLASVIRGDAPRELLDTYHAERHPVGAR + LLMNTRAQGIVFLGGAESDPLRELMAELVRYDDVKRHLAGIVSHLDIRYDLAGTASGPT + HPLLGRRMPPRLLVGADGETRIARLLHAGHGVLLDLADDETVRATAAGHADRVDVVTAV + AKPTDGPDALAGATAVLIRPDGYVAWTGTCAQGLETALERWFGPPR" + gene complement(10349..11824) + /locus_tag="IE238_RS36885" + /old_locus_tag="GCM10010308_74090" + CDS complement(10349..11824) + /GO_function="GO:0071949 - FAD binding [Evidence IEA]" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330939.1" + /locus_tag="IE238_RS36885" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010308_74090" + /product="FAD-dependent monooxygenase" + /protein_id="WP_127443921.1" + /transl_table=11 + /translation="MAADALTTDVVVVGAGPVGMMLAGELAHGGVGVVVVEKRRAPSTE + SRASTLHARTMEILDSRSLLPEFGDPPNEPRGHFGGIPLDLTLPSSHPGQWKVPQTRTE + VILGEWALSLGAELQCKHELTALDDSGDLVEAEAAGPDGRTLRLRCRYLVACDGEESTV + RRLIGADFPGRDATRELLRADVAGIDIPGRRFERLEHGLAIAARRPDGVTRVMVHEFGS + AARARPHGDASFEEITAVWKRVTGEDISGGTPLWANAFGDASRQLTRYRHGRVLFAGDA + AHRQMPVGGQALNLGMQDAFNLGWKLALVVRGKAPQTLLDSYHDERHEVGRQVLANIRA + QSLLLLGGPEVEPLRDLLTELIGQEDVRRRLAGMISGLDVRYDVGGPAHPLLGARLPCT + EVRARRRLLTTTHLVRSGGGVLLDLTGRPGRPPAVLDGWADRVTALDAQPLPGSSLQGT + DRVLVRPDGHVAWAGPGTDGLAEALTRWFGPPR" + gene complement(11828..12772) + /locus_tag="IE238_RS36890" + /old_locus_tag="GCM10010308_74100" + CDS complement(11828..12772) + /NRPS_PKS="Domain: Polyketide_cyc2 (4-146). E-value: + 2.7e-16. Score: 52.1. 
Matches aSDomain: + nrpspksdomains_IE238_RS36890_Polyketide_cyc2.1" + /NRPS_PKS="Domain: Polyketide_cyc2 (157-310). E-value: + 2.1e-08. Score: 26.5. Matches aSDomain: + nrpspksdomains_IE238_RS36890_Polyketide_cyc2.2" + /NRPS_PKS="type: other" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330940.1" + /locus_tag="IE238_RS36890" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010308_74100" + /product="aromatase/cyclase" + /protein_id="WP_193517007.1" + /transl_table=11 + /translation="MTTREVEHEITIGAPADAVYQLLADVTNWPRIFPPTIHVDRTEAD + GDHERIHIWATANGQAKEWTSRRTLDRENLTITFRQEIPAAPVKHMGGTWIIEPLADDR + SRVRLLHDYSAIGDDPHDLLWIEQAVDKNSTSELAALKVNVEAAHAAATEELTFSFADT + VQIDGAAKDVFDFINEAQLWAERLPHVAVVRLSEDTPGLQELEMDTRAKDGSVHTTKSY + RVVFPHHKIAYKQVTLPALMTLHTGEWTFTEGDEATTASSQHTVTLNTANIARILGQDA + TVADARAYVHTALSTNSRATLAHAKAYAEQKKG" + aSDomain complement(11843..12301) + /aSDomain="Polyketide_cyc" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE238_RS36890_Polyketide_cyc2.2" + /domain_subtype="Polyketide_cyc2" + /evalue="2.10E-08" + /label="IE238_RS36890_Polyketide_cyc2.2" + /locus_tag="IE238_RS36890" + /protein_end="310" + /protein_start="157" + /score="26.5" + /tool="antismash" + /translation="FSFADTVQIDGAAKDVFDFINEAQLWAERLPHVAVVRLSEDTPGL + QELEMDTRAKDGSVHTTKSYRVVFPHHKIAYKQVTLPALMTLHTGEWTFTEGDEATTAS + SQHTVTLNTANIARILGQDATVADARAYVHTALSTNSRATLAHAKAYAE" + aSModule 11843..12760 + /domains="nrpspksdomains_IE238_RS36890_Polyketide_cyc2.1" + /domains="nrpspksdomains_IE238_RS36890_Polyketide_cyc2.2" + /incomplete + /locus_tags="IE238_RS36890" + /tool="antismash" + /type="unknown" + aSDomain complement(12335..12760) + /aSDomain="Polyketide_cyc" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE238_RS36890_Polyketide_cyc2.1" + 
/domain_subtype="Polyketide_cyc2" + /evalue="2.70E-16" + /label="IE238_RS36890_Polyketide_cyc2.1" + /locus_tag="IE238_RS36890" + /protein_end="146" + /protein_start="4" + /score="52.1" + /tool="antismash" + /translation="EVEHEITIGAPADAVYQLLADVTNWPRIFPPTIHVDRTEADGDHE + RIHIWATANGQAKEWTSRRTLDRENLTITFRQEIPAAPVKHMGGTWIIEPLADDRSRVR + LLHDYSAIGDDPHDLLWIEQAVDKNSTSELAALKVNVE" + gene complement(12813..13601) + /gene="fabG" + /locus_tag="IE238_RS36895" + /old_locus_tag="GCM10010308_74110" + CDS complement(12813..13601) + /EC_number="1.1.1.100" + /GO_function="GO:0016491 - oxidoreductase activity + [Evidence IEA]" + /NRPS_PKS="Domain: PKS_KR (8-164). E-value: 7.1e-11. Score: + 34.2. Matches aSDomain: + nrpspksdomains_IE238_RS36895_PKS_KR.1" + /NRPS_PKS="type: other" + /codon_start=1 + /gene="fabG" + /gene_functions="biosynthetic-additional + (rule-based-clusters) adh_short" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330941.1" + /locus_tag="IE238_RS36895" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010308_74110" + /product="3-oxoacyl-ACP reductase FabG" + /protein_id="WP_030970829.1" + /sec_met_domain="adh_short (E-value: 5.9e-36, bitscore: + 115.1, seeds: 230, tool: rule-based-clusters)" + /transl_table=11 + /translation="MTDTTTQRVAVVTGATSGIGLASARLLGRQGHQVFIGARNAENVA + ATVKELQGEGIDADGTVVDVRDTESVNAWIQAAVDRFGSVDVVVNNAGRSGGGPTADIA + DELWDDVIDTNLNSVFRVTRAALTIGGLRAKDRGRIINVASTAGKQGVVLGAPYSASKH + GVVGFTKALGNELAPTGITVNAVCPGYVETPMAQRVRQGYAAAYDTSEDAILEKFQAKI + PLGRYSTPEEVAGLVGYLASDTAASITSQALNVCGGLGNF" + aSDomain complement(13110..13577) + /aSDomain="PKS_KR" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE238_RS36895_PKS_KR.1" + /evalue="7.10E-11" + /label="IE238_RS36895_PKS_KR.1" + /locus_tag="IE238_RS36895" + /protein_end="164" + /protein_start="8" + /score="34.2" + /tool="antismash" + /translation="VAVVTGATSGIGLASARLLGRQGHQVFIGARNAENVAATVKELQG + EGIDADGTVVDVRDTESVNAWIQAAVDRFGSVDVVVNNAGRSGGGPTADIADELWDDVI + DTNLNSVFRVTRAALTIGGLRAKDRGRIINVASTAGKQGVVLGAPYSASKHG" + CDS_motif complement(13509..13571) + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_IE238_RS36895_0001" + /evalue="6.00E-05" + /label="PKSI-KR_m1" + /locus_tag="IE238_RS36895" + /protein_end="31" + /protein_start="10" + /score="15.7" + /tool="antismash" + /translation="VVTGATSGIGLASARLLGRQG" + gene complement(13614..13883) + /locus_tag="IE238_RS36900" + /old_locus_tag="GCM10010308_74120" + CDS complement(13614..13883) + /NRPS_PKS="Domain: ACP (12-83). E-value: 9.1e-13. Score: + 40.2. 
Matches aSDomain: nrpspksdomains_IE238_RS36900_ACP.1" + /NRPS_PKS="type: other" + /codon_start=1 + /gene_functions="biosynthetic-additional + (rule-based-clusters) PP-binding" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_015037163.1" + /locus_tag="IE238_RS36900" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010308_74120" + /product="acyl carrier protein" + /protein_id="WP_019330942.1" + /sec_met_domain="PP-binding (E-value: 1.5e-08, bitscore: + 26.1, seeds: 164, tool: rule-based-clusters)" + /transl_table=11 + /translation="MASKSFTLDDLKRTLREAAGVAEGVDLDGDILDTEFEVIGYESLA + LLEAGSLIEREYGISLDEEAVGEANTPRSFIEVVNAQLAPAKAA" + aSDomain complement(13635..13847) + /aSDomain="ACP" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE238_RS36900_ACP.1" + /evalue="9.10E-13" + /label="IE238_RS36900_ACP.1" + /locus_tag="IE238_RS36900" + /protein_end="83" + /protein_start="12" + /score="40.2" + /tool="antismash" + /translation="RTLREAAGVAEGVDLDGDILDTEFEVIGYESLALLEAGSLIEREY + GISLDEEAVGEANTPRSFIEVVNAQL" + gene complement(13950..15161) + /locus_tag="IE238_RS36905" + /old_locus_tag="GCM10010308_74130" + CDS complement(13950..15161) + /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (48-401). E-value: + 9.4e-31. Score: 98.9. Matches aSDomain: + nrpspksdomains_IE238_RS36905_PKS_KS.1" + /NRPS_PKS="type: PKS/NRPS-like protein" + /codon_start=1 + /gene_functions="biosynthetic (rule-based-clusters) T2PKS: + t2clf" + /gene_kind="biosynthetic" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330943.1" + /locus_tag="IE238_RS36905" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010308_74130" + /product="ketosynthase chain-length factor" + /protein_id="WP_030970827.1" + /sec_met_domain="t2clf (E-value: 1.8e-209, bitscore: 686.3, + seeds: 26, tool: rule-based-clusters)" + /transl_table=11 + /translation="MTASVVVTGLGVVSPNGMGVKDYWAATLGGKHGIGRITRFDPTGY + PARLAGQIEDFDAEELLPSRLLPQTDRVTRLALVAADWALADAGADPAHLPEFDMGVIT + ASAAGGFEFGQGELQALWSQGSQYVSAYQSFAWFYAVNSGQISIRNGMKGPSGVVVSEG + AGGLDAVAQARRQIRRGTPLIVTGGVDASICPWGWVAQLACGRLTTSDEPDHAYLPFDR + DANGYVPGEGGAILIAEDADAARARGVRPYGEIAGYGATIDPRPGSGREPNLAKAIETA + LADADVNAADIDVVFADGAGDPAGDLAEARAVSTVFGDRGVPVTVPKTMTGRLYSGGAP + LDLAAAFLALRDGVIPPTVHIDPCADYPLDLVLGEPRPAELRTALVLARGAGGFNSAMV + VRAA" + aSDomain complement(13959..15017) + /aSDomain="PKS_KS" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE238_RS36905_PKS_KS.1" + /domain_subtype="Iterative-KS" + /evalue="9.40E-31" + /label="IE238_RS36905_PKS_KS.1" + /locus_tag="IE238_RS36905" + /protein_end="401" + /protein_start="48" + /score="98.9" + /tool="antismash" + /translation="LAGQIEDFDAEELLPSRLLPQTDRVTRLALVAADWALADAGADPA + HLPEFDMGVITASAAGGFEFGQGELQALWSQGSQYVSAYQSFAWFYAVNSGQISIRNGM + KGPSGVVVSEGAGGLDAVAQARRQIRRGTPLIVTGGVDASICPWGWVAQLACGRLTTSD + EPDHAYLPFDRDANGYVPGEGGAILIAEDADAARARGVRPYGEIAGYGATIDPRPGSGR + EPNLAKAIETALADADVNAADIDVVFADGAGDPAGDLAEARAVSTVFGDRGVPVTVPKT + MTGRLYSGGAPLDLAAAFLALRDGVIPPTVHIDPCADYPLDLVLGEPRPAELRTALVLA + RGAGGFNSAMVVR" + CDS_motif complement(14466..14504) + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_IE238_RS36905_0002" + /evalue="1.20E-04" + /label="PKSI-KS_m4" + /locus_tag="IE238_RS36905" + /protein_end="232" + /protein_start="219" + /score="15.0" + /tool="antismash" + /translation="FDRDANGYVPGEG" + CDS_motif complement(14673..14696) + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_IE238_RS36905_0001" + /evalue="9.90E+01" + 
/label="PKSI-KS_m4" + /locus_tag="IE238_RS36905" + /protein_end="163" + /protein_start="155" + /score="-2.9" + /tool="antismash" + /translation="SGVVVSEG" + gene complement(15158..16429) + /locus_tag="IE238_RS36910" + /old_locus_tag="GCM10010308_74140" + CDS complement(15158..16429) + /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (5-395). E-value: + 3.7e-53. Score: 172.7. Matches aSDomain: + nrpspksdomains_IE238_RS36910_PKS_KS.1" + /NRPS_PKS="type: PKS/NRPS-like protein" + /codon_start=1 + /gene_functions="biosynthetic (rule-based-clusters) T2PKS: + t2ks" + /gene_kind="biosynthetic" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_007385254.1" + /locus_tag="IE238_RS36910" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010308_74140" + /product="beta-ketoacyl-[acyl-carrier-protein] synthase + family protein" + /protein_id="WP_029394634.1" + /sec_met_domain="t2ks (E-value: 2.1e-248, bitscore: 815.1, + seeds: 25, tool: rule-based-clusters)" + /transl_table=11 + /translation="MSGRRVVITGIEVIAPGGVGRENFWNLLSNGRTATRGITFFDPAP + FRSRVAAEADFDPYEHGLTPQEVRRLDRAAQFAVVASRGAVADSGLDIPSLDPHRVGVT + VGSAVGATMGLDQEYRVVSDGGRLDTVDHTYAVPHLYDYMVPSSFAAEVAWAVGAEGPS + TVVSTGCTSGIDSVGYAVELVREGSADVVIAGSSDAPISPITMACFDAIKATTPRHDEP + ECASRPFDKTRNGFVLGEGTAFFVLEELDSARKRGAHIYAEIAGYATRSNAYHMTGLRP + DGVEMAEAIDLALGEARLNPQSIDYINAHGSGTKQNDRHETAAFKRSLGDHAYRTPVSS + IKSMVGHSLGAIGSIEIAASALAMEYDVVPPTANLHTPDPECDLDYVPLVARDQLIDAV + LTVGSGFGGFQSAMVLATPERSLV" + aSDomain complement(15245..16414) + /aSDomain="PKS_KS" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE238_RS36910_PKS_KS.1" + /domain_subtype="Iterative-KS" + /evalue="3.70E-53" + /label="IE238_RS36910_PKS_KS.1" + /locus_tag="IE238_RS36910" + /protein_end="395" + /protein_start="5" + /score="172.7" + /tool="antismash" + /translation="VVITGIEVIAPGGVGRENFWNLLSNGRTATRGITFFDPAPFRSRV + 
AAEADFDPYEHGLTPQEVRRLDRAAQFAVVASRGAVADSGLDIPSLDPHRVGVTVGSAV + GATMGLDQEYRVVSDGGRLDTVDHTYAVPHLYDYMVPSSFAAEVAWAVGAEGPSTVVST + GCTSGIDSVGYAVELVREGSADVVIAGSSDAPISPITMACFDAIKATTPRHDEPECASR + PFDKTRNGFVLGEGTAFFVLEELDSARKRGAHIYAEIAGYATRSNAYHMTGLRPDGVEM + AEAIDLALGEARLNPQSIDYINAHGSGTKQNDRHETAAFKRSLGDHAYRTPVSSIKSMV + GHSLGAIGSIEIAASALAMEYDVVPPTANLHTPDPECDLDYVPLVARDQL" + gene complement(16426..16755) + /locus_tag="IE238_RS36915" + /old_locus_tag="GCM10010308_74150" + CDS complement(16426..16755) + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019767153.1" + /locus_tag="IE238_RS36915" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010308_74150" + /product="TcmI family type II polyketide cyclase" + /protein_id="WP_019330945.1" + /transl_table=11 + /translation="MHSTLIVARMAATSSNDVAQLFADFDATEMPHRMGTRRRQLFSYR + GLYFHLQDFDEDNGGELIEAAKADPRFVRISEDLKPFIEAYDPTTWRSPADAMATRFYS + WEASR" + gene complement(17013..17711) + /locus_tag="IE238_RS36920" + /old_locus_tag="GCM10010308_74160" + CDS complement(17013..17711) + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330946.1" + /locus_tag="IE238_RS36920" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010308_74160" + /product="antibiotic biosynthesis monooxygenase" + /protein_id="WP_193517008.1" + /transl_table=11 + /translation="MPIISAEDKHLTVLNLFTTDTPEKQAKLIEEMTKIVNAAAYEGWM + SSTVHSGVDGYGTLNFIQWRSGEDLEKRYAGEEFKHRTLPVFGEITTSIRLMQNEVAHT + LTSDALGGKIEIGPDRDDYTVFTLFPVTPEGQDEAVDALGPGQAFLADVPGFRAHVVLR + GLRARGLEGSFVISYSQWDSKEAFEVYRDQAPEEQADARKAAVARVRAVVTGEPYLNTY + RVVHTRSAGE" + gene complement(17768..19186) + /locus_tag="IE238_RS36925" + /old_locus_tag="GCM10010308_74170" + CDS complement(17768..19186) + /GO_function="GO:0071949 - FAD binding [Evidence IEA]" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_004948222.1" + /locus_tag="IE238_RS36925" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010308_74170" + /product="FAD-dependent monooxygenase" + /protein_id="WP_233535396.1" + /transl_table=11 + /translation="MLAGELRLAGVSVVVLDKLSEPIQESRALGFSARTIEEFAQRGLM + DRFGEVGVIPVGHFGGVPLDYRVIEGGSYGARGIPQARTEGVLGGWARELGADIRRGCE + VTGIEQTDASVTVTAAGADGPFSLRARHVVGCDGARSIVRKLAGIGFPGTEPAIELRFA + DLAGVALRPRFSGERVAGGMVMVIPMGPDRCRVIYFDSSEPLRTSPDPITFDEVAQTWQ + RLTGEDVSGATPLWVSSTTDVSRQADRYRHGRVFLAGDAAHIHLPIGAQGMSAGVQDAV + NLGWKLALDIKGQAPEGLLDTYHAERHPVGARILTNTLAQRILYLGGDEITPMREVLAE + LMGAHESVQRHLAGMVTGLDIRHDVGEGDHPLLGRRLPDRELVVDGEKTPFYALLRTAR + PVLLELGGDHGLRTAAAGWADRVDLVAAEFDGCEAPVDGILVRPDGYVAWVAGLGAGPD + GLTAALGRWFGPSA" + gene 19407..19889 + /locus_tag="IE238_RS36930" + /old_locus_tag="GCM10010308_74180" + CDS 19407..19889 + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_007389987.1" + /locus_tag="IE238_RS36930" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010308_74180" + /product="nuclear transport factor 2 family protein" + /protein_id="WP_050990831.1" + /transl_table=11 + /translation="MTSSLTTDQSASVSAAESSAQVAGLLHRYLVSLDDERLDDAWTAG + LFTEDAVVAFPVSRHEGADGMAEYHRSALSAFAATQHLGSPAVVDVDGDRAVFRANLIS + THVHHPRHTPPEGDLPPLFATGTFVNGEARRTARGWRLSLLAFRLLWADGSPPPAR" + gene complement(20105..20521) + /locus_tag="IE238_RS36935" + /old_locus_tag="GCM10010308_74190" + CDS complement(20105..20521) + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330949.1" + /locus_tag="IE238_RS36935" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010308_74190" + /product="pyridoxamine 5'-phosphate oxidase family protein" + /protein_id="WP_030970823.1" + /transl_table=11 + /translation="MPSMPRPDAVTVPDSVQAFLTGTALVAAFTTMRPDGTPHVAPVRF + TWDADAQLARVMTVRSSRKARNLLATPGAPVALCQVDGFRWVTLEGTGTVVTDPERVAL + GARLYAKRYWSAPPTPSDRVVIEIAVDRVLSLNA" + gene complement(20758..20904) + /locus_tag="IE238_RS36940" + /old_locus_tag="GCM10010308_74200" + CDS complement(20758..20904) + /codon_start=1 + /inference="COORDINATES: ab initio prediction:GeneMarkS-2+" + /locus_tag="IE238_RS36940" + /note="Derived by automated computational analysis using + gene prediction method: GeneMarkS-2+." + /old_locus_tag="GCM10010308_74200" + /product="hypothetical protein" + /protein_id="WP_019330950.1" + /transl_table=11 + /translation="MHEGDDERHEGDTARCARAVHGGPPPLRLAGAEEREDEDGRVIVR + SID" + gene complement(20939..22429) + /locus_tag="IE238_RS36945" + /old_locus_tag="GCM10010308_74210" + CDS complement(20939..22429) + /NRPS_PKS="Domain: Condensation_DCL (38-314). E-value: + 1.3e-48. Score: 157.5. 
Matches aSDomain: + nrpspksdomains_IE238_RS36945_Condensation_DCL.1" + /NRPS_PKS="type: NRPS-like protein" + /codon_start=1 + /gene_functions="biosynthetic-additional + (rule-based-clusters) Condensation" + /gene_kind="biosynthetic-additional" + /inference="COORDINATES: protein motif:HMM:NF012873.2" + /locus_tag="IE238_RS36945" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010308_74210" + /product="condensation domain-containing protein" + /protein_id="WP_193517009.1" + /sec_met_domain="Condensation (E-value: 3.4e-30, bitscore: + 96.0, seeds: 42, tool: rule-based-clusters)" + /transl_table=11 + /translation="MAWHSRPRALRGPGTARPPGVPALWPHLDLLGDFGGRRGAGRHVE + QLVWRWHGPLDTERFTAAWQSVVDRESVLRAALAPGPRPHLVLHEHAHGDVVRHRAGGA + GWDRLLERDRRRGLDPSRPCPLRVTLVERTDDPAGAGPVTRVVLTFHHALLDAWSVCLL + MQELCRAYLAGGELPGGERRPDLRDWAGWLQRQDPAGARDFWRGAVPDGPVAVLPARPG + PRTRQRGRGRTEVRLSPAEAERLHRWAALRAVPDSSALETVWALLLYRAAGPGGAATVG + FGVTVSGRGITLDCAERLPGPLRNCLPMVVRVDPGETVGRLLTALRDRALDMAAYEWVS + TRRIHRWTGRCPDGELLQSVVSVDSLPRPPGNLRNELAGAGIALEPEPAHGACPDLPVA + LLVRPGGDGRLTFCVDHDRNRISDADARLLAGHCARLLRHLPGTDEATTNGAVLDVLAG + EALPRIAPRPSRPRPAGSWLRPRSTSSGAAVDRAASHP" + CDS_motif complement(21452..21511) + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_IE238_RS36945_0004" + /evalue="3.90E+01" + /label="C2_LCL_024-062" + /locus_tag="IE238_RS36945" + /protein_end="326" + /protein_start="306" + /score="-3.2" + /tool="antismash" + /translation="LPMVVRVDPGETVGRLLTAL" + aSDomain complement(21488..22315) + /aSDomain="Condensation" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE238_RS36945_Condensation_DCL.1 + " + /domain_subtype="Condensation_DCL" + /evalue="1.30E-48" + /label="IE238_RS36945_Condensation_DCL.1" + /locus_tag="IE238_RS36945" + /protein_end="314" + /protein_start="38" + /score="157.5" + /tool="antismash" + 
/translation="GAGRHVEQLVWRWHGPLDTERFTAAWQSVVDRESVLRAALAPGPR + PHLVLHEHAHGDVVRHRAGGAGWDRLLERDRRRGLDPSRPCPLRVTLVERTDDPAGAGP + VTRVVLTFHHALLDAWSVCLLMQELCRAYLAGGELPGGERRPDLRDWAGWLQRQDPAGA + RDFWRGAVPDGPVAVLPARPGPRTRQRGRGRTEVRLSPAEAERLHRWAALRAVPDSSAL + ETVWALLLYRAAGPGGAATVGFGVTVSGRGITLDCAERLPGPLRNCLPMVVRVD" + CDS_motif complement(21503..21589) + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_IE238_RS36945_0003" + /evalue="6.10E-06" + /label="C5_DCL_263-294" + /locus_tag="IE238_RS36945" + /protein_end="309" + /protein_start="280" + /score="18.7" + /tool="antismash" + /translation="GFGVTVSGRGITLDCAERLPGPLRNCLPM" + CDS_motif complement(21917..21982) + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_IE238_RS36945_0002" + /evalue="4.90E-08" + /label="C3_DCL_135-156" + /locus_tag="IE238_RS36945" + /protein_end="171" + /protein_start="149" + /score="25.5" + /tool="antismash" + /translation="FHHALLDAWSVCLLMQELCRAY" + CDS_motif complement(22199..22300) + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_IE238_RS36945_0001" + /evalue="4.80E-10" + /label="C2_DCL_024-062" + /locus_tag="IE238_RS36945" + /protein_end="77" + /protein_start="43" + /score="31.7" + /tool="antismash" + /translation="VEQLVWRWHGPLDTERFTAAWQSVVDRESVLRAA" + gene complement(22634..23443) + /locus_tag="IE238_RS36950" + /old_locus_tag="GCM10010308_74220" + CDS complement(22634..23443) + /GO_function="GO:0008897 - holo-[acyl-carrier-protein] + synthase activity [Evidence IEA]" + /NRPS_PKS="Domain: ACPS (134-195). E-value: 7e-12. Score: + 37.1. Matches aSDomain: + nrpspksdomains_IE238_RS36950_ACPS.1" + /NRPS_PKS="type: other" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_007389988.1" + /locus_tag="IE238_RS36950" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010308_74220" + /product="4'-phosphopantetheinyl transferase superfamily + protein" + /protein_id="WP_029394636.1" + /transl_table=11 + /translation="MERVTCAAPLHVPRPHGPWPAVREDLFRHGNALVCTTWSEWLPSV + LTTPRLRELLGDDWQRYRRTRDAAVRYRFAASRMLIKYTAAAALAVPPEYLDLAYRLGG + RPYLRGFDQIELSLSHTGDVMAVGLSRIGRIGVDVEPAERPVRLDLLETQVFTPAEARE + LAELPEGERTAHALRLWTLKEAYSKALGQGLRFGFKEFGFRQGRLSAPDGSRVTRDEWG + FATYPVMDRFLLSVACHNAGLSTAGDTSVGTMLDQGFLSAMTDTGQQ" + aSDomain complement(22859..23041) + /aSDomain="ACPS" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE238_RS36950_ACPS.1" + /evalue="7.00E-12" + /label="IE238_RS36950_ACPS.1" + /locus_tag="IE238_RS36950" + /protein_end="195" + /protein_start="134" + /score="37.1" + /tool="antismash" + /translation="IGVDVEPAERPVRLDLLETQVFTPAEARELAELPEGERTAHALRL + WTLKEAYSKALGQGLR" + gene complement(23532..25412) + /locus_tag="IE238_RS36955" + /old_locus_tag="GCM10010308_74230" + CDS complement(23532..25412) + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330953.1" + /locus_tag="IE238_RS36955" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010308_74230" + /product="acyl-CoA dehydrogenase" + /protein_id="WP_193517010.1" + /transl_table=11 + /translation="MTAALDTAAGPTGQTPAPRSTTPTPAPEHTTPTPAPEHTTRAPAP + EPEHTTPTPECERAARAPEPERAARLEAALGDPFDPANPHGHLALVRADDTREAPHATE + ALLTEHGLSAEFVPHDLGGRLRDLEELARVLRPLFRRDLALGYGFGITSLFAASSVWTA + GDPHQRAALADVLLGGGRVAIVHREVAHANAILRREVRAQRPAGGGFLLNGSKDAVMNA + DRTDTFVVYARTSAGSGSASHSVLLLPGPPASGEVRRLARVEMPGMRGARFHGLRLADV + RLPDSALVGSLGEGVTLALRSFQISHCLIPGTVLAGVDSVLRLAVRAATENRPDGRPAR + RWHKALSGVFADLLACDAMAVTGLRALSLVPQHAHLLAAAVKYTMPDLLREDLEELAAV + LGARGYDRGPLYGGFQKLARDLPVAGLGHSGTAVCQAVLVPQLPALARTAWFRTAEPSA + ALFLPGAPLPPLDHRRLTHSGTDDPLTATLIGAAERLAARTGTQPLHAALAALARALVE + ELRVLRARCAALPAAGSTVFDPLACALADRYALLLCAAACLGVWEGQADGDGFLADPAW + AVLVLSRIGRRLGIAVPETPADAEQAVLAEALGRCRHGRSLDLYDTPLAG" + gene complement(25409..26293) + /locus_tag="IE238_RS36960" + /old_locus_tag="GCM10010308_74240" + CDS complement(25409..26293) + /NRPS_PKS="Domain: Polyketide_cyc (3-131). E-value: + 9.4e-13. Score: 40.4. Matches aSDomain: + nrpspksdomains_IE238_RS36960_Polyketide_cyc.1" + /NRPS_PKS="Domain: Polyketide_cyc2 (146-253). E-value: + 1e-07. Score: 24.3. Matches aSDomain: + nrpspksdomains_IE238_RS36960_Polyketide_cyc2.1" + /NRPS_PKS="type: other" + /codon_start=1 + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_019330954.1" + /locus_tag="IE238_RS36960" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010308_74240" + /product="SRPBCC family protein" + /protein_id="WP_078912213.1" + /transl_table=11 + /translation="MTAPAPSGVLYGLIADATVWPLFFPPSVHVEQLDFDGTRERLRMW + AVAGDRISSWVSHRRLDVGQRRVEFRQERPSAPVETMTGLWTVEPLGDGSRVTLEHAFT + VVGDAPADAAWTERVTRANSRAQLQRLAWLAERWTRLDDLVMSFEDTVRVNVPAELVFD + FLYRAGDWPDDLAGTRPLTVQEDTPGIQVLALDGRSATGGEAVRISFPAAGRLVHKHTR + TSGPLAAYTGEWTIEPQPGAGLDVTVRHDVLLNDDAALDQDAARRACDEVGRAGRRLLE + HAVRHASDAVRVL" + aSDomain complement(25535..25855) + /aSDomain="Polyketide_cyc" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE238_RS36960_Polyketide_cyc2.1" + /domain_subtype="Polyketide_cyc2" + /evalue="1.00E-07" + /label="IE238_RS36960_Polyketide_cyc2.1" + /locus_tag="IE238_RS36960" + /protein_end="253" + /protein_start="146" + /score="24.3" + /tool="antismash" + /translation="SFEDTVRVNVPAELVFDFLYRAGDWPDDLAGTRPLTVQEDTPGIQ + VLALDGRSATGGEAVRISFPAAGRLVHKHTRTSGPLAAYTGEWTIEPQPGAGLDVTVRH + DVL" + aSModule 25535..26284 + /domains="nrpspksdomains_IE238_RS36960_Polyketide_cyc.1" + /domains="nrpspksdomains_IE238_RS36960_Polyketide_cyc2.1" + /incomplete + /locus_tags="IE238_RS36960" + /tool="antismash" + /type="unknown" + aSDomain complement(25901..26284) + /aSDomain="Polyketide_cyc" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE238_RS36960_Polyketide_cyc.1" + /domain_subtype="Polyketide_cyc" + /evalue="9.40E-13" + /label="IE238_RS36960_Polyketide_cyc.1" + /locus_tag="IE238_RS36960" + /protein_end="131" + /protein_start="3" + /score="40.4" + /tool="antismash" + /translation="PAPSGVLYGLIADATVWPLFFPPSVHVEQLDFDGTRERLRMWAVA + GDRISSWVSHRRLDVGQRRVEFRQERPSAPVETMTGLWTVEPLGDGSRVTLEHAFTVVG + DAPADAAWTERVTRANSRAQLQRL" + gene 26608..26844 + /locus_tag="IE238_RS36965" + /old_locus_tag="GCM10010308_74250" + CDS 26608..26844 + /codon_start=1 + /inference="COORDINATES: protein motif:HMM:NF039972.1" + 
/locus_tag="IE238_RS36965" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010308_74250" + /product="hypothetical protein" + /protein_id="WP_031022584.1" + /transl_table=11 + /translation="MRRFRPRRCVRGLWEGLVAYGRLCLAGETDRYDHPPRPRIRWHRP + PPGHPERVRDDMPLTDLERRLARELADEDHDVR" + gene complement(27171..28448) + /locus_tag="IE238_RS36970" + /old_locus_tag="GCM10010308_74260" + CDS complement(27171..28448) + /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (89-421). E-value: + 3e-25. Score: 80.8. Matches aSDomain: + nrpspksdomains_IE238_RS36970_PKS_KS.1" + /NRPS_PKS="type: PKS/NRPS-like protein" + /codon_start=1 + /gene_functions="biosynthetic (rule-based-clusters) T2PKS: + t2clf" + /gene_kind="biosynthetic" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_018846562.1" + /locus_tag="IE238_RS36970" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010308_74260" + /product="ketosynthase chain-length factor" + /protein_id="WP_193517011.1" + /sec_met_domain="t2clf (E-value: 2.5e-172, bitscore: 564.0, + seeds: 26, tool: rule-based-clusters)" + /transl_table=11 + /translation="MTKATQAPEPARPAPTPAGAEGPRQTLVTGIGVAAPNGLGTRAWW + DAVLCGRTGLGPITRFDASGYPVRIAGEIPGFVDEDHIPSRLLPSTDRGTRIALVAAEE + ALRDANVSPADLPAYGAGVITASSAGGAEFGERGLAALWSKGAQHVSAYQSFASFHAAA + PAQISIRHRLRGHGSTVVSEQAGGIDALARARRRIRDGACLMVTGGIDSTLCAWGWAAH + LADGRLSPATEPARAYRPFAATADGHAVGEGGALLVLEDARAAARRGATGYGVIAGCAA + TFDGPDRPTLRQAAELALADAGLAPEHVDVVFADGAAERRADLVESQALCALFGPYGVP + VTVPKTMTGRLGAGGSALDVAAALLALREKVVPPTTGTGRVADDCPLDLVTGAPRELPR + LRVALVLARGRGGFNSAAVLQAPQTQ" + aSDomain complement(27186..28181) + /aSDomain="PKS_KS" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE238_RS36970_PKS_KS.1" + /domain_subtype="Iterative-KS" + /evalue="3.00E-25" + /label="IE238_RS36970_PKS_KS.1" + /locus_tag="IE238_RS36970" 
+ /protein_end="421" + /protein_start="89" + /score="80.8" + /tool="antismash" + /translation="STDRGTRIALVAAEEALRDANVSPADLPAYGAGVITASSAGGAEF + GERGLAALWSKGAQHVSAYQSFASFHAAAPAQISIRHRLRGHGSTVVSEQAGGIDALAR + ARRRIRDGACLMVTGGIDSTLCAWGWAAHLADGRLSPATEPARAYRPFAATADGHAVGE + GGALLVLEDARAAARRGATGYGVIAGCAATFDGPDRPTLRQAAELALADAGLAPEHVDV + VFADGAAERRADLVESQALCALFGPYGVPVTVPKTMTGRLGAGGSALDVAAALLALREK + VVPPTTGTGRVADDCPLDLVTGAPRELPRLRVALVLARGRGGFNSAAVLQA" + gene complement(28445..29716) + /locus_tag="IE238_RS36975" + /old_locus_tag="GCM10010308_74270" + CDS complement(28445..29716) + /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (3-396). E-value: + 4.4e-49. Score: 159.3. Matches aSDomain: + nrpspksdomains_IE238_RS36975_PKS_KS.1" + /NRPS_PKS="type: PKS/NRPS-like protein" + /codon_start=1 + /gene_functions="biosynthetic (rule-based-clusters) T2PKS: + t2ks" + /gene_kind="biosynthetic" + /inference="COORDINATES: similar to AA + sequence:RefSeq:WP_005321633.1" + /locus_tag="IE238_RS36975" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." 
+ /old_locus_tag="GCM10010308_74270" + /product="beta-ketoacyl-[acyl-carrier-protein] synthase + family protein" + /protein_id="WP_193517012.1" + /sec_met_domain="t2ks (E-value: 2.3e-202, bitscore: 663.4, + seeds: 25, tool: rule-based-clusters)" + /transl_table=11 + /translation="MNRVVITGIGVVAPGAVGTAGFWDLLTVGRTATRRVTLFDACGYR + SRVAAEVDFTPAAHGFDLADTERLDRAAQFALVAAREAVADSGVADRIGRNPLRTGVSL + GSAIGCTTSLATQYAILSDCGTTWTLDHTEAAESLYDYFVPSSLAATVARDRGAQGPVA + LVSSGCTSGLDAVGHGADLIREGSADIVVAGGTEAPIVPIAMACFDRLRLTSSRNDDPA + TASRPFDRTRDGFVLGEGAAVLVLEELEHARRRGARPYAELSAITAHSSAHHMTGLRPG + ALEMADAIRAALDQARLNPADVDYISAHGAGTRHNDRHETHALKESLGGSAHRVPVSSI + KSMIGHALGAAGALDLAASALAIRHDTVPPTANLHEPDPTCDLDYTPLFAREQRTSTVL + TVASGFGGFHTAAVLTRPQLKEAA" + aSDomain complement(28529..29707) + /aSDomain="PKS_KS" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE238_RS36975_PKS_KS.1" + /domain_subtype="Iterative-KS" + /evalue="4.40E-49" + /label="IE238_RS36975_PKS_KS.1" + /locus_tag="IE238_RS36975" + /protein_end="396" + /protein_start="3" + /score="159.3" + /tool="antismash" + /translation="VVITGIGVVAPGAVGTAGFWDLLTVGRTATRRVTLFDACGYRSRV + AAEVDFTPAAHGFDLADTERLDRAAQFALVAAREAVADSGVADRIGRNPLRTGVSLGSA + IGCTTSLATQYAILSDCGTTWTLDHTEAAESLYDYFVPSSLAATVARDRGAQGPVALVS + SGCTSGLDAVGHGADLIREGSADIVVAGGTEAPIVPIAMACFDRLRLTSSRNDDPATAS + RPFDRTRDGFVLGEGAAVLVLEELEHARRRGARPYAELSAITAHSSAHHMTGLRPGALE + MADAIRAALDQARLNPADVDYISAHGAGTRHNDRHETHALKESLGGSAHRVPVSSIKSM + IGHALGAAGALDLAASALAIRHDTVPPTANLHEPDPTCDLDYTPLFAREQRTS" + gene complement(29713..30492) + /locus_tag="IE238_RS36980" + /old_locus_tag="GCM10010308_74280" + CDS complement(29713..30492) + /NRPS_PKS="Domain: Thioesterase (15-242). E-value: 7.3e-38. + Score: 123.1. 
Matches aSDomain: + nrpspksdomains_IE238_RS36980_Thioesterase.1" + /NRPS_PKS="type: other" + /codon_start=1 + /inference="COORDINATES: protein motif:HMM:NF013166.2" + /locus_tag="IE238_RS36980" + /note="Derived by automated computational analysis using + gene prediction method: Protein Homology." + /old_locus_tag="GCM10010308_74280" + /product="alpha/beta fold hydrolase" + /protein_id="WP_193517013.1" + /transl_table=11 + /translation="MASRSRDREAGTARITLTCLAHAGAGVASYRGWSAAVGPGIDVAA + LPLPGRDSRRREPRLTERAGLLADFLPTLLQTARRGPYALYGHSMGALVGYTLTRALAD + SGLPPLFLAVGACPPPHTTSVLADAADLPDEDLLPLLDEIGSLPPGASASPGGLWRRTF + LPVLRDDLRLARSLRNAALDPVTGGPLDVPVLVFAGRDDPLAAPAALRHWQQWTTNLIE + LHTVAGGHFFASSSSLAQHVGRACRGHVTALPTGGGR" + aSDomain complement(29767..30447) + /aSDomain="Thioesterase" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_IE238_RS36980_Thioesterase.1" + /evalue="7.30E-38" + /label="IE238_RS36980_Thioesterase.1" + /locus_tag="IE238_RS36980" + /protein_end="242" + /protein_start="15" + /score="123.1" + /tool="antismash" + /translation="TLTCLAHAGAGVASYRGWSAAVGPGIDVAALPLPGRDSRRREPRL + TERAGLLADFLPTLLQTARRGPYALYGHSMGALVGYTLTRALADSGLPPLFLAVGACPP + PHTTSVLADAADLPDEDLLPLLDEIGSLPPGASASPGGLWRRTFLPVLRDDLRLARSLR + NAALDPVTGGPLDVPVLVFAGRDDPLAAPAALRHWQQWTTNLIELHTVAGGHFFASSSS + LAQHV" + CDS_motif complement(30187..30255) + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_IE238_RS36980_0001" + /evalue="3.80E-07" + /label="NRPS-te1" + /locus_tag="IE238_RS36980" + /protein_end="102" + /protein_start="79" + /score="22.6" + /tool="antismash" + /translation="RGPYALYGHSMGALVGYTLTRAL" +ORIGIN + 1 cgccacagca ggacgtcgcc gagttcgcgg aagtaccagc cgttgccgac gatgccgtgc + 61 tcggacgggt aggtcccggt gaggaaggtg gactgggcgg cgcaggtgac ggcgggcagg + 121 acggtgccca gcggggcgcg ggagccggac tggccgagcc gtttgaggtg gggcatgtgg + 181 tccaggagcc ggggggtgag gccgacgacg tccaggacca gcagcgggac cggccccccg + 241 
gaagaggtgg tgggggtcat ggcagctcct tcaggccgag gtcggtcagc aggtcacggg + 301 cgagcatcag ctccgcggcg atcccgtcgg tgagctgggc ccggccccgg ggccgcaact + 361 gggccggcaa cgcctgccag gtgtaggtct ccacctccag atgccgggtc agcggacgcg + 421 ccccgcccac cagccgggac agagccgact tcagcaccgg cagagtcgag gtgagcggcg + 481 cggccgggtc cgcgtgcagg gggacgtgga agtgcgcgcg ccagggcgcc gagtcgggca + 541 gcggtccgcc ggcggccagg gcctcgtcca ggtcatccgt gccacgcagc ccgcccgtgg + 601 cagtggtggt gcgggtctgg tgcaggaagc ggggctcggc gaaggcggcg agagcgtcgc + 661 gtacttcgag acgagaaggg tgctcggcgt gcagggcggc ggagagctgg gacttcacga + 721 ttcggatccc ggccgcctcc agggcgtcca gcgcttcctc cggatcctcg aaggaggtgg + 781 cgaggtggca ggtgtcgaca cagacaccga ttcggtcgtg tccgatcgcg cccagcggag + 841 cgatagcgtc ccgggtcgtc tccacgatgc agccgggttc gggttccagg ccgatgcgga + 901 tggagcggcc ggtcagctcg tgaagggtgt ccagacgctc gccgagcgtg gccagcgccg + 961 tgcgggcctt gtcggcgcgg gtctcgtccc aggcggtgcg ccaggccagc ggcagcgtgg + 1021 agacggagcc ctcgctcaca tcgtcgggca gcagtccggc gaggacgcgg gccagggcgg + 1081 tggtgtgctc caggcgttcg gggtgagccc agtccggttt gtagacgcgg tacttgacct + 1141 cttcggcgcc gaagccctgg taggggaagc cgttgagggt gacgacctcc agtccccgcc + 1201 ggtcgagttc ggtgcgcagt ccgcgcagcg cggaggggtc ggtggccagg gcgtgggcgg + 1261 cgtctttggc gagccacagc ccgatgccga gacggtcgcg gcccaggcgg cggcggaccg + 1321 gctcgcagtg gtcgcggagc tgggcgagga ccccgtcgag ggtttcggcg ggatggacgt + 1381 tggtgcagta ggcgaggtgg acggtggagc cgtccgggtg ccggaaccgc accgttcacg + 1441 ctcccgtcgg cagcggctcg gcggccgggg cgccgcgcag gacggagttg ccctcgtggg + 1501 tgggcgcggt ggccgtgacg tcgaggtcga ggcgtccgct gaggccgtag aaggcgacgg + 1561 ggttgcgcca cagcacccgg tccacgtcgt cctcgccgaa gccctcctcg agcatcaggt + 1621 caccgacctt gcgggtcttg agcgggtcgc tcctgcccca gtccgcggcc gagttcacca + 1681 gcaccttctc cgggccgtac tcacgcagca gagcgaccat gcgggcctcg tccatcttgg + 1741 tgtccggata gacggagaac cccagccagg caccgctgtc cttggcctcc ttgaccgtgg + 1801 tctcgttgag gtggtcgacc agcacccggt ccgtgggcag cgcggactcg cgcaccacgt + 1861 ccagcgtgcg gcgcagcccg gcgagcttgt 
cccggtgcgg ggtgtgcacc agcgccggca + 1921 gcccgtggtc ggcggcgagc tgcaactggg cggccagcgc ggtgtcctcg gccggggtca + 1981 tcgagtcgta gccgatctcc cccaccgcca ccacccggtc cttgaccaga tagcgcggca + 2041 gctcggccag caccggagtg cagcgcggat cgttcgcctc cttcgggttc aacgcgatcg + 2101 tgcagtgatg ggcgatcccg tactgcgccg cacggaacgg ctcccagccc agcaacgcgt + 2161 cgaagtagtc acagaaggag gctgcagagg tgcggggctg ccccagccag aaggcgggct + 2221 cgaccacggc acggacaccc gcggcgtaca tggcttcgta gtcgtcggtg gtccgggacg + 2281 tcatgtggat gtgggggtcg aagatgcgca agtcactgct cctgggtcag ggcgagcacg + 2341 cggtcgaggt cggccgggat gtctcggtgg gcggcggtgc gctcggcggc gtaggcgcgc + 2401 agcattctgg ccagttccgc gtctgcgcgg gcgcgggccg ccaggtttgc cacggtggcc + 2461 acgggcacgc cggtgaacag gcacttgagt acggcgtgcc gccattggtg ggcgtccagg + 2521 tgccgggccg cgtaggggcc gagggcggcg gcgagcaggg tggtgtcgtt ggcgcgcagg + 2581 gcgtcttcga ccagcggcag agcgtgggcg ggttcggtgt cgagtccgtc cagggcgagc + 2641 aggaccgcac gccgttcggc ggctgtcccc cggtggtaca gcagggtcac ggtctccgcg + 2701 tcggggcgtg ccgccgccag cagcagtacg cgggcggcgt cggcgtgttc ggtgccgcag + 2761 cggcggcccg cctcggcgaa gcgcagttcc cagtcggtgt cccgggcggt tgccgaggcg + 2821 cgggcggcgg tgagccagcg gcgtgcgtcg gtgccgaggc cggcgaactc gccgggcagg + 2881 tccgcgtccg gcggggtgtg tacgacggtc atctcgtccc tccgttgcgc aggaaccgca + 2941 tcgactgtgc ggccagttcg ggtccggcgt gggagtgccg gggcagttcg acgacggtca + 3001 ggccctggta gccggtggcg gcgagggcgt cgagtacggg cgggaagtcg atctcgccgt + 3061 ccccgaaggg gaggtgttcg tggacgccgc ggcgcatgtc ctcgatctgc acgtgccgca + 3121 gccagggcgc ggcggcccgt acgcagtcgg cgggcggcag gggctccagg cactggcagt + 3181 gcccgatgtc gagggtcagt cccagtggtt cggggtcgcc cagttcggtg cgcaggcggt + 3241 ggaagtcggt cagtgtggcc agcaggtggc cgggctcggg ttcgaccgcc agggggacgc + 3301 cggtgtcctc cgcggcgtcc aggacggggc cgagggcgtc ggccaggcgt ttccaggcgg + 3361 tgtcctggtc caggcccgcg ggccgtgggc cgctgaagca gtgcacggcg tgcgcgccga + 3421 ggtcggcggc gacgcgtacc gagcggatca gcaggcgtat gcgtgcccag cgggcgtccg + 3481 ggtcgtcgtc gagcaggctg ggtccgtgct tgcggcgcgg gtcgaggacg 
tagcgggcgc + 3541 cggtctcgac ggtgaccgcg aggccgaggc ggtgcagttg ccgggcgacg tggcgggtgc + 3601 gggccgcgag gtcgggggcg agcgggtcga ggtgcatgtg gtcgagggtg agtccgacgc + 3661 cgtcgtagcc gaggtcggcc agcaggcgca gggcgtcctc caggcgcagg tcggtcagcc + 3721 cgttggtgcc gtagccgagg cgcagcgggc tcatgtggtg ctcactttcc gggccaggtg + 3781 cgcggcgagg ggtgccaggg cggcggtgag gacgccggtg ccgggtgcgc cggcccgggc + 3841 catcagtccg ctctgcaggg cgatcgtggc gcggacgccg gcgccgacgg cccgctgtgt + 3901 cagttccggg gaggggttga gcgcggcgtg ggccaggggg cgggcgaagg tggcggcgta + 3961 ggaagcggcc agggcggcgc gtacggcgcg ggtggccttg tcggccggtg gtgtcgcggg + 4021 agtcggtgcg ccggtgctgg cgtcgggcgc ggggtgggcg gtggggcggc cggcgaggac + 4081 ggtggtgagg gcgcccgcgg cggcgagggc cgtgaggggg gcggtgctgg agccgccctc + 4141 ggtctcgcgg cgggagacga gggagacggc cagggtgtgg ctgccgagga acgccgccgg + 4201 gacgatcgcc cgtcgcacgg cgcccgggcc ggcggccgcg cccagcagca ggtccaggga + 4261 gcgggcggcg gccatcgccg cgggtcccgc cggggtgtgt ttcaggccca ggtcgtaggc + 4321 ccatacggtg gcggccaggg ggccggcgac cgcgagggcc cgtcgtcccg cgcatgcggc + 4381 gagggccagg cccgcggcgg agaggaggcc cgcggcggcg agggcggcgc cgggccggac + 4441 gcggccggac ggcagggggc ggtggggccg ggcggtggcg tcctcctcgc ggtccgccca + 4501 gtcgttgagt gccatgcccg cctcgtacag gcacagtgag gcgccggccg cgagggcggt + 4561 gcgtccggtg ggccgtgtgc cggcggccgc ggtgccggcg aggacgtcac cggggacggt + 4621 gagcgcggcg ggggcgcgca gcagttcggc ccaggcgtgg aggtgcccgt cgcgggccgg + 4681 gccgtgggcg ggccgctgag cgctcacctg gttcctccga gccggtcggc gagggtgagc + 4741 agtcgggtgt actgctcggc cagggcggag ccttcggcgt cggggtcctt gaagtagaag + 4801 ccgagttcgc ccagcgggcc ggacaggccc cgctcgtggg cgcgggcgag caggcgggcc + 4861 aggtcgagga cgagcggtgc ggcgagggcg gagtcgcagc cctgccagat ggtctgcagg + 4921 accatgcggg tgccgaggaa gccgtcgaag gcgacgtggt cccaggcggt cttccagtcc + 4981 ccgagggcgg ggacgtcgtc gatgtgcact tcgccttcga cccgggtgcc gagggtgtcg + 5041 gtgaggacgc gttccttgcc ggcgttcttc gccgcggcgg cggcggggtc ggcgagggcg + 5101 gcgccgtcgc cgccgcccag caggttcgtg ccggaccagg cccgtaccgc cagtgcccgc + 5161 tgggcgaaca 
tcggccccag caccgaacgc agcagggtct gcccggtctt gccgtcgcgg + 5221 cccgcgtacg gcaggcccga ggcgcgggcc gcgcccgcca gctgggggtg gctcagcccg + 5281 gtcgacggcg tgaagttgac gtaggggcag cccgcccgca gggccgccgc ggcgtacagg + 5341 gagctggccg gccacgcgcc gtgtgcgggg tccggttcgg tggaggcgac gttgacgacg + 5401 accgtgcggg cgacgccggt ggtgcgggcg aaggtgcgca ggtcggtggc gaagtcggct + 5461 atcagctctt cggtggcgcg acggtcgccg ggtaccggtc ctccggggcg gatgtgttcg + 5521 tccgcggcgg ccagttcccc ctggacggcg gtcggcagcc agggcggcag tactccttgg + 5581 gcggccagtt cctcggcgcg tttgggcagg ggggtggtcg ccgtgtcgtg gccgccgaag + 5641 acgagggagg ccagggccgg caggccgcag tcggcgaagg ggggcgtctc ggtgaccatg + 5701 ccggtgggtg gcagcagtcc tgccgccagc gccgcgcagc ccgacaccgc cgtcgtggcg + 5761 accgaaccgc gggctccgac gagccacacg ccggtccggg tctcgtcggc cgaggtcatg + 5821 gcatcttgcg tcacggggca gcctccctga gcgtcgaatg tgttgtccgg caagtggatg + 5881 cccggccagg atgccgagcc gggctgtgcg ggggcgtcgc cctccgtcgg ctgtcgagcg + 5941 gccgccgagc ggattcccat cggccgcggg cgtccggcgc cgggcacagc gaggccccgc + 6001 cggtcgcagg ggtgcgggac cggcggggcc tggcaggggg gtgtgcgcgg cgcaccctcc + 6061 tgcgggggtc agcggttgac gcggaccagc tggccgttgg tgccgagcgt gttgttggtg + 6121 acgtacacct tgccgcaggg gtcgacggcg acgccggtgg gctgcttgag ctggtcgccg + 6181 gtggggatct cggtgaccgc gccgctgtcg gcgtcgatct cgaacagggc gcccggctgc + 6241 ggcgggccgg ccagcgcggc ggcgctgtag gacagggcga tcaggtcgcc gtcccggtcc + 6301 aggtccaggt cgatgaggtt ggtcatgccg gtggcgagga tctcgggctg ccggcccggg + 6361 gcgatcttcc agacgcggga ggcgccgacc cggccgccgc tcatgtcggc gacgtacacg + 6421 gtgccgtcgg cggccttggc gatgccggtg ggtacggtct cggcggcgcc ggtgggcagt + 6481 tcgttcttgg gcaggaggta ctcggtggcg gtggtgccgt cggcgttgcc gcgtacgacg + 6541 gtgttggcgc ccgcgtcggt ggccaggtag ccgctgccgc tgcgcgcgag ccgccacggg + 6601 ttggcgtgca cgtcgccgcc gtcggggttc agccgcgtct cgtggtcggt gaggtcggcg + 6661 agcaccttgt ggtcgcgggt gcggaagacc gtgcccaggg tctgggcgcc ctcgcccagc + 6721 gcggcgcgcg actcggtggt gccgccgagg ccgctgacga cgacgtagcc gccgaaccgg + 6781 tcgggcacga cgtcgctggg gccgttggcg 
gagatcgggg cgcccggggc gacgcccttg + 6841 gccgtggagg cgaggccggt ggcgacgcgg ccctggaagc tgcccttgac cttgtagacg + 6901 gagccggtgg tgcccacgca cgtctggtcg accgggcagt cggccagtcc ggcgccggcc + 6961 tcggcgacca gcacgccgcc gtcgcccagc gcggtgacgc cgcgcgggtt gttcagctgg + 7021 gaggccacga cggtcacggt cgcctcggta cgggtgtggg tgtgaccgtg gcggtgggcc + 7081 tggggctggg cctggacggg gccggcggtc agcgggacgg cgacggcgcc ggccgcgccc + 7141 gccgccagaa gtatcttcgt ccaggagtta cgcgagttcg ccatttctct cctcggtttc + 7201 caatgctccc cccttttccc ggagagcgga tgcgaaatca gcgccaccct agggcagtcg + 7261 ccggttttat tgcgtcaaat tttccgcagg aaaaagtggg tgcacccgtg aaccagcggt + 7321 attcgagtct ccctccagga ggcgtcgacc tttttccata tcgttgtagt cccggtccct + 7381 tccggcggtt gggacagact tttgcgctcc tgccatggag gaaactcatg cccgaattgc + 7441 cgcctccgca cgtcgtacgg gaagcggaga aagcacgagc ggatctgcag cggcagagcc + 7501 gggaactcgc gcctccgccg ttcgctctgc tggaattgat catgggtgtc atggtcacgc + 7561 gtgcggtgca cgtcgccgcc gaactgaagg tggccgaggc gctcgccgag ggtccgctgt + 7621 ccgccgacga gctcgccggg cgggtcggtg cggacgccga cgcgctcggc cgggtgctgc + 7681 gcctgctggc gagcaacggt gtgttcgcca cgcgcccgga cggtgccttc gagctgacgc + 7741 cgatggcgga cgcgctgcgc gccgaccatc cgatgtcgat gcggggcatc gcgctgctga + 7801 tgggccaccc gatccactgg gaggactgga gcggcttccc ggagacggtg gtcaccggcg + 7861 agccggcgct gccgaagctg cgcggtatgc acgccttcga gttcctgacg aagaacgcgg + 7921 agtacggcca ggtgttcttc cagggcatgg gcagcatgtc cgcctcggag acggagccga + 7981 tcctggcggc gtacgacttc tcgcagttcg ggacggtggt ggacttctgc ggcggccagg + 8041 gcgcgttgct cgcgggcatc ctgggtgcgg cgcccgggtg cgagggcgtt ctgttcgacc + 8101 cgcgggtcga ggagaacggg gctgcggagt tcctggccgc gcagggtgtg gccgaccgga + 8161 cgaagcgggt ggccggcgac ctgttcgacg tgccgccggg cggcgccgac gcctacgtcc + 8221 tcaagcacat cgtgcacgac tggcccgagg agcaggccct gcggatcctg cgcaacgtgc + 8281 gggcggcgat caagccgggc ggcaagctgc tgatcgccga gatggtgata ccggagcagg + 8341 gtgaccagcc gcactccggg aagctggtcg acctgtggct gatgctcctg gtcggtggcc + 8401 gtgagcgtac tcccggccag tacgccgatc tcctggcccg tgccgggttc 
cgtctggagc + 8461 gggtcgtgga gacggcggcg gcgatctccc tcgtggaggc cgtccccgtg tgaccaccgt + 8521 ggagggaggg ccccgtcgcg tgatgaggga acgcggcggg gccctccggt gtgtgcggcc + 8581 gggcagcggc ggccgggtgg gcgggggcgc cggcgggcag gcccgcgggg agcgccgggc + 8641 ggcggggggt gccgggcggc ggggggtgcc gggcggcgga cgaaggcccc cggcgtgcgc + 8701 gcacgccggg ggccgctaga gggggtgtgg gtcagcgggg cgggccgaac caccgttcca + 8761 gggccgtttc caggccctgc gcgcaggtgc ccgtccaggc gacgtagccg tcggggcgga + 8821 tcagcacggc ggtggcgccg gcgagggcgt ccgggccgtc ggtgggcttg gcgacggcgg + 8881 tgaccacgtc cacccggtcc gcgtggccgg ccgcggtcgc gcgcaccgtc tcgtcgtcgg + 8941 cgaggtcgag cagcacgccg tgcccggcgt gcaggaggcg ggcgatgcgg gtttcgccgt + 9001 ccgcgccgac gagcagccgc ggcggcatcc ggcgtcccag cagcgggtgg gtggggccgc + 9061 tcgcggtgcc ggcgaggtcg tagcggatgt ccaggtggct gacgatgccg gccaggtggc + 9121 gtttgacgtc gtcgtagcgg accagctcgg ccatcagctc gcgcagcggg tcggactcgg + 9181 cgccgccgag gaagacgatg ccctgggcgc gggtgttcat cagcagccgg gcgccgaccg + 9241 ggtggcgttc ggcgtggtag gtgtccagca gttcccgggg ggcgtcgccg cggatcaccg + 9301 aggccagctt ccagccgagg ttggcggcgt cctgcacgcc ggtgctcagg ccctggccgc + 9361 cggccggcag gtggatgtgg gcggcgtcgc ccgccaggaa gacgcggccc cgccggtact + 9421 cggaggcctg ccgggtggcg ttggtgaagg agctgaccca gctcgcgccg ccgtggctga + 9481 tgtcctcgcc ggtgatgtcc tgccaggcgg cggcgacctc ctcgaaggtg acggtccgct + 9541 cacggtcgtg cgcggggcgg ccgtcggggc agacgatgat gcgccacaca ccctgggaga + 9601 gcggtgccgc catcaccatg ccgttgttca ggcgctctcc gaggaagcgc ggggtcagct + 9661 ccacaccggt gatgtccgcc aggtacatgc cctgggtggc gtcggttccg gggaagtcga + 9721 acccggccgc cctgcggacc cggctggagc cgccgtcgca gcccgccagg taggaggcgc + 9781 gcagggtgcg ttcctcgccc tgcggggtgc gtacggtgat ctcgacgccg tcgccgtcca + 9841 ggaagccgtc ggtgagggag acgaactccc agccgcgccg gatgtccgcg ccgagttcgc + 9901 ccgcccagcc ctccaggacc gcctcggtgt cgccctgggg gatgccccgg gccccgaagt + 9961 gggcgtcctc gaggacggtg aagtcgaact gggcgccgcc gaagtgtcct acggggctgg + 10021 tggccagggt ctctccctgg ccgaaccggg gcagcagccc gcgttcgtcg aacgtctcca + 10081 
tggcgcgggc ggtgaagccc aggccgcggg actgcccggt gggggcggcc agcttctcga + 10141 tgacgacgac acgggccccg cccaggcgca gttcgcccgc gagcatcagt ccggtcgggc + 10201 cggcaccgac gacgatcacg tcggtgtccg ccgctgtccc ttccatgggt ggtccttcct + 10261 ggcagtgggg tcggttcggg gcccggcggt ggggggcggc gcgtggtgcg gtgccggtcg + 10321 tccccgccgg gccggggcgc acggcaggtc agcggggagg tccgaaccag cgggtgagtg + 10381 cctcggcgag gccgtcggtg cccgggccgg cccaggccac gtggccgtcg gggcggacca + 10441 ggacacggtc ggtgccctgc agtgaactgc ccggcaaggg ctgggcgtcc agtgcggtga + 10501 cgcggtccgc ccagccgtcg aggactgccg gcggccggcc gggccggccg gtcaggtcca + 10561 gcaggacgcc gccgcccgag cgcaccaggt gggtggtggt gagcaggcgt cggcgtgccc + 10621 gcacctcggt gcacggcagc cgggccccga gcagcgggtg ggcggggccg ccgacgtcgt + 10681 agcgcacgtc caggccgctg atcatgccgg ccaggcgacg gcgtacgtcc tcctgcccga + 10741 tcaactccgt cagcaggtcg cgcaacggct cgacctccgg tccgccgagc agcagcagcg + 10801 actgggcgcg gatgttggcc aggacctgcc ggccgacctc gtgacgttcg tcgtggtagc + 10861 tgtcgaggag ggtctgcggt gccttgccgc gtaccaccag ggccagtttc cagcccaggt + 10921 tgaaggcgtc ctgcatgccg aggttgaggg cctggccgcc gaccggcatc tgccggtggg + 10981 cggcgtcgcc cgcgaagagg acgcggccgt gccggtagcg ggtcagctgg cgggaggcgt + 11041 cgccgaaggc gttggcccac aggggggtgc cgccgctgat gtcctcgccg gtgacccgct + 11101 tccacaccgc ggtgatctcc tcgaaggagg cgtcgccgtg cgggcgggcc cgcgcggcgg + 11161 agccgaactc gtggaccatc acccgggtca ccccgtcggg gcggcgggcg gcgatcgcca + 11221 ggccgtgctc caggcgttcg aagcgccggc ccgggatgtc gatgccggcg acgtcggcgc + 11281 gcagcagttc ccgcgtcgcg tccctgccgg ggaagtcggc gccgatcagg cggcgtacgg + 11341 tgctctcctc gccgtcgcag gcgaccaggt agcggcagcg cagccgcagc gtccgtccgt + 11401 ccgggccggc ggcttcggcc tccaccaggt cgccgctgtc gtcgagcgcg gtcagttcgt + 11461 gcttgcactg cagttcggcg cccagtgaca gcgcccactc ccccaggatc acctcggtcc + 11521 tggtctgcgg caccttccac tggccggggt gggaggaggg cagtgtcaga tccagcggga + 11581 tgcccccgaa gtggccgcgc ggctcgttcg gcgggtcgcc gaactcgggc agcaggctcc + 11641 ggctgtcgag gatctccatc gtgcgggcgt gcagggtgga ggcccgggac tcggtgctgg + 11701 
gagcgcgtcg cttctccacg accaccacgc cgacgccgcc gtgggccagt tccccggcga + 11761 gcatcatccc gacggggccg gctccgacga cgacgacgtc ggtggtcagg gcgtccgctg + 11821 ccacggttca gcccttcttc tgctcggcgt aggccttggc gtgggcgagg gtggcgcggc + 11881 tgttggtgga cagggccgtg tggacgtagg cgcgggcgtc ggcgacggtg gcgtcctggc + 11941 cgaggatgcg ggcgatgttg gcggtgttga gggtgacggt gtgctgggag gaggcggtgg + 12001 tcgcctcgtc gccctcggtg aaggtccatt cgccggtgtg cagggtcatc agcgcgggca + 12061 gggtgacctg cttgtaggcg atcttgtggt gggggaagac gacccggtag gacttggtgg + 12121 tgtgcaccga gccgtccttg gcgcgggtgt ccatctccag ctcctgcagg ccgggggtgt + 12181 cctcgctcag gcgcaccacg gcgacgtgcg ggagccgttc ggcccacagc tgggcctcgt + 12241 tgatgaagtc gaagacgtcc ttggcggcgc cgtcgatctg cacggtgtcg gcgaaggaga + 12301 acgtcagctc ctcggtggcg gcggcgtgcg cggcctcgac gttgaccttc agggcggcca + 12361 gctcggaggt gctgttcttg tccacggcct gctcgatcca cagcaggtcg tgcgggtcgt + 12421 cgccgatggc gctgtagtcg tgcaggagcc gcacccgcga ccggtcgtcg gcgagcggct + 12481 cgatgatcca ggtgccgccc atgtgcttga ccggggcggc cgggatctcc tggcggaagg + 12541 tgatggtcag gttctcgcgg tcgagcgtgc ggcgcgaggt ccactccttg gcctggccgt + 12601 tggcggtcgc ccagatgtgg atgcgttcgt ggtcgccgtc ggcctcggtg cggtcgacgt + 12661 ggatggtggg cgggaagatg cgcggccagt tggtcacgtc cgcgagcagc tggtagacgg + 12721 cgtcggccgg tgcgccgatc gtgatctcgt gctcgacctc acgtgtggtc atgaggctca + 12781 ctcctcgggg aaggggtcgg gtgccgggtg cgtcagaagt tgccgaggcc gccgcagacg + 12841 ttgagggcct gcgaggtgat ggacgcggcg gtgtcggagg ccaggtagcc gacgaggccg + 12901 gcgacctcct cgggggtgga gtagcggccc agggggatct tcgcctggaa cttctcgagg + 12961 atggcgtcct cggaggtgtc gtaggcggcg gcgtatccct ggcgcacgcg ctgggccatc + 13021 ggggtctcga cgtagccggg gcagaccgcg ttgacggtga tgccggtggg ggccagctcg + 13081 ttgcccagtg ccttggtgaa gccgacgacg ccgtgcttgg acgccgagta cggggcgccc + 13141 aggacgacgc cctgcttgcc cgcggtggag gcgacgttga tgatccggcc gcggtccttg + 13201 gcgcgcaggc cgccgatggt cagggcggcg cgggtgacgc ggaagacgct gttgaggttg + 13261 gtgtcgatca cgtcgtccca cagctcgtcc gcgatgtcgg cggtggggcc gccgccggag + 13321 
cggccggcgt tgttgacgac gacgtcgacg ctgccgaagc ggtcgacggc ggcctggatc + 13381 caggcgttga cggactcggt gtcgcggacg tcgacgaccg tgccgtccgc gtcgatgccc + 13441 tcgccctgga gttccttgac ggtggcggcg acgttctcgg cgttgcgggc gccgatgaag + 13501 acttggtggc cctgccggcc gaggagccgg gcggaggcca ggccgatgcc gctggtggcg + 13561 ccggtgacga cggcgacgcg ctgggtggtg gtgtcggtca tggtggggct ccttcaggcg + 13621 gccttggcgg gcgcgagctg cgcgttgacg acctcgatga agctgcgcgg cgtgttggcc + 13681 tcgccgacgg cctcctcgtc cagggagatg ccgtactcgc gctcgatgag gctgccggcc + 13741 tccagcaggg cgagggactc gtagccgatc acctcgaact cggtgtcgag gatgtcgccg + 13801 tccaggtcca cgccctcggc gacgcccgcg gcctcccgca gggtgcgctt gaggtcgtcg + 13861 agggtgaagg acttgctggc catggtgggt cctttcgtca gtacgtggtg gcggttgcgg + 13921 tgcgtcggtc gggcggtgtg cgggggtcct caggcggcgc gcacgaccat ggcggagttg + 13981 aagccgccgg ctccccgggc caggaccagg gcggtgcgca gctcggccgg gcggggttcg + 14041 cccaggacca ggtcgagggg gtagtcggcg cacgggtcga tgtgcacggt gggcgggatg + 14101 acgccgtcgc gcagggcgag gaacgcggcc gccaggtcca ggggcgcgcc gccggagtac + 14161 aggcgcccgg tcatggtctt gggcaccgtc accggcacgc cccggtcgcc gaagaccgtg + 14221 ctgacggcgc gggcctcggc gaggtcgccg gccgggtcgc cggcgccgtc ggcgaagacc + 14281 acgtcgatgt cggcggcgtt cacgtcggcg tcggccagtg ccgtctcgat ggccttggcc + 14341 aggttgggtt cgcgtccgct gccgggccgg gggtcgatgg tggctccgta gccggcgatc + 14401 tcgccgtagg ggcggacgcc gcgggcgcgt gcggcgtcgg cgtcctcggc gatgaggatc + 14461 gcgccgccct ctccggggac gtagccgttc gcgtcgcggt cgaagggcag gtaggcgtgg + 14521 tcgggttcgt cgctggtggt gagccggccg caggccagct gggccaccca gccccagggg + 14581 cagatggagg cgtcgacgcc gccggtgacg atcagcgggg tgccccggcg gatctgccgg + 14641 cgggcctgcg cgacggcgtc caggccgccc gcgccttcgc tgacgacgac gccggagggg + 14701 cccttcatgc cgttgcggat ggagatctgg ccgctgttga cggcgtagaa ccaggcgaag + 14761 gactggtagg cggagacgta ctggctgccc tggctccaca gggcctgcag ttcgccctgg + 14821 ccgaactcga agccgcccgc ggcggaggcc gtgatgacgc ccatgtcgaa ctcgggcagg + 14881 tgcgcggggt cggcgccggc gtccgcgagt gcccagtcgg cggccaccag ggccagccgg + 14941 
gtgacgcggt cggtctgcgg cagcagccgg ctgggcagca gttcctcggc gtcgaagtcc + 15001 tcgatctgcc cggccagacg ggccgggtag ccggtggggt cgaagcgggt gatgcggccg + 15061 atgccgtgct tgccgcccag ggtggccgcc cagtagtcct tcacccccat gccgttgggt + 15121 gagacgacgc ccaggccggt caccaccacg gaggcggtca tacgaggctc ctttcggggg + 15181 tggcgagcac catggcgctc tggaagccgc cgaatccgct gccgaccgtg aggaccgcgt + 15241 cgatcagctg gtcgcgggcg accaggggca cgtagtcgag gtcgcactcg gggtcggggg + 15301 tgtgcaggtt ggcggtgggc gggacgacgt cgtactccat ggcgagtgcc gaggcggcga + 15361 tctcgatgga gccgatcgcg ccgagcgagt gcccgaccat cgacttgatg gagctgaccg + 15421 gggtgcggta ggcgtggtcg ccgaggctgc gcttgaacgc ggccgtctcg tgccggtcgt + 15481 tctgcttggt gcccgagccg tgggcgttga tgtagtcgat ggactgcggg ttcagccggg + 15541 cctcgcccag ggccaggtcg atcgcctcgg ccatctccac gccgtcgggg cgcaggcccg + 15601 tcatgtggta ggcgttggag cgggtggcgt agccggcgat ctcggcgtag atgtgggcgc + 15661 cgcgcttgcg ggcgctgtcg agttcctcca ggacgaagaa ggcggttccc tcgccgagga + 15721 cgaatccgtt gcgggtcttg tcgaacggcc gggaggcgca ctcgggttcg tcgtggcgcg + 15781 gggtggtcgc cttgatcgcg tcgaagcagg ccatggtgat cggtgagatc ggcgcgtcgg + 15841 aggagccggc gatcacgacg tcggccgatc cctcgcggac cagttcgacg gcgtagccga + 15901 cggagtcgat gccggaggtg cagccggtgg agaccaccgt gctggggcct tcggccccca + 15961 ccgcccaggc gacctcggcg gcgaaggagc tgggcaccat gtagtcgtac aggtgcggga + 16021 ccgcgtaggt gtggtcgacc gtgtccagcc gtcccccgtc gctgaccacc cggtactcct + 16081 ggtccaggcc catcgtggcg ccgacggcgc tgccgacggt gacgcccacg cggtgcgggt + 16141 ccagggaggg gatgtcgagg ccgctgtcgg cgacggcgcc gcgcgaggcg acgacggcga + 16201 actgcgcggc ccggtccagc cggcggacct cctgcggggt caggccgtgc tcgtaggggt + 16261 cgaagtccgc ttcggcggcc acccgggagc ggaagggggc ggggtcgaag aaggtgatgc + 16321 cccgtgtcgc ggtacggccg ttgctcagca ggttccagaa gttctccctg ccgacaccgc + 16381 cgggggcgat cacctcgatc ccggtgatca caacgcgtcg cccgctcaac gggaggcctc + 16441 ccagctgtag aagcgcgtgg ccatcgcgtc ggccggcgag cgccaggtcg tggggtcgta + 16501 ggcctcgatg aagggcttga ggtcctcgct gatccgcacg aagcgcgggt cggccttggc + 16561 
ggcctcgatc agttcaccgc cgttgtcctc gtcgaagtcc tggaggtgga agtacaggcc + 16621 ccggtaggag aagagctggc ggcgccgtgt gcccatgcgg tgcggcatct cggtggcgtc + 16681 gaagtcggcg aacaactggg ccacgtcgtt gctcgaggtg gccgccatcc gggcgacgat + 16741 cagcgtgctg tgcataggga ttagctcctc ggcggttgcg cggaagggtt ctcgaagcgg + 16801 gcggaccggc ccggcccggc ggcccggggg gctgcggcgc caccgccttc gacggtgcgg + 16861 cctggcggta gcgccccgca cggggcctgc ctgagtcccg cctgagccga agcggcgggt + 16921 gcacacgagc acgccttcgg gcctgcgccc ccgggtgccg gggacgaggt ccgaaggcgt + 16981 gcgggtcccg tgcgccgtcc ggcgcgccgg gctcactcgc cggcagagcg cgtgtgcacg + 17041 acccggtagg tgttgaggta gggctcgccg gtgacgacgg cgcggacgcg ggccacggcg + 17101 gccttgcggg cgtcggcctg ctcctcgggg gcctggtcgc ggtagacctc gaaggcctcc + 17161 ttgctgtccc actgggagta ggagatgacg aaggatccct ccaggccgcg ggcgcgcaga + 17221 cccctgagca cgacgtgggc gcggaagccg ggcacgtcgg cgaggaaggc ctggccgggg + 17281 ccgagggcgt ccacggcctc gtcctgcccc tcgggggtga ccgggaagag ggtgaagacg + 17341 gtgtagtcgt cgcggtccgg gccgatctcg atcttgccgc cgagggcgtc cgaggtcagc + 17401 gtgtgggcga cctcgttctg catcagccgg atcgaggtgg tgatctcgcc gaagaccggg + 17461 agcgtgcggt gcttgaactc ctcgcccgcg tagcgcttct cgaggtcctc gccgctgcgc + 17521 cactggatga agttgagggt gccgtagccg tcgacgcccg agtggacggt ggaggacatc + 17581 cagccctcgt acgcggccgc gttgacgatc ttcgtcatct cctcgatcag cttggcctgc + 17641 ttctcgggag tgtccgtggt gaacaggttc aggacggtga ggtgcttgtc ctcggcggag + 17701 atgatgggca tgggtccttc gctttccttg gtgggtgcgg tggatgtcgc tgcgcggccc + 17761 gcgacggtca ggcgctgggg ccgaaccagc ggccgagggc ggcggtgaga ccgtccggcc + 17821 cggcgccgag gccggcgacc caggcgacgt agccgtcggg gcggacgagg atgccgtcca + 17881 cgggggcctc gcagccgtcg aactcggccg cgacgaggtc gacccggtcg gcccagccgg + 17941 cggccgcggt gcgcaggccg tggtcgcccc cgagttccag gagcacgggg cgtgcggtgc + 18001 gcagcagcgc gtagaacggg gtcttctcac cgtcgacgac cagttcccgg tccggcaggc + 18061 gccggccgag cagggggtgg tcgccttcgc cgacgtcgtg ccggatgtcc aggccggtga + 18121 ccatgccggc caggtggcgc tggacggatt cgtgggcgcc catcagctcg gcgagcacct + 18181 
cgcgcatcgg cgtgatctcg tcgccgccga ggtagaggat gcgctgggcg agggtgttgg + 18241 tcaggatgcg ggccccgacg gggtggcgct cggcgtggta ggtgtcgagc agcccttcgg + 18301 gcgcctggcc cttgatgtcg agggcgagct tccagccgag gttcacggcg tcctgcacgc + 18361 ccgcgctcat gccctgcgcg ccgatcggca ggtggatgtg cgcggcgtcg ccggccagga + 18421 agacgcggcc gtggcggtac cggtcggcct ggcggctgac gtccgtggtg gagctgaccc + 18481 acagcggggt ggcgccgctg acgtcctcgc cggtcaggcg ctgccaggtc tgggcgacct + 18541 cgtcgaaggt gatcgggtcc gggctggtgc gcagcggctc ggagctgtcg aagtagatga + 18601 cgcggcagcg gtccgggccc atcgggatga ccatgaccat gccgccggcg acgcgctccc + 18661 cgctgaaccg gggccgcagc gccactccgg ccaggtcggc gaagcgcagc tcgatggccg + 18721 gctcggtgcc ggggaagccg atgcccgcga gcttgcgcac gatgctgcgg gcaccgtcgc + 18781 agcccaccac gtggcgggcg cgcagggaga aggggccgtc ggcgcccgcg gcggtgacgg + 18841 tcaccgaggc gtcggtctgc tcgatgcccg tgacctcgca cccgcggcgg atgtcggcgc + 18901 ccagctcgcg cgcccagccg cccaggacgc cctcggtgcg ggcctgcggg atgccgcgcg + 18961 ccccgtacga accgccctcg atcacccggt agtcgagcgg gacgccgccg aagtggccga + 19021 ccgggatgac tccgacctcg ccgaaccggt ccatcagccc gcgctgcgcg aattcctcga + 19081 tggtccgcgc cgagaaaccc agggcgcggg attcctgaat cggctcggaa agtttgtcga + 19141 gaaccaccac cgagactcca gcgagcctca attcacctgc gagcataaga ccggtgggac + 19201 cggctcccac gacaatgaca tctgaatcgt agaattccat ctgccctctt ctcactggtg + 19261 ttccatcaat agtgcgaggg cttacgaggg ctgtaaatag gcgttgttac aggtcttgtg + 19321 cagtcaatgc cagaaaaacg tctggtacgt cagagcttcg acaagcggtc ttgccccggg + 19381 cgcgtcgggt gacggcattc tctggcatga cctccagtct gacgaccgat caatccgcat + 19441 ccgtgtccgc cgccgagtcg agcgcacagg tcgccggtct gctgcaccgg tatctggtct + 19501 cgctcgacga cgagcggctc gacgacgcct ggaccgccgg cctgttcacc gaggacgcgg + 19561 tcgtcgcgtt cccggtcagc cggcacgagg gcgccgacgg catggccgag taccaccggt + 19621 cggcgctgtc ggcgttcgcg gccacccagc acctcggttc tccggccgtg gtcgacgtgg + 19681 acggggaccg ggccgtgttc cgggcgaacc tgatctccac ccatgtgcac cacccgcgcc + 19741 acacgcctcc cgagggggac ctgcccccgc tcttcgcgac gggcacgttc gtgaacggcg + 19801 
aggcgcgccg caccgcgcgg ggctggcggc tgagcctgct ggccttccgg ctgctgtggg + 19861 cggacggctc ccctcccccg gcccggtgac cccggccgcg gtgcggtgac cccgagccgc + 19921 ggtggggcga ccgcgggcgc ggtggggtga ccccgagccg cggtggggtg accgcggccg + 19981 tggtgcggcg gcgccgggcc gggggagggg agccgcgccg cggtacacgc gcgtgccgcc + 20041 ccggacgcgg tccggggcgg cgggggcggt gggggtggtg gtgcggagcc ggcggggcag + 20101 gcgttcaggc gttcaggctc aggacgcggt cgaccgcgat ctcgatgacc acccggtcgg + 20161 acggggtcgg cggggcggac cagtaccgct tggcgtacag ccgtgccccg agcgccaccc + 20221 gttcggggtc ggtcacgacc gtgccggtcc cctccagcgt gacccagcgg aagccgtcca + 20281 cctggcagag cgccaccggg gcgccgggcg tggccagcag gttgcgggcc ttgcgggagg + 20341 agcgcaccgt catcacccgc gcgagctggg cgtccgcgtc ccaggtgaag cgtacggggg + 20401 ccacgtgcgg tgtgccgtcc ggccgcatcg tcgtgaacgc ggcgacgagc gccgtaccgg + 20461 tcaggaacgc ctggacggag tcgggcaccg tcacggcgtc cgggcgcggc atcgacggca + 20521 tgggcgggtc ctcgcttcca gagggtgttg cgtgcgtggg cgcttcccgt gctccgggcg + 20581 gctgtcgcgc gggcgtcggg ggcggccgtg ggtccggggc cagcttgccg ggggccgctc + 20641 gaccctcgct ggacccggct ccccccgccc ggcccgccgc ccgcctccgc cgtgcgccgt + 20701 gtgtcatgcg ctgtgctccc gtgggtcgtg cgtcgtgcgt cgtttcgggt gtccgggcta + 20761 gtcgatgctg cggacgatga cgcgtccgtc ctcgtcctcg cgctcctccg cgcccgccag + 20821 ccgcaggggc ggcgggccgc cgtggaccgc cctggcgcat cgggccgtgt caccctcgtg + 20881 ccgttcgtcg tcgccttcgt gcatgggcac ctcctcggtg atcggtcggc ccagagtgtc + 20941 aagggtggct cgcggcccgg tcgacggccg ccccggagga agtggagcgc ggccggagcc + 21001 aggacccggc cggtcgcggc ctcgagggcc gcggcgcgat gcgcggcagt gcctcaccgg + 21061 cgagcacgtc cagcacggcc ccgttggtgg tggcctcgtc ggtgccgggc agatgccgca + 21121 gcagccgggc gcagtgcccg gccagcaggc gggcgtcggc gtcggagatc cggttgcggt + 21181 cgtggtcgac gcagaaggtg aggcggccgt cgccgccggg acggaccagc agggcgacgg + 21241 gcaggtcggg gcaggcgccg tgcgccggtt ccggctccag cgcgatgccg gcgccggcga + 21301 gttcgttcct caggttgccc ggcgggcgcg gaaggctgtc caccgagacc acgctctgca + 21361 gcagttcccc gtcggggcag cggcccgtcc agcggtggat ccggcgggtg gagacccatt + 21421 
cgtaggcggc catgtccagc gcccggtccc gcagggccgt cagcagccgg ccgaccgtct + 21481 cgccggggtc cacgcggacc accatcggca ggcagttgcg cagcggcccg ggcagccgct + 21541 cggcgcagtc cagggtgatg ccgcggccgg agacggtgac gccgaagccc accgtcgcgg + 21601 ccccgccggg cccggccgcg cggtacagca gcagcgccca gaccgtctcc agggcgctgg + 21661 agtcgggtac ggcgcgcagg gcggcccagc ggtggagccg ttcggcctcg gcggggctca + 21721 gccgtacctc ggtcctgccc cggccccgct ggcgggtgcg cgggccgggc cgggcgggca + 21781 gcacggcgac cggcccgtcg ggcacggcgc cccgccagaa gtcccgggct ccagcggggt + 21841 cctgccgctg gagccagccc gcccagtcgc gcaggtcggg gcggcgctcg ccgccgggca + 21901 gctcgccgcc ggcgaggtag gcccggcaca gctcctgcat cagcaggcac acgctccacg + 21961 cgtccagcag cgcgtggtgg aaggtgagga ccacccgggt caccggcccg gcaccggccg + 22021 ggtcgtcggt gcgctccacg agggtgacac gcagcgggca ggggcggctg ggatcgaggc + 22081 cgcgccggcg gtcccgctcc agcagccggt cccatccggc gccgcccgca cggtggcgca + 22141 cgacgtcgcc gtgggcgtgc tcgtgcagga ccaggtgcgg ccggggcccc ggggccaggg + 22201 cggcccgcag cacgctctcg cggtcgacga ccgactgcca ggccgcggtg aaccgctcgg + 22261 tgtccagcgg gccgtgccag cgccagacga gctgctcgac gtggcgcccg gcgccacggc + 22321 gcccgccgaa gtcgcccagc aggtcgaggt ggggccacag ggccggtacg cccggcggac + 22381 gggccgtgcc ggggccccgc agggcacgcg ggcggctgtg ccacgccatg ggacgccctc + 22441 ctcgtcgctg cctcctcccg cacgggccgg ccgtgcgcac ggttctcggg gagcggcggg + 22501 ccccttgagg gggcgcggta ctcccccggc atcgtggcac cggtggctgc catgggcctg + 22561 acggcccgct gacgctgctc gcgaccgggc ggagaaacgc ttctgcagcg gtggggccgt + 22621 accggaacgc ccgctactgc tgtcccgtgt ccgtcatcgc cgacaggaac ccctggtcca + 22681 gcatggtccc cacggaggtg tccccggcgg tgctcagtcc ggcgttgtgg caggccacgc + 22741 tgagcaggaa gcggtccatg acggggtagg tggcgaagcc ccactcgtcg cgggtgaccc + 22801 ggctgccgtc gggtgcgctc agccggccct gccggaagcc gaactccttg aagccgaacc + 22861 gcagtccctg cccgagggct ttgctgtagg cctccttcag ggtccacagg cgcagtgcgt + 22921 gggcggtccg ctctccttcg ggcagttcgg ccagttcccg ggcctcggcc ggtgtgaaga + 22981 cctgggtctc gagcaggtcc agccgtacgg gccgctcggc cggttccacg tccaccccga + 23041 
tgcggccgat gcggctcagg ccgacggcca tgacgtcccc ggtgtggctc aggctcagtt + 23101 cgatctggtc gaagccgcgc aggtagggcc ggccgcccag ccggtaggcc aggtccaggt + 23161 actcgggcgg gacggccagg gcggcggccg ccgtgtactt gatcagcatg cgggaggcgg + 23221 cgaaccggta gcgcaccgcg gcgtcgcggg tacgccggta gcgctgccag tcgtcgccga + 23281 gcagttcccg cagccgcggg gtggtcagca cgctgggcag ccattcgctc cacgtcgtgc + 23341 agaccagtgc gttgccgtgc cggaagaggt cctcgcgcac cgcgggccag gggccgtggg + 23401 gccgcggcac gtgaaggggc gcggcacatg tgacccgctc catcgtcgtc tccctgcgtg + 23461 tggttctcgc cggcccgctc ccccgttggg gggggcgggc cgaggggggg cgtcttcccg + 23521 tgccgtctcg gtcagccggc cagtggggtg tcgtacaggt cgagactgcg gccgtgccgg + 23581 cagcgtccca gcgcctcggc caggaccgcc tgttccgcgt ccgccggtgt ctcgggtacg + 23641 gcgatgccga gtctgcggcc gatgcggctg aggacgagca ccgcccaggc cgggtcggcg + 23701 aggaagccgt caccgtccgc ctgtccctcc cagaccccga ggcaggcggc ggcgcacagc + 23761 agcagggcgt agcggtcggc cagggcgcag gccagcgggt cgaacacggt gctcccggcg + 23821 gccggcaggg ccgcgcagcg cgcgcgcagc acccgcagct cctccaccag ggcgcgggcc + 23881 agcgcggcga gggcggcgtg cagtggttgt gtccccgtcc gtgcggccag ccgttcggcg + 23941 gccccgatca gggtggccgt gagcgggtcg tcggtcccgg agtgtgtcag cctgcggtgg + 24001 tcgagcggtg gcagcggcgc gcccggcagg aacagtgcgg cgctcggttc ggcggtccgg + 24061 aaccatgccg tgcgtgccag ggccggcagc tggggtacga gcaccgcctg gcagacggcc + 24121 gttcccgagt ggccgagtcc ggccacgggc aggtcgcggg cgagtttctg gaagccgccg + 24181 tacagcgggc cgcggtcgta gccgcgggcg ccgagcacgg cggcgagttc ttccaggtcc + 24241 tcgcgcagca ggtccggcat ggtgtatttg accgccgccg cgagcagatg ggcgtgctgg + 24301 ggtacgaggc tgagcgcccg cagtcccgtg acggccatgg cgtcgcaggc gagcaggtcc + 24361 gcgaagaccc cgctgagtgc cttgtgccag cggcgggcgg gccgtccgtc gggccggttc + 24421 tcggtggcgg cgcgcaccgc gagccgcagg acgctgtcca cgcccgcgag caccgtgccc + 24481 gggatgaggc agtggctgat ctggaagctg cgcagggcca gggtgacgcc ctcgccgagc + 24541 gagccgacca gggcgctgtc gggcagtcgt acgtcggcca ggcgcagtcc gtggaagcgt + 24601 gctccgcgca tgccgggcat ctccacccgc gccagccggc gcacttctcc ggaggcgggt + 24661 
ggtccgggca gcaggagcac cgagtggctg gcggagccgg agccggcgga ggtgcgggcg + 24721 tagacgacga aggtgtcggt gcggtcggcg ttcatgacgg cgtccttgct gccgttgagc + 24781 aggaagccgc cgcccgcagg gcgttgtgcg cggacctcgc ggcgcaggat ggcgttggcg + 24841 tgtgccacct cccggtgcac gatcgcgacc cggcctccgc cgagcaggac gtccgcgagg + 24901 gccgcgcgct ggtgggggtc gcccgcggtc cacaccgagg acgcggcgaa cagcgaggtg + 24961 atgccgaagc cgtagccgag ggccaggtcg cggcggaaga gcgggcgcag cacgcgggcc + 25021 agctcttcga ggtccctcag gcgtccgccg aggtcgtggg ggacgaactc ggcggacagg + 25081 ccgtgctcgg tcaggagcgc ctcggtggcg tgtggtgcct cgcgggtgtc gtcggcccgg + 25141 accagggcga ggtgtccgtg cgggttggcc gggtcgaagg ggtcgccgag cgcggcctcc + 25201 agccgggcgg cgcgctcggg ttcgggtgcg cgggcggcgc gctcgcattc gggtgtggga + 25261 gtggtgtgtt cgggttcggg ggcgggtgcg cgggtggtgt gttcgggtgc gggtgtgggg + 25321 gtggtgtgtt cgggtgcggg tgtgggggtg gtgctgcgcg gggcgggggt ctgccccgtc + 25381 ggcccggcgg ccgtgtcgag ggcggcggtc acaggacccg caccgcgtcg gaggcgtggc + 25441 gcacggcgtg ctccagcagg cggcggccgg cccggccgac ctcgtcgcac gcccgccggg + 25501 cggcgtcctg gtccagtgcg gcgtcgtcgt tgagcagcac gtcgtgccgc acggtgacgt + 25561 cgaggccggc tccgggctgg ggctcgatgg tccactcgcc ggtgtacgcg gccagcggtc + 25621 cggatgtgcg ggtgtgtttg tgcacgaggc ggccggcggc ggggaagctg atgcgcaccg + 25681 cctcgccgcc ggtggccgac cggccgtcca gggcgaggac ctggatgccg ggggtgtcct + 25741 cctgcaccgt cagggggcgg gtgccggcga ggtcgtcggg ccagtcgccg gcccggtaga + 25801 ggaagtcgaa gaccagctcg gcgggcacgt tgacccggac ggtgtcctcg aaggacatca + 25861 cgaggtcgtc cagccgggtc cagcgctcgg cgagccaggc caggcgctgg agctgggcgc + 25921 ggctgttggc gcgggtgacc cgctcggtcc aggccgcgtc ggccggagcg tcgccgacga + 25981 cggtgaaggc gtgttccagg gtcacccggg agccgtcgcc caggggctcg acggtccaca + 26041 ggccggtcat cgtctcgacc ggggcggagg gccgttcctg gcggaactcc acccgccgct + 26101 gtccgacgtc caggcggcgg tgggagaccc aggagctgat ccggtcgccc gccacggccc + 26161 acatgcgcag ccgttcccgt gtcccgtcga agtccagttg ttccacgtgg acgctgggag + 26221 ggaagaacag cggccacacg gtggcgtccg cgatcaggcc gtagagcact ccgctcgggg + 26281 
ccggggccgt catctcacag gcagtacggt gcactcgcgc atccggcatc gtccacaccc + 26341 tccgtcgtcc aaggcgtcgc cgccgggccg gtccccgctg ggccgcacgc gtgccgggtc + 26401 caccgggggc gggccggtgc ggccgggccc gtcgtactgc ggcttttctc gaccctgtcc + 26461 ggaaccgcta gggatgtgcc ggtagcgcgc tcgtgtcccg ctggagcggc gcccaggggc + 26521 acgcgctcca gcgggaaccg tcgggtcctc gagcccggtg accgacggtg gcctgcggcc + 26581 ccagaaacga tccgggaggt ggcagggatg aggcgcttcc gcccgcgccg atgcgtccgt + 26641 ggcctgtggg agggtctggt cgcctacggg cggctctgcc tggccggcga gacggaccgg + 26701 tacgaccacc ctccgcgccc gcggatccgg tggcaccggc cgccgccggg acacccggaa + 26761 cgggtgcgcg acgacatgcc tctgaccgac ctggagcggc gcctggcccg cgaactggcc + 26821 gacgaggacc acgacgtccg ctaggcgggg acgccaccac gcgtgccgcg ggcggggcgg + 26881 cggaacgccg ggcagccggg agagacggaa ggccgggggc cgggagccgg gaggccaaga + 26941 gaccgggaag gccggaaggc caggggcccg ggaggccggg agcccgggag ggccgggagg + 27001 ccggaagggc cgggaggcca ggagccggaa ggccgggagc ccgggcgggc cggggagcca + 27061 ggagggccgg ggagtcggcg ccgggggtgt ttccctttgc gcggtccgcg gggccgcggg + 27121 ccgttcctgg ccgccggtgt gttccgctcc gtctcgttag gggcgggccg tcactgcgtc + 27181 tgaggggcct ggagcactgc ggcggagttg aagccgcccc gtccgcgggc cagtaccagc + 27241 gccactcgca gccggggcag ttcccgtggg gctccggtga ccaggtccag cgggcagtcg + 27301 tcggcgacgc gtccggttcc ggtggtcggg gggacgactt tctcgcgcag ggcgagcagc + 27361 gcggctgcca cgtccagggc cgagccgccc gcgcccagcc gcccggtcat cgtcttcggc + 27421 acggtgaccg gtactccgta gggtccgaac agcgcgcaca gcgcctggct ctcgacgagg + 27481 tcggcgcgcc gctcggcggc gccgtcggcg aagaccacgt ccacgtgttc gggggccagg + 27541 ccggcgtcgg ccagggcgag ttccgcggcc tggcgcagtg tggggcggtc ggggccgtcg + 27601 aaggtggcgg cgcagccggc gatgacgccg tagccggtgg cgccccggcg ggcggcggcc + 27661 cgggcgtctt ccaggacgag cagggcgccg ccttcgccga ccgcgtggcc gtcggcggtg + 27721 gccgcgaagg gccggtaggc ccgggcgggt tcggtggcgg ggctgagccg gccgtccgcc + 27781 aggtgtgcgg cccagcccca tgcgcacagt gtggagtcga tcccgccggt gaccatgagg + 27841 catgccccgt cgcggatccg ccgccgggcg cgggcgagtg cgtcgatgcc gccggcctgt + 27901 
tcgctgacga cggtcgagcc gtggccgcgc agccggtgcc ggatggagat ctgtgcgggg + 27961 gctgccgcgt ggaaggacgc gaaggactgg taggcgctga cgtgctgggc gcctttgctc + 28021 cacagtgcgg ccagtccccg ttcgccgaat tcggcgccgc ccgcggagct ggcggtgatc + 28081 acgccggcgc cgtatgcggg caggtcggcc gggctcacgt tggcgtcgcg cagtgcttct + 28141 tcggccgcga ccagggcgat gcgggtgccg cggtcggtgg agggcagcag tctgctgggg + 28201 atgtggtcct cgtcgacgaa gccggggatc tcgccggcga tgcgtacggg gtagccggag + 28261 gcgtcgaagc gggtgatggg gcccagtccg gtgcgcccgc acagcacggc gtcccaccag + 28321 gctctggtgc ccaggccgtt gggtgcggcg actccgatgc cggtgaccag ggtctggcgg + 28381 gggccttcgg cgccggcggg ggtgggggcg ggtcgggccg gttcgggggc ctgggtcgcc + 28441 ttggtcatgc ggcctccttg agctgtggcc gggtgaggac ggcggccgtg tggaagccgc + 28501 cgaagccgct ggcgacggtg aggacggtgc tggtgcgctg ttcccgggcg aacagggggg + 28561 tgtagtcgag gtcgcaggtg gggtcgggtt cgtggaggtt ggcggtgggc gggacggtgt + 28621 cgtgccggat ggccagggcg ctggcggcca ggtccagggc gccggcggcg cccagggcgt + 28681 gcccgatcat cgacttgatg gagctgacgg gcacgcggtg ggcgctgccg cccaggcttt + 28741 ccttgagggc gtgtgtctcg tgccggtcgt tgtgccgggt tcccgcgccg tgggcgctga + 28801 tgtagtcgac gtcggcgggg ttcagccgtg cctggtcgag ggcggcgcgg atggcgtcgg + 28861 ccatctccag tgccccgggg cgcagtcccg tcatgtggtg ggcgctgctg tgggcggtga + 28921 tggcggacag ttccgcgtag gggcgggcgc cgcggcggcg ggcgtgttcg agttcttcca + 28981 ggaccagtac ggcggcgccc tcgccgagca cgaatccgtc gcgggtgcgg tcgaaggggc + 29041 ggctggcggt ggcggggtcg tcgttgcggg agctggtgag gcgcaggcgg tcgaagcagg + 29101 ccatggcgat gggcacgatg ggtgcttccg ttccgccggc gacgacgatg tcggcgctgc + 29161 cttcccggat caggtcggcg ccgtggccga cggcgtccag gccggaggtg cagccgctgg + 29221 agacgagggc gacggggccc tgtgcgcccc ggtcgcgggc gacggtggcg gccagggagc + 29281 tggggacgaa gtagtcgtag agggattcgg cggcctcggt gtggtcgagg gtccaggtgg + 29341 tgccgcagtc gctgaggatg gcgtactggg tggccaggct cgtggtgcag ccgatggcgc + 29401 tgcccaggct gacgccggtg cgcagggggt tgcggccgat gcggtccgcg acgccgctgt + 29461 cggcgacggc ttcgcgtgcg gcgaccagcg cgaactgtgc cgcgcggtcc aggcgttcgg + 29521 
tgtcggcgag gtcgaatccg tgggcggcgg gggtgaagtc gacctcggcg gcgacgcggg + 29581 agcggtagcc gcaggcgtcg aagagggtga cgcggcgggt ggcggtgcgg ccgacggtga + 29641 gcaggtccca gaagccggcg gtgcccaccg cgccgggggc gacgacgccg atcccggtga + 29701 tcacgacgcg gttcaccggc cgcctcccgt gggcagcgcg gtcacgtggc cgcggcaggc + 29761 ccggccgacg tgctgggcca ggctcgagga gcttgcgaag aagtgtcccc cggcgacggt + 29821 gtgcagttcg atcaggttgg tggtccactg ctgccagtgg cgcagggcgg cgggtgcggc + 29881 gagcgggtcg tcgcggcccg cgaagaccag gacgggcacg tccagcggcc ctccggtgac + 29941 cgggtccagg gcggcgttgc gcagcgatcg ggccaggcgc aggtcgtcgc gcaggacggg + 30001 caggaaggtg cgccgccaca gtccgccggg ggaggcggag gcgcccggcg gcagggagcc + 30061 gatctcgtcg agcagcggca gcaggtcctc gtcgggcagg tccgccgcgt ccgccaggac + 30121 ggaggtggtg tgcgggggcg ggcaggcgcc gacggccagg aacagcgggg gcaggccgga + 30181 gtcggccagg gcccgggtga gcgtgtagcc gacgagggct cccatgctgt gtccgtagag + 30241 cgcgtagggg ccgcggcgtg ccgtctgcag caaggtcggc aggaagtcgg cgagcaggcc + 30301 ggcgcgttcg gtcaggcgtg gttcgcggcg gcggctgtcg cggcccggga gcggcagggc + 30361 ggccacgtcg atgccgggtc cgaccgccgc ggaccagccg cggtagctcg ccacgcccgc + 30421 tccggcgtgg gcgaggcagg tgagtgtgat ccgtgcggtg cccgcctcac ggtccctgga + 30481 gcgggaagcc atgcgtcgcc ctccttgtga acggtccggt ccggccccat ccgggcgggc + 30541 gccgccggcg tggcgcgtgc cacgcggtgc cgtcccggcg ccggtccggg gggtgggtgc + 30601 ccctgcgcac cgagcgtcgc ccgcgcggct cgtgcggcgc tcaaccccgc ggcgaggcgg + 30661 gcggcggcct cggcg +// diff --git a/tests/unit/data/bigscape/minimal_dataset/JK1_GCF_01/JK1.region01.gbk b/tests/unit/data/bigscape/minimal_dataset/JK1_GCF_01/JK1.region01.gbk new file mode 100755 index 000000000..d7febe529 --- /dev/null +++ b/tests/unit/data/bigscape/minimal_dataset/JK1_GCF_01/JK1.region01.gbk @@ -0,0 +1,3887 @@ +LOCUS Chromosome1 84281 bp DNA linear UNK 14-OCT-2019 +DEFINITION Bacteria strain JK1. +ACCESSION Chromosome1 +VERSION Chromosome1 +KEYWORDS . +SOURCE Bacteria + ORGANISM Bacteria Unclassified. + . 
+COMMENT ##antiSMASH-Data-START## + Version :: 6.1.1 + Run date :: 2023-02-06 17:22:58 + NOTE: This is a single cluster extracted from a larger record! + Orig. start :: 13276 + Orig. end :: 97557 + ##antiSMASH-Data-END## +FEATURES Location/Qualifiers + CDS 1..690 + /codon_start=1 + /db_xref="UniProtKB/Swiss-Prot:O33341 Putative glutamine + amidotransferase" + /db_xref="UniProtKB/TrEMBL:A0A399CHF0" + /locus_tag="JK1GL000010" + /note="GO_function: GO:0016787 - hydrolase activity" + /product="MULTISPECIES: gamma-glutamyl-gamma-aminobutyrate + hydrolase family protein" + /protein_id="ncbi_JK1GL000010" + /transl_table=11 + /translation="MAVTADATTVNWNIWGDVAVAVLPQPYLDKVTQAGGAPVLLPPLV + EAVESVMERVDALLMSGGADIDPALYGARPGEFVFPPHPARDAAELAALAVAERRGIPV + LGVCRGLQLISITRGGTLDQHLPEHSPAVPGRYEPRTIRVKPDSLLGGALGPSPTVYCH + HHQGIDKLGAGLVATAWSDDGVIEGAEAEDPSAPFLAGLQAHGELGEDTVALFEAFIEA + AKAGPRR" + protocluster 1..84281 + /aStool="rule-based-clusters" + /category="PKS" + /contig_edge="False" + /core_location="[47298:63009]" + /cutoff="20000" + /detection_rule="(t2ks and t2clf)" + /neighbourhood="35000" + /product="T2PKS" + /protocluster_number="1" + /t2pks_malonyl_elongations="8|9 (Score: 1286.8; E-value: + 9.9e-215)" + /t2pks_molecular_weights="acetyl-CoA_8 (Da): 414.403" + /t2pks_molecular_weights="acetyl-CoA_9 (Da): 456.440" + /t2pks_product_classes="angucycline" + /t2pks_starter_units="acetyl-CoA (Score: 0.0; E-value: 0)" + /tool="antismash" + proto_core 34023..49733 + /aStool="rule-based-clusters" + /tool="antismash" + /cutoff="20000" + /detection_rule="(t2ks and t2clf)" + /neighbourhood="35000" + /product="T2PKS" + /protocluster_number="1" + /t2pks_malonyl_elongations="8|9 (Score: 1286.8; E-value: + 9.9e-215)" + /t2pks_molecular_weights="acetyl-CoA_8 (Da): 414.403" + /t2pks_molecular_weights="acetyl-CoA_9 (Da): 456.440" + /t2pks_product_classes="angucycline" + /t2pks_starter_units="acetyl-CoA (Score: 0.0; E-value: 0)" + cand_cluster 1..84281 + /SMILES="" + /candidate_cluster_number="1" 
+ /contig_edge="False" + /detection_rules="(t2ks and t2clf)" + /detection_rules="AfsA" + /kind="neighbouring" + /product="T2PKS" + /product="butyrolactone" + /protoclusters="1" + /protoclusters="2" + /tool="antismash" + region 1..84281 + /candidate_cluster_numbers="1" + /candidate_cluster_numbers="2" + /contig_edge="False" + /product="T2PKS" + /product="butyrolactone" + /region_number="1" + /rules="(t2ks and t2clf)" + /rules="AfsA" + /tool="antismash" + mRNA 1..690 + /locus_tag="JK1GL000010" + /note="MULTISPECIES: gamma-glutamyl-gamma-aminobutyrate + hydrolase family protein" + gene 1..690 + /locus_tag="JK1GL000010" + mRNA complement(992..2509) + /locus_tag="JK1GL000012" + /note="MULTISPECIES: NAD(P)-binding protein" + gene complement(992..2509) + /locus_tag="JK1GL000012" + CDS complement(992..2509) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A3R9UBU6" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1050:monooxygenase FAD-binding (Score: 497.4; E-value: + 8.3e-151)" + /gene_functions="biosynthetic-additional (t2pks) OXY + (Score: 492.0; E-value: 4.7e-150)" + /gene_kind="biosynthetic-additional" + /locus_tag="JK1GL000012" + /note="GO_function: GO:0071949 - FAD binding" + /product="MULTISPECIES: NAD(P)-binding protein" + /protein_id="ncbi_JK1GL000012" + /transl_table=11 + /translation="MAKGAIVVGAGPVGLMLAGELRLGGVDVVVYDKLPGPSGESRGVG + FTRRAAEVFEQRGLLERFGDVEWAQGHFGGVRIDFGKLDDNHFSVRGVPQFRTEEILEN + WLKELGVPVLRNHEVTGYRERPDGVVVEYEGPDGHGEDTAQYLVGCDGARSLVRTLAGI + DFKGWGATRGMYMADLVGAGVRQRPIGEKVPGGMVMAFNLENGVDRIVIHDENLRPPED + KSALRFTDIADAWQRMTGESLHHAEVRWISSFTDTTRQAEHYRSGRVFLAGDATHIHMP + AGAQGMSVGVQDAANLGWKLAAAINGWAPEGLLDTFESERHPVGEKLMRNTRAQTRLYL + TGDEMEPLRAVMRELVELPEAARHLAGIVSGVDIRYDMGPGDHPLLGLRLAPGHELLLE + DGGRTRVAELLHPARGVLLVTGAADDAARVRGAAAGWDDRVRTVVGEWAEPVTGDRPAA + VLLRPDGHVAWAAPDGVELLGRALERWFGRGRDTAGSRAHAVGAAGV" + mRNA complement(2542..3522) + /locus_tag="JK1GL000011" + /note="MULTISPECIES: alpha/beta hydrolase" + gene complement(2542..3522) + 
/locus_tag="JK1GL000011" + CDS complement(2542..3522) + /codon_start=1 + /db_xref="COG:COG0596 Pimeloyl-ACP methyl ester + carboxylesterase" + /db_xref="UniProtKB/TrEMBL:A0A399CRL9" + /gene_functions="biosynthetic-additional + (rule-based-clusters) Abhydrolase_6" + /gene_functions="biosynthetic-additional + (rule-based-clusters) PF00561" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1262:haloalkane dehalogenase (Score: 153.4; E-value: + 1.3e-46)" + /gene_kind="biosynthetic-additional" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000011" + /note="GO_function: GO:0003824 - catalytic activity" + /product="MULTISPECIES: alpha/beta hydrolase" + /protein_id="ncbi_JK1GL000011" + /sec_met_domain="Abhydrolase_6 (E-value: 2.5e-15, bitscore: + 56.4, seeds: 455, tool: rule-based-clusters)" + /sec_met_domain="PF00561 (E-value: 3.1e-22, bitscore: 78.2, + seeds: 48, tool: rule-based-clusters)" + /transl_table=11 + /translation="MTLNRRTMLALGTGATALAMTGTATAAHAREHTGSVPSDSELARS + LPGGFRSRCATVNGVRLHYVTGGHGRPLLLVPGWPQTWWAYRKVMPQLARTHRVIAVDL + RGMGGSDKPAGGYDKKTMAADLHALVRHLGHRQVDIAGHDIGAMVAFAFAANHPEATRR + LALLDTPHPDESEYDLRLLYRPGTGTALWWWAVNQLQQLPEQLMCGRMRHVIDWLFAHS + LADQNLVGEADREIYAHAYNSPQAIRAGTGWYQACHQDIADLAGYGRLTMPVLGIGGNF + TYEDLQRKLTAQATDVRMVRASKSVHYLPEEEPEVVAGALLDFFG" + mRNA complement(3561..4397) + /locus_tag="JK1GL000013" + /note="MULTISPECIES: NAD(P)H-binding protein" + gene complement(3561..4397) + /locus_tag="JK1GL000013" + CDS complement(3561..4397) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A454W167" + /gene_functions="other (smcogs) SMCOG1199:NmrA family + protein (Score: 213.1; E-value: 9.8e-65)" + /gene_kind="other" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000013" + /product="MULTISPECIES: NAD(P)H-binding protein" + /protein_id="ncbi_JK1GL000013" + /transl_table=11 + /translation="MTVLVTGSRGKVGSLLVQVLHERGVAVRAGSSNPEKLSLPAGTES + VRLALDTPADFAAALDGVDSVFLYAEPAAVDAFVAQAEKAGVEHVVIMSADAVLRPSAA + 
DDPIAAPHLAVEQALAASSLTSTPLNCGALAGNALPWAWSLKARGAVGLPYPDSHADPV + NERDIAEAACAVLTDPALRGRSYHLTGPQSLTFAEHVAIIAAAAGRDIPVERIPPQVWR + ANKPDFMPDDIADALLKLWAASTAPVPLTDHVEQLTGHPARPFTVWADQHAGAFRA" + mRNA complement(4636..6432) + /locus_tag="JK1GL000014" + /note="MULTISPECIES: monooxygenase" + gene complement(4636..6432) + /locus_tag="JK1GL000014" + CDS complement(4636..6432) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A454W161" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1050:monooxygenase FAD-binding (Score: 497.8; E-value: + 6.2e-151)" + /gene_functions="biosynthetic-additional (t2pks) OXY + (Score: 494.4; E-value: 8.7e-151)" + /gene_kind="biosynthetic-additional" + /locus_tag="JK1GL000014" + /note="GO_function: GO:0071949 - FAD binding" + /product="MULTISPECIES: monooxygenase" + /protein_id="ncbi_JK1GL000014" + /transl_table=11 + /translation="MTAAGSVTAAGSASARRRLEPSPTRLGRRHRPRSAAAAPAPRPPA + GTDTWSHAPPPPPAPPRPGPGPRRGGPLLRGPALRLQRRSIGEVFPGAWLPPRTRERFT + NDLREEYFMAKGAIVVGAGPVGLMLAGELRLGGVDVVVYDKLPAPSGESRGLGFTSRTA + EVLDQRGLLDELGEFRWGRHGHFGGVRIDFTLLEESHFGVMGLAQSRTEQLLGDWTARL + GVPVLRGREVTGFEETEDGVVVRYDGPDGPGEDHAQYLIGCDGGRSTVRRLAGIAFPGD + EATRGMYLADVTGADIRPRPIGERVEGGGMVLSVGLGDGYDRIVIHEPGVRPHHGEGTL + TFTEVADAWQRMTGESIHHGHTRWMTALTNATGLAEQYRSGRVLLAGDAAHDHAPLGAQ + GVSVGLQDAVNLGWKLAATINGWAPDGLLDTYHAERHPLGEQLLRNVHAQSLLYLSGEE + MEPLRAVMRELVRIPDAARYLAGQVSGLHIRYDVGAGEHPLLGLRLPLQRALQRADGTR + VRVAELLHEARGVLIVTGDPSTVHKTAADWSDRVDVVAGTWAEDGGPEAVLLRPDGHVV + WAAPDGGDVTDALTRWFGAAAV" + mRNA complement(6579..8087) + /locus_tag="JK1GL000015" + /note="MULTISPECIES: MFS transporter" + gene complement(6579..8087) + /locus_tag="JK1GL000015" + CDS complement(6579..8087) + /codon_start=1 + /db_xref="COG:COG2271 Sugar phosphate permease" + /db_xref="UniProtKB/TrEMBL:Q1RQU5" + /gene_functions="transport (smcogs) SMCOG1005:Drug + resistance transporter, EmrB/QacA (Score: 405.2; E-value: + 4.8e-123)" + /gene_kind="transport" + /inference="similar to DNA sequence:INSD:" + 
/locus_tag="JK1GL000015" + /note="GO_component: GO:0005887 - integral component of + plasma membrane; GO_component: GO:0016021 - integral + component of membrane; GO_function: GO:0022857 - + transmembrane transporter activity; GO_process: GO:0055085 + - transmembrane transport" + /product="MULTISPECIES: MFS transporter" + /protein_id="ncbi_JK1GL000015" + /transl_table=11 + /translation="MAASDATTARSASGAGLSPGLILAFVCMGQFMVFTDVSIVNLALP + SIQEGLGMSEVSLNYIVTAYATVLGGFLLLGGRLADTFGRRRLIQIGFVIFALASLTSG + LAENGTMLIASRAVQGFGAALITPAALAILTNTFAEGPERNKALGVWGSLSGIASIVGV + ILGGVLADTWGWEWIFWINVPIGLGAAVLAPRILPESKAEERGKFDTLGAVTLTAGLLL + LIFTLGEATTVGWDTFRTIGSLVGVVALLTAFVVIEAKVASPMMPLRIFRLKTMRVANI + SAVLVFGTFGSLFFFASLFMQQAFGYSPLKAGFAYVPLAFSVAAGAGIASGLVTKMAAR + PVVMMGLTLTVAGLLLMWRAPADGSYVVDLLAPFILLGLGCGMVFVTLQIAAFVGVTDE + DAGVGAGLINTSQEAGGALGLAVVATIAYSGMSTEMAATGGKPELIAEVHEAANHDAFL + SGAMLGTVALLVVTFLMPRGKQSMSSAPAEAGEGPALVKADAEK" + mRNA complement(8210..8947) + /locus_tag="JK1GL000016" + /note="hemerythrin domain-containing protein" + gene complement(8210..8947) + /locus_tag="JK1GL000016" + CDS complement(8210..8947) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A399CNC7" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000016" + /product="hemerythrin domain-containing protein" + /protein_id="ncbi_JK1GL000016" + /transl_table=11 + /translation="MSMSDPAQSPGARMYEEFVAIHAVLRRGTRLVVDAYERLADGHDT + DTATLVDAGRWLLAFTHAHHKAEDDLFWPVLEALYPDARAQLKELSDDHVVLDRRLNAL + ETAIDALDEATQAARATGGTDGARAGAEAARQVHQVLDGHLTAEEAVVEDLFPGVPADD + IDRLREAFVQGSPRFGLHFMFGLLDDPEPARGRDLLTENFPPQLRAAGPRLISQYEAGI + QGLRGGPGDDSGRPVTSAGPRSS" + mRNA complement(9126..10688) + /locus_tag="JK1GL000017" + /note="MFS transporter" + gene complement(9126..10688) + /locus_tag="JK1GL000017" + CDS complement(9126..10688) + /codon_start=1 + /db_xref="COG:COG0477 MFS family permease" + /db_xref="UniProtKB/TrEMBL:A0A429NHX3" + /gene_functions="transport (smcogs) SMCOG1005:Drug + resistance transporter, EmrB/QacA (Score: 417.7; 
E-value: + 7.5e-127)" + /gene_kind="transport" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000017" + /note="GO_component: GO:0005887 - integral component of + plasma membrane; GO_component: GO:0016021 - integral + component of membrane; GO_function: GO:0022857 - + transmembrane transporter activity; GO_process: GO:0055085 + - transmembrane transport" + /product="MFS transporter" + /protein_id="ncbi_JK1GL000017" + /transl_table=11 + /translation="MMTTVEDPASAAQGRPAGTSVRVLLIPLVAAMMLSQLDTMIVGTA + LPTVTAELGGLEHVSWVVTAYTLATAVSTPVWGRLGDVRDRKNVLLAAIVVFLAGSALS + GAAQDMGQLIGFRAVQGLGAGGLMAGVMAIVGELVPPRERGRYQGLISGAMAVAMIGGP + MAGGAVTDHLGWRWAFYLNLPLGALALAMIWRLLRLPRRSRVARVDTLGAALLTVGISA + TVLLTTWGGTRYAWDSAAVVLLAAAAGAALWAFVRRQARTADPIMPLHMFQVRNFTLMS + VIGFLTGFVMFGVLLFLPLYQQAVQGASATNSGLLLLPMLAALIAASLVAGRVTTVSGR + YKVFPVTGGALLCAGAWLLSRMDTSTSRPTAALSMAVLGAGLGCLTQTVTVVAQNSVEL + RDIGAASAAVTLFRTLGSCFGVAVMGTLFNREVLRVTAERAPGVPALDNARLDAQSLER + LEPALHEAYRHATAAGTHVAFLLCAGVGAAVLGAGLLVREVALRRAGQDTARPAVSRAP + GGH" + mRNA complement(10723..11481) + /locus_tag="JK1GL000018" + /note="MULTISPECIES: response regulator transcription + factor" + gene complement(10723..11481) + /locus_tag="JK1GL000018" + CDS complement(10723..11481) + /codon_start=1 + /db_xref="UniProtKB/Swiss-Prot:A0QTK2 DNA-binding response + regulator MtrA" + /db_xref="UniProtKB/TrEMBL:A0A399CJS4" + /gene_functions="regulatory (smcogs) SMCOG1008:response + regulator (Score: 157.2; E-value: 7.8e-48)" + /gene_kind="regulatory" + /locus_tag="JK1GL000018" + /note="GO_function: GO:0003677 - DNA binding; GO_process: + GO:0000160 - phosphorelay signal transduction system; + GO_process: GO:0006355 - regulation of transcription, + DNA-templated" + /product="MULTISPECIES: response regulator transcription + factor" + /protein_id="ncbi_JK1GL000018" + /transl_table=11 + /translation="MSAQTLPELRTSTSQLIRLVQDGTAPAPAAPAPGGRRILVVDADV + GPGDSLVTQLRRYGHEPVAVQCGGQALQAHADADLVLLALELPDLDGLEVCRAIRAVSR + 
VPVVIVTARQSELDCVLGLQAGADDYVTKPYGLRELMARIEAVMRRTHWQPAARRYIRR + GRLHIDVDSREVTVDGSGVALTRKEFDLLCLLASHPDTVIPRKHLLKQVWGDSWSQRTV + DTHVSSLRGKLGGSGWIVTVRGVGFKLGAG" + mRNA complement(11666..12070) + /locus_tag="JK1GL000019" + /note="MULTISPECIES: GNAT family N-acetyltransferase" + gene complement(11666..12070) + /locus_tag="JK1GL000019" + CDS complement(11666..12070) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A454W040" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000019" + /note="GO_function: GO:0008080 - N-acetyltransferase + activity" + /product="MULTISPECIES: GNAT family N-acetyltransferase" + /protein_id="ncbi_JK1GL000019" + /transl_table=11 + /translation="MNWTIERAEGKDLDLDEVLAVYRSSGLGERRPVEDRDRMKAMLTG + ANLVLVARDGDGALIGIARSVSDFSYVTYLSDIAVDGRLQRSGIGRALIDATRKEAPTA + KIVLLSAPAATAYYPHIGFTQHNSAWVLNP" + mRNA complement(12054..13340) + /locus_tag="JK1GL000020" + /note="MULTISPECIES: adenylosuccinate lyase" + gene complement(12054..13340) + /locus_tag="JK1GL000020" + CDS complement(12054..13340) + /EC_number="4.3.2.2" + /codon_start=1 + /db_xref="COG:COG0015 Adenylosuccinate lyase" + /db_xref="UniProtKB/Swiss-Prot:P74384 Adenylosuccinate + lyase" + /db_xref="UniProtKB/TrEMBL:A0A454W043" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1063:argininosuccinate lyase/adenylosuccinate lyase + (Score: 140.4; E-value: 1.5e-42)" + /gene_kind="biosynthetic-additional" + /locus_tag="JK1GL000020" + /note="GO_function: GO:0003824 - catalytic activity; + GO_function: GO:0004018 - N6-(1,2-dicarboxyethyl)AMP + AMP-lyase (fumarate-forming) activity; GO_process: + GO:0009152 - purine ribonucleotide biosynthetic process" + /product="MULTISPECIES: adenylosuccinate lyase" + /protein_id="ncbi_JK1GL000020" + /transl_table=11 + /translation="MIPRYTLPEMADLFADQSRYATWVKVEILASEAQAGLGRVPAAAV + EDMRRARVPLAARVAEIEKERDHEVLSFLAAYCEDIPEDSARWVHLGMTSYDLVDTALG + HTLARATDLLLAAARRLRATLVGKALEHWDTVMVGRTHGVHAEPTTFGHKLGVHAFAVD + 
RSITRLTAAREAVAVGTVSGSVGTYALIDPEVERHVCDALGLGVEPVPSQVVARDRHAQ + LMQAVAALGACIEQIALELRLLQRTEVREVEEHRTGAYQGSSAMPHKRNPTTSERLCGL + ARLLRGYADTALENVALWHERDLAHQSVERVILPDSLSVGHFQTVMAADLINSLTVRPE + RMRAHIDTTDGLIHSSAVLADLLARGVERERAYRGVQAAADHTLATGEHFAAGLAREGI + DVESLEPERFLTRHDVIRTRLETLRELDD" + mRNA complement(13437..14957) + /locus_tag="JK1GL000021" + /note="MULTISPECIES: glutamine synthetase" + gene complement(13437..14957) + /locus_tag="JK1GL000021" + CDS complement(13437..14957) + /EC_number="6.3.1.2" + /codon_start=1 + /db_xref="COG:COG0174 Glutamine synthetase" + /db_xref="UniProtKB/TrEMBL:A0A429NHX7" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000021" + /note="GO_function: GO:0003824 - catalytic activity; + GO_function: GO:0004356 - glutamate-ammonia ligase + activity; GO_process: GO:0006542 - glutamine biosynthetic + process; GO_process: GO:0006807 - nitrogen compound + metabolic process" + /product="MULTISPECIES: glutamine synthetase" + /protein_id="ncbi_JK1GL000021" + /transl_table=11 + /translation="MYARSWSSPAPDGSVGRPSFVTDHGLWDDERVAAAERVEAALDEV + DFVRLVFGDPHGLARSKTLTADAFRSVLRNGMNFSPGPFLFDTGHAVAVDFLGDHGIGV + DEIAGAGNFVLVPDPVTFQVLPERGPRTAWVLGDEYLRDGTPHPLSSRAVLRRVVNRYA + ALGLQPVLGLEVEWYLTRRLDDEPGNQGNGFGLQGQAPRVTAVNAGYQFNLDAAYDTVA + PITGPLGLHLRKLGLPLRSMEHESGPGQVETTFSPMTALDTADAMLLFRTVTKRFCARR + GHHASFMSQPRLDAADPSGWHLNQSVVDLATGRNLFSAEGLSGGLSPNGKAYAEGLLTW + ARELFLLSVPTVNGYRRLAAEHALAPTRLGWSFEDRTAMLRVVGSGAGAHIENRVGEPC + ANPYLNIAAQLFAGLEGLTAQPADPQTAPRGEAPTETQPQTVPQTLAEALDAFRTGRAD + QLLGAPLAACMTKLKESELGRFTAWSSQTAPAPGQVTDWEQREYFGVY" + mRNA complement(14962..16371) + /locus_tag="JK1GL000022" + /note="MULTISPECIES: amidase" + gene complement(14962..16371) + /locus_tag="JK1GL000022" + CDS complement(14962..16371) + /EC_number="6.3.5.6" + /EC_number="6.3.5.7" + /codon_start=1 + /db_xref="COG:COG0154 Asp-tRNAAsn/Glu-tRNAGln + amidotransferase A subunit or related amidase" + /db_xref="UniProtKB/TrEMBL:A0A429NHY2" + /gene_functions="biosynthetic-additional (smcogs) + 
SMCOG1105:amidase (Score: 416.1; E-value: 3.3e-126)" + /gene_kind="biosynthetic-additional" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000022" + /note="GO_function: GO:0004040 - amidase activity" + /product="MULTISPECIES: amidase" + /protein_id="ncbi_JK1GL000022" + /transl_table=11 + /translation="MTARGIRRTKELLSRRELTVVEHVQDVLAAVRERDHLGAYVAVAG + DEAIRAAARADELIRDRGREAWWDLPLLGVTVSVKDLLQTRDLPTTRGSLLPNGRPAQD + APAVARLRAAGAIVVGKTTTSEFGWSASTVGRLAPPTRNPYDPSRSAGGSSGGAAASVA + AGLCEGALGTDGSGSIRIPAAFCGVVGYKPSFGRVPYYPNGADRLAHQGPIAATVADAA + LLGQVIAGPHPTDPDSGLGSLDSPRDMRSLRIGWIEYEGTDPEIRRVTEAARDVLLDEG + HLVEEVQVRCHNLYPAVVDILAATEAAGTRPEDEELIDPGRLHVVRHGRTLSGVAVIQA + EEIRQNLRATLRSVMDDYDLLAMATVPVEPFDAGAIGPDWAADVRDLLWLAWAPASYPY + NMTGQPAASLPAGLTSSGLPAGVQLVGPVGADDLVLTVARRLEAMLPPLPQPPAAPPVA + ASTGTTGERTF" + mRNA complement(16491..18431) + /locus_tag="JK1GL000023" + /note="hypothetical protein" + gene complement(16491..18431) + /locus_tag="JK1GL000023" + CDS complement(16491..18431) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A3R9U297" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000023" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000023" + /transl_table=11 + /translation="MPERGESRRAANARKRISRRPSRLGLVAGATLKPDRVREADAGFP + GLLKRVWRRAEQTEDLRSFVEVLLTLDGHVPADVQLRALSAAEEAALAALCGLSWRATA + TAAPAARGDAAPATAAPGDGTSGDAEETVFSGEIALATSGRIVLRVPSAAPLKADGLVG + GVRRVPWTRATLDAYRAQLRRAEDRVARTVADCRGWLAEQGAEGRGELLEQAKEAALRT + APFVLYQQGRQYTNFRDHNTLTGKTLWPGHPDCALSSLQDLPLELWSDHDVQLVVCLTL + LIRSAGPGRVEEANGTQLTVDHVAHMLERIRVGYNAALGRDQVPPAASATVADLHELAV + SLRSHRGEVAREAQLYREIHGALMHKIEKVAGPCADLARAREDAVTARLTSRLPLRGDN + LAELGEALAAAPGWLAAPHGDFATGLEALVYESAAAATEAFEADFAMSRGMRSLPDLIT + ALREERWAEICDWEITRFFCCVVPDPSAARHFGDSTAALADAAWAMSSRMQYNSWHFIA + GNLPKAPEVVDRDHFVPPTIPDVAFYSDQHHHGHVNNNVRFSIRSPQSVVVDGRRFNGF + VDLRLLRCDGAPFGEQDLLAAHRVSAFTARATGLVAELAAAGEQIEVTAFDSPWHWSAV + TGGADPATRAS" + mRNA complement(18440..18766) + /locus_tag="JK1GL000024" + /note="MULTISPECIES: 4Fe-4S 
ferredoxin" + gene complement(18440..18766) + /locus_tag="JK1GL000024" + CDS complement(18440..18766) + /EC_number="7.2.1.2" + /codon_start=1 + /db_xref="COG:COG1149 MinD superfamily P-loop ATPase, + contains an inserted ferredoxin domain" + /db_xref="UniProtKB/TrEMBL:A0A399CKM6" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000024" + /product="MULTISPECIES: 4Fe-4S ferredoxin" + /protein_id="ncbi_JK1GL000024" + /transl_table=11 + /translation="MKKIASSAALSGRVERIAQRDRPDNWKKPPRRIEKSECITCDTCL + RSCPAEFGAIFDRGLDVVIIPELCSGCPACVLECPVDCIYVDEDWTPTDDAMWNHIELT + AKGA" + mRNA complement(18897..20342) + /locus_tag="JK1GL000025" + /note="alkaline phosphatase family protein" + gene complement(18897..20342) + /locus_tag="JK1GL000025" + CDS complement(18897..20342) + /codon_start=1 + /db_xref="COG:COG1524 Predicted pyrophosphatase or + phosphodiesterase, AlkP superfamily" + /db_xref="UniProtKB/TrEMBL:A0A429NFG1" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000025" + /note="GO_function: GO:0003824 - catalytic activity" + /product="alkaline phosphatase family protein" + /protein_id="ncbi_JK1GL000025" + /transl_table=11 + /translation="MTPTTSSGGPVPLLVLDVVGLTPRLLDHMPHLKRLGQSGSRAPLG + TVLPAVTCAAQSTFLTGTYPSEHGIVGNGWYFRELGDVLLWRQHNGLVTGDKLWDAARR + AHPGYSVANICWWYAMGADTDITVTPRPVYYADGRKEPDCYTRPAALHDELTDRLGTFP + LFHFWGPGADLVSSQWIIDATRHIMHTRHPDLTLCYLPHLDYDLQRYGPDDPRSHKAAT + DLDTALAPLLDDARAEGRTVVALSEYGITPVSRPVDINRALRRAGLLEVHTQDGMEYLD + PMASRAFAVADHQIAHVYVRRPEDLDATRAALDGLPGIETLLDDEGKKAHHLDHPRAGE + LVAVAEPDAWFTYYYWLDDARAPDFAQLVEIHRKPGYDPVELFMDPLDPYVKVKAATAL + ARKKLGMRYRMAVVPLDASPVRGSHGRLPASDDDGPLLICSIPRAVGDRVAATDVKQLL + LRLAGLESAAAREEPRPRTGTTV" + mRNA complement(20339..21514) + /locus_tag="JK1GL000026" + /note="TIM barrel protein" + gene complement(20339..21514) + /locus_tag="JK1GL000026" + CDS complement(20339..21514) + /codon_start=1 + /db_xref="COG:COG1082 Sugar phosphate isomerase/epimerase" + /db_xref="UniProtKB/TrEMBL:A0A399CJC3" + /inference="similar to 
DNA sequence:INSD:" + /locus_tag="JK1GL000026" + /note="GO_function: GO:0008270 - zinc ion binding" + /product="TIM barrel protein" + /protein_id="ncbi_JK1GL000026" + /transl_table=11 + /translation="MRFRHPDGSTVHLAYCTNVHPAETLDGVLAQLRDHCEPVRRRLGR + DRLGIGLWLAKDAAHALATDPSALRGLRTELDRRGLEVVTLNGFPYEGFGAEEVKYRVY + KPDWADPERLEHTTSLARVLAGLLPDDVTDGSISTLPLAWRTAWDETRADKARAALATL + GERLDALHELTGRSIRIGLEPEPGCVVETTHDAIAPLGAIGHDRIGICVDTCHLATSFE + DPHTALDALTAARVPVVKSQLSAALHAEHPSRPEVRDALAAFAEPRFLHQTRTTAATAG + LRGTDDLDEALAGGGPLPDTAPWRAHFHVPLHADPAAPLTSTLPVLKSALSRLVGGARP + LTRHLEVETYTWQALPAQLRPRGRAQLTDGIAAELMLARDLLTDLGLKELP" + mRNA complement(21518..22393) + /locus_tag="JK1GL000027" + /note="MULTISPECIES: hydrolase TatD" + gene complement(21518..22393) + /locus_tag="JK1GL000027" + CDS complement(21518..22393) + /codon_start=1 + /db_xref="COG:COG1099 Predicted metal-dependent hydrolase, + TIM-barrel fold" + /db_xref="UniProtKB/TrEMBL:A0A399CKK9" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000027" + /note="GO_function: GO:0016788 - hydrolase activity, acting + on ester bonds" + /product="MULTISPECIES: hydrolase TatD" + /protein_id="ncbi_JK1GL000027" + /transl_table=11 + /translation="MRIFDPHIHMTSRTTDDYEAMHAAGVRAVVEPAFWLGQPRTSPAS + FCDYFDALLGWEPFRAAQYGIAHHCTIALNPKEANDPRCTPVLAELPRYLVKDRVVAVG + EIGYDSMTPAEDTALAAQLQLAADHGLPALVHTPHRDKLAGLRRTLDVVRESALPTDRV + LVDHLNETTVKEAKDSGAWLGFSVYPDTKMDEARMVALLREYGPEKVLVNSAADWGRSD + PLKTRKVGDLMLEEGFGEDDVDRVLWRNPVAFYGLSGRLDLDVTATAPTHEGNSVLRGA + PAAEPLPTGA" + mRNA complement(22395..22994) + /locus_tag="JK1GL000028" + /note="MULTISPECIES: sugar phosphate isomerase" + gene complement(22395..22994) + /locus_tag="JK1GL000028" + CDS complement(22395..22994) + /codon_start=1 + /db_xref="COG:COG1082 Sugar phosphate isomerase/epimerase" + /db_xref="UniProtKB/TrEMBL:A0A399CHG5" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000028" + /product="MULTISPECIES: sugar phosphate isomerase" + /protein_id="ncbi_JK1GL000028" + 
/transl_table=11 + /translation="MTVVHTPPDADLPGEFAGLGTDARRWLTAARASATARDTDWELRF + AEAGRRCGTEHADAARVLLLAAARPDAETVTLLYHRGTAAERRAVLLALDGLDTEPAHA + LPLVEDALRANDTTLLAAALGPYAARHLDAHQWRHAVLKCLFTGVPVATVANLAARARA + DAELARMLRAYAAERTAAHRDIPADLDRVLALTQEQ" + mRNA complement(22991..23836) + /locus_tag="JK1GL000029" + /note="MULTISPECIES: TIM barrel protein" + gene complement(22991..23836) + /locus_tag="JK1GL000029" + CDS complement(22991..23836) + /codon_start=1 + /db_xref="COG:COG1082 Sugar phosphate isomerase/epimerase" + /db_xref="UniProtKB/TrEMBL:A0A454W1I9" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000029" + /product="MULTISPECIES: TIM barrel protein" + /protein_id="ncbi_JK1GL000029" + /transl_table=11 + /translation="MSPLRLGYGTNGLTDLRLEDALRLLADLGYDGVGLTLDHMHLDPL + APDLAARTRHVARQLHRLGLAVTVETGARYVLDPRRKHGPSLLDDDPDARWARVRLLIR + SVRVAADLGAHAVHCFSGPRPAGLDQDTAWKRLADALGPVLDAAEDTGVPLAVEPEPGH + LLATLTDFHRLRTELGDPEPLGLTLDIGHCQCLEPLPPADCVRAAAPWLRHVQIEDMRR + GVHEHLPFGDGEIDFPPVLDALAATGYQGLTVVELPRHSHAGPELAAQSMRFLRNGGTR + " + mRNA complement(23833..24789) + /locus_tag="JK1GL000030" + /note="prenyltransferase UbiA" + gene complement(23833..24789) + /locus_tag="JK1GL000030" + CDS complement(23833..24789) + /EC_number="2.5.1.39" + /codon_start=1 + /db_xref="COG:COG0382 4-hydroxybenzoate + polyprenyltransferase" + /db_xref="UniProtKB/TrEMBL:A0A454W1H9" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000030" + /note="GO_component: GO:0016021 - integral component of + membrane; GO_function: GO:0016765 - transferase activity, + transferring alkyl or aryl (other than methyl) groups" + /product="prenyltransferase UbiA" + /protein_id="ncbi_JK1GL000030" + /transl_table=11 + /translation="MSAQRPAHGPARDGHLHAWAELLRAPAAFTVPGDVLAGTAAAGTR + PTGRTALAAGASLCLYEAGMALNDWADREEDATARPHRPLPSGRVRPGAALAAAGLLSA + AGLALAACAGRRALAVAGPLAATVWAYDLGLKHTPAGPAAMAAARSLDLLLGAAAGPGA + VRRAIVPAAFLGSHTLAVSLVSRRETEGGSSTAPLTALAAAGALTTVLAGRPTAHPAPD + 
ASTGAPTPATPPADKAARAVRAALAASYAATFARPLAHAALNPSPELTQRAVGAGVRAT + IALQSGLMARAGAPGTGVLTAALAPLAAHLARKVSTT" + mRNA complement(24786..25901) + /locus_tag="JK1GL000031" + /note="MULTISPECIES: myo-inositol-1-phosphate synthase" + gene complement(24786..25901) + /locus_tag="JK1GL000031" + CDS complement(24786..25901) + /EC_number="5.5.1.4" + /codon_start=1 + /db_xref="COG:COG1260 Myo-inositol-1-phosphate synthase" + /db_xref="UniProtKB/TrEMBL:A0A454W1J4" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000031" + /note="GO_function: GO:0004512 - inositol-3-phosphate + synthase activity; GO_process: GO:0006021 - inositol + biosynthetic process; GO_process: GO:0008654 - phospholipid + biosynthetic process" + /product="MULTISPECIES: myo-inositol-1-phosphate synthase" + /protein_id="ncbi_JK1GL000031" + /transl_table=11 + /translation="MTSADETRTGVWLVGARGSVATTAVSGCAALAAGLLPPTGMVTET + PPFADCGLPALASLVFGGHDTATTPLPKRAEELAAQGVLPPWLPTAVQGELAAADEHIR + PGGPVPGDRRATEELIADFATDLRTFARTTGVARTVVVNVASTEPDPAHGAWPASSLYA + AAALRAGCPYVNFTPSTGLSHPQLAGAARASGLPYAGRDGKTGQTLLRSVLGPMFAQRA + LAVRAWSGTNLLGGGDGAALADPAAAAAKNAGKERVLTDTLGTRVEGEVHIDDVPALGD + WKTAWDHVAFDGFLGTRMVLQTIWQGCDSALAAPLVLDLARLLARAHERGLSGPLGELG + FYFKDPDAEGSALAEQYTRLLTLAGRLGGTR" + mRNA complement(26152..27273) + /locus_tag="JK1GL000032" + /note="ScyD/ScyE family protein" + gene complement(26152..27273) + /locus_tag="JK1GL000032" + CDS complement(26152..27273) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A429NH62" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000032" + /product="ScyD/ScyE family protein" + /protein_id="ncbi_JK1GL000032" + /transl_table=11 + /translation="MANSRNSWTKILLAAGAAGAVAVPLTAGPVQAQPQAHRHGHTHTH + TRTEATVTVVASQLNNPRGVTALGDGGVLVAEAGAGLADCPVDQTCVGTTGSVYKVKGS + FQGRVATGLASTAKGVAPGAPISANGPSDVVPDRFGGYVVVSGLGGTTESRAALGEGAQ + TLGTVFRTRDHKVLADLTDHETRLNPDGGDVHANPWRLTRSGSGYLATDAGANTVVRGN + ADGTTATEYLLPKNELPTGAAETVPTGIAKAADGTVYVADMSGGRVGASRVWKIAPGQQ + 
PEILATGMTNLIDLDLDRDGDLIALSYSAAALAGPPQPGALFEIDADSGAVTEIPTGDQ + LKQPTGVAVDPCGKVYVTNNTLGTNGQLVRVNR" + mRNA 27631..28602 + /locus_tag="JK1GL000033" + /note="MULTISPECIES: hydroxyneurosporene methyltransferase" + gene 27631..28602 + /locus_tag="JK1GL000033" + CDS 27631..28602 + /codon_start=1 + /db_xref="COG:COG1414 DNA-binding transcriptional + regulator, IclR family" + /db_xref="UniProtKB/TrEMBL:A0A399CND7" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1042:O-methyltransferase (Score: 322.9; E-value: + 4e-98)" + /gene_functions="biosynthetic-additional (t2pks) MET + (Score: 266.1; E-value: 1e-81)" + /gene_kind="biosynthetic-additional" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000033" + /note="GO_function: GO:0008168 - methyltransferase + activity; GO_function: GO:0008171 - O-methyltransferase + activity" + /product="MULTISPECIES: hydroxyneurosporene + methyltransferase" + /protein_id="ncbi_JK1GL000033" + /transl_table=11 + /translation="MGVMVTRAVHVAAELKVAEALAEGPLSADELAGRVGADADALGRV + LRLLASNGVFATRPDGAFELTPMADALRADHPMSMRGIALLMGHPIHWEDWSGFPETVV + TGEPALPKLRGMHAFEFLTKNAEYGQVFFQGMGSMSASETEPILAAYDFSQFGTVVDFC + GGQGALLAGILGAAPGCEGVLFDPRVEENGAAEFLAAQGVADRTKRVAGDLFDVPPGGA + DAYVLKHIVHDWPEEQALRILRNVRAAIKPGGKLLIAEMVIPEQGDQPHSGKLVDLWLM + LLVGGRERTPGQYADLLARAGFRLERVVETAAAISLVEAVPV" + mRNA complement(28804..30318) + /locus_tag="JK1GL000034" + /note="FAD-binding protein" + gene complement(28804..30318) + /locus_tag="JK1GL000034" + CDS complement(28804..30318) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A399CJT3" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1050:monooxygenase FAD-binding (Score: 551.4; E-value: + 3.7e-167)" + /gene_functions="biosynthetic-additional (t2pks) OXY + (Score: 570.9; E-value: 5.2e-174)" + /gene_kind="biosynthetic-additional" + /locus_tag="JK1GL000034" + /note="GO_function: GO:0071949 - FAD binding" + /product="FAD-binding protein" + /protein_id="ncbi_JK1GL000034" + /transl_table=11 + 
/translation="MEGTAADTDVIVVGAGPTGLMLAGELRLGGARVVVIEKLAAPTGQ + SRGLGFTARAMETFDERGLLPRFGQGETLATSPVGHFGGAQFDFTVLEDAHFGARGIPQ + GDTEAVLEGWAGELGADIRRGWEFVSLTDGFLDGDGVEITVRTPQGEERTLRASYLAGC + DGGSSRVRRAAGFDFLGTDATQGMYLADITGVELTPRFLGERLNNGMVMAAPLSQGVWR + IIVCPDGRPAHDRERTVTFEEVAAAWQDITGEDISHGGASWVSSFTNATRQASEYRRGR + VFLAGDAAHIHLPAGGQGLSTGVQDAANLGWKLASVIRGDAPRELLDTYHAERHPVGAR + LLMNTRAQGIVFLGGAESDPLRELMAELVRYDDVKRHLAGIVSHLDIRYDLADTATGPT + HPLLGRRMPPRLLVGADGETRIARLLHAGHGVLLDLADDETVRATAAGHADRVDVVTAV + AKPTDGPDALAGATAVLIRPDGYVAWTGTCAQGLETALERWFGPPR" + mRNA complement(30421..31896) + /locus_tag="JK1GL000035" + /note="FAD-dependent oxidoreductase" + gene complement(30421..31896) + /locus_tag="JK1GL000035" + CDS complement(30421..31896) + /codon_start=1 + /db_xref="UniProtKB/Swiss-Prot:Q5YTV5 Rifampicin + monooxygenase" + /db_xref="UniProtKB/TrEMBL:A0A3R9U1U9" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1050:monooxygenase FAD-binding (Score: 556.6; E-value: + 9.8e-169)" + /gene_functions="biosynthetic-additional (t2pks) OXY + (Score: 585.0; E-value: 2.9e-178)" + /gene_kind="biosynthetic-additional" + /locus_tag="JK1GL000035" + /note="GO_function: GO:0071949 - FAD binding" + /product="FAD-dependent oxidoreductase" + /protein_id="ncbi_JK1GL000035" + /transl_table=11 + /translation="MAADALTTDVVVVGAGPVGMMLAGELAHGGVGVVVVEKRRAPSTE + SRASTLHARTMEILDSRSLLPEFGDPPNEPRGHFGGIPLDLTLPSSHPGQWKVPQTRTE + VILGEWALSLGAELQCKHELTALDDSGDLVEAEAAGPDGRTLRLRCRYLVACDGEESTV + RRLIGADFPGRDATRELLRADVAGIDIPGRRFERLEHGLAIAARRPDGVTRVMVHEFGS + AARARPHGDVSFEEITAVWKRVTGEDISGGTPLWANAFGDASRQLTRYRHGRVLFAGDA + AHRQMPVGGQALNLGMQDAFNLGWKLALVVRGKAPQTLLDSYHDERHEVGRQVLANIRA + QSLLLLGGPEVEPLRDLLTELIGQEDVRRRLAGMISGLDVRYDVGGPAHPLLGARLPCT + EVRARRRLLTTTQLVRSGGGVLLDLTGRPGRPPAVLDGWADRVTALDAQPSPGSSLQGT + DRVLVRPDGHVAWAGPGTDGLAEALTRWFGPPR" + mRNA complement(31900..32844) + /locus_tag="JK1GL000036" + /note="cyclase" + gene complement(31900..32844) + /locus_tag="JK1GL000036" + CDS complement(31900..32844) + 
/EC_number="4.2.1.-" + /NRPS_PKS="Domain: Polyketide_cyc2 (4-146). E-value: + 2.2e-16. Score: 52.4. Matches aSDomain: + nrpspksdomains_JK1GL000036_Polyketide_cyc2.1" + /NRPS_PKS="Domain: Polyketide_cyc2 (157-310). E-value: + 2.8e-09. Score: 29.3. Matches aSDomain: + nrpspksdomains_JK1GL000036_Polyketide_cyc2.2" + /NRPS_PKS="type: other" + /codon_start=1 + /db_xref="UniProtKB/Swiss-Prot:P41178 hypothetical protein" + /db_xref="UniProtKB/TrEMBL:A0A399CFS4" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1128:cyclase/dehydrase (Score: 454.2; E-value: + 3.6e-138)" + /gene_functions="biosynthetic-additional (t2pks) CYC C7-C12 + (Score: 472.7; E-value: 9.4e-145)" + /gene_kind="biosynthetic-additional" + /locus_tag="JK1GL000036" + /product="cyclase" + /protein_id="ncbi_JK1GL000036" + /transl_table=11 + /translation="MTTREVEHEITIGAPADAVYQLLADVTNWPRIFPPTIHVDRTEAD + GDHERIHIWATANGQAKEWTSRRTLDRENLTITFRQEIPAAPVKHMGGTWIIEPLADDR + SRVRLLHDYSAVGDDPHDLLWIEQAVDKNSTSELAALKVNVEAAHAAATEELTFSFTDT + VHIDGAAKDVFDFINEAQLWAERLPHVAVVRLSEDTPGLQELEMDTRAKDGSVHTTKSY + RVVFPHHKIAYKQVTLPALMTLHTGEWTFTEGDEATTASSQHTVTLNTANIARILGQDA + TVADARAYVHTALSTNSRATLAHAKAYAEQKKG" + aSDomain complement(31915..32373) + /aSDomain="Polyketide_cyc" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_JK1GL000036_Polyketide_cyc2.2" + /domain_subtype="Polyketide_cyc2" + /evalue="2.80E-09" + /label="JK1GL000036_Polyketide_cyc2.2" + /locus_tag="JK1GL000036" + /protein_end="310" + /protein_start="157" + /score="29.3" + /tool="antismash" + /translation="FSFTDTVHIDGAAKDVFDFINEAQLWAERLPHVAVVRLSEDTPGL + QELEMDTRAKDGSVHTTKSYRVVFPHHKIAYKQVTLPALMTLHTGEWTFTEGDEATTAS + SQHTVTLNTANIARILGQDATVADARAYVHTALSTNSRATLAHAKAYAE" + aSModule 31915..32832 + /domains="nrpspksdomains_JK1GL000036_Polyketide_cyc2.1" + /domains="nrpspksdomains_JK1GL000036_Polyketide_cyc2.2" + /incomplete + /locus_tags="JK1GL000036" + /tool="antismash" + /type="unknown" + aSDomain 
complement(32407..32832) + /aSDomain="Polyketide_cyc" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_JK1GL000036_Polyketide_cyc2.1" + /domain_subtype="Polyketide_cyc2" + /evalue="2.20E-16" + /label="JK1GL000036_Polyketide_cyc2.1" + /locus_tag="JK1GL000036" + /protein_end="146" + /protein_start="4" + /score="52.4" + /tool="antismash" + /translation="EVEHEITIGAPADAVYQLLADVTNWPRIFPPTIHVDRTEADGDHE + RIHIWATANGQAKEWTSRRTLDRENLTITFRQEIPAAPVKHMGGTWIIEPLADDRSRVR + LLHDYSAVGDDPHDLLWIEQAVDKNSTSELAALKVNVE" + mRNA complement(32884..33672) + /locus_tag="JK1GL000037" + /note="MULTISPECIES: SDR family NAD(P)-dependent + oxidoreductase" + gene complement(32884..33672) + /locus_tag="JK1GL000037" + CDS complement(32884..33672) + /EC_number="1.1.1.-" + /NRPS_PKS="Domain: PKS_KR (8-164). E-value: 7.1e-11. Score: + 34.2. Matches aSDomain: + nrpspksdomains_JK1GL000037_PKS_KR.1" + /NRPS_PKS="type: other" + /codon_start=1 + /db_xref="UniProtKB/Swiss-Prot:P41177 Monensin polyketide + synthase putative ketoacyl reductase" + /db_xref="UniProtKB/TrEMBL:A0A3R9UGD4" + /gene_functions="biosynthetic-additional + (rule-based-clusters) adh_short" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1001:short-chain dehydrogenase/reductase SDR (Score: + 259.1; E-value: 6.8e-79)" + /gene_functions="biosynthetic-additional (t2pks) KR C9 + (Score: 472.0; E-value: 1.1e-144)" + /gene_kind="biosynthetic-additional" + /locus_tag="JK1GL000037" + /note="GO_function: GO:0016491 - oxidoreductase activity" + /product="MULTISPECIES: SDR family NAD(P)-dependent + oxidoreductase" + /protein_id="ncbi_JK1GL000037" + /sec_met_domain="adh_short (E-value: 1.4e-33, bitscore: + 115.1, seeds: 230, tool: rule-based-clusters)" + /transl_table=11 + /translation="MTDTTTQRVAVVTGATSGIGLASARLLGRQGHQVFIGARNAENVA + ATVKELQGEGIDADGTVVDVRDTESVNAWIQAAVDRFGSVDVVVNNAGRSGGGPTADIA + DELWDDVIDTNLNSVFRVTRAALTIGGLRAKDRGRIINVASTAGKQGVVLGAPYSASKH + 
GVVGFTKALGNELAPTGITVNAVCPGYVETPMAQRVRQGYAAAYDTSEDAILEKFQAKI + PLGRYSTPEEVAGLVGYLASDTAASITSQALNVCGGLGNF" + aSDomain complement(33181..33648) + /aSDomain="PKS_KR" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_JK1GL000037_PKS_KR.1" + /evalue="7.10E-11" + /label="JK1GL000037_PKS_KR.1" + /locus_tag="JK1GL000037" + /protein_end="164" + /protein_start="8" + /score="34.2" + /specificity="KR activity: inactive" + /specificity="KR stereochemistry: C1" + /tool="antismash" + /translation="VAVVTGATSGIGLASARLLGRQGHQVFIGARNAENVAATVKELQG + EGIDADGTVVDVRDTESVNAWIQAAVDRFGSVDVVVNNAGRSGGGPTADIADELWDDVI + DTNLNSVFRVTRAALTIGGLRAKDRGRIINVASTAGKQGVVLGAPYSASKHG" + CDS_motif complement(33580..33642) + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_JK1GL000037_0001" + /evalue="6.00E-05" + /label="PKSI-KR_m1" + /locus_tag="JK1GL000037" + /protein_end="31" + /protein_start="10" + /score="15.7" + /tool="antismash" + /translation="VVTGATSGIGLASARLLGRQG" + mRNA complement(33685..33954) + /locus_tag="JK1GL000038" + /note="MULTISPECIES: acyl carrier protein" + gene complement(33685..33954) + /locus_tag="JK1GL000038" + CDS complement(33685..33954) + /NRPS_PKS="Domain: ACP (12-83). E-value: 9.1e-13. Score: + 40.2. 
Matches aSDomain: nrpspksdomains_JK1GL000038_ACP.1" + /NRPS_PKS="type: other" + /codon_start=1 + /db_xref="COG:COG0236 Acyl carrier protein" + /db_xref="UniProtKB/Swiss-Prot:P41174 Monensin polyketide + synthase acyl carrier protein" + /db_xref="UniProtKB/TrEMBL:A0A399CG47" + /gene_functions="biosynthetic-additional + (rule-based-clusters) PP-binding" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1129:acyl carrier protein (Score: 114.7; E-value: + 2.6e-35)" + /gene_functions="biosynthetic-additional (t2pks) ACP + (Score: 127.3; E-value: 3.8e-40)" + /gene_kind="biosynthetic-additional" + /locus_tag="JK1GL000038" + /product="MULTISPECIES: acyl carrier protein" + /protein_id="ncbi_JK1GL000038" + /sec_met_domain="PP-binding (E-value: 3.6e-06, bitscore: + 26.1, seeds: 164, tool: rule-based-clusters)" + /transl_table=11 + /translation="MASKSFTLDDLKRTLREAAGVAEGVDLDGDILDTEFEVIGYESLA + LLEAGSLIEREYGISLDEEAVGEANTPRSFIEVVNAQLAPAKAA" + aSDomain complement(33706..33918) + /aSDomain="ACP" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_JK1GL000038_ACP.1" + /evalue="9.10E-13" + /label="JK1GL000038_ACP.1" + /locus_tag="JK1GL000038" + /protein_end="83" + /protein_start="12" + /score="40.2" + /tool="antismash" + /translation="RTLREAAGVAEGVDLDGDILDTEFEVIGYESLALLEAGSLIEREY + GISLDEEAVGEANTPRSFIEVVNAQL" + mRNA complement(34023..35234) + /locus_tag="JK1GL000039" + /note="MULTISPECIES: ketosynthase chain-length factor" + gene complement(34023..35234) + /locus_tag="JK1GL000039" + CDS complement(34023..35234) + /EC_number="2.3.1.-" + /EC_number="2.3.1.260" + /EC_number="2.3.1.235" + /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (48-401). E-value: + 9.4e-31. Score: 98.9. 
Matches aSDomain: + nrpspksdomains_JK1GL000039_PKS_KS.1" + /NRPS_PKS="type: PKS/NRPS-like protein" + /codon_start=1 + /db_xref="COG:COG0304 3-oxoacyl-(acyl-carrier-protein) + synthase" + /db_xref="UniProtKB/Swiss-Prot:Q02062 Actinorhodin + polyketide putative beta-ketoacyl synthase 2" + /db_xref="UniProtKB/TrEMBL:A0A399CKN5" + /gene_functions="biosynthetic (rule-based-clusters) T2PKS: + t2clf" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1093:Beta-ketoacyl synthase (Score: 672.2; E-value: + 3.4e-204)" + /gene_functions="biosynthetic-additional (t2pks) CLF 8|9 + (Score: 704.2; E-value: 9.9e-215)" + /gene_kind="biosynthetic" + /locus_tag="JK1GL000039" + /note="GO_function: GO:0003824 - catalytic activity" + /product="MULTISPECIES: ketosynthase chain-length factor" + /protein_id="ncbi_JK1GL000039" + /sec_met_domain="t2clf (E-value: 4.4e-207, bitscore: 686.3, + seeds: 26, tool: rule-based-clusters)" + /transl_table=11 + /translation="MTASVVVTGLGVVSPNGMGVKDYWAATLGGKHGIGRITRFDPTGY + PARLAGQIEDFDAEELLPSRLLPQTDRVTRLALVAADWALADAGADPAHLPEFDMGVIT + ASAAGGFEFGQGELQALWSQGSQYVSAYQSFAWFYAVNSGQISIRNGMKGPSGVVVSEG + AGGLDAVAQARRQIRRGTPLIVTGGVDASICPWGWVAQLACGRLTTSDEPDHAYLPFDR + DANGYVPGEGGAILIAEDADAARARGVRPYGEIAGYGATIDPRPGSGREPNLAKAIETA + LADADVNAADIDVVFADGAGDPAGDLAEARAVSTVFGDRGVPVTVPKTMTGRLYSGGAP + LDLAAAFLALRDGVIPPTVHIDPCADYPLDLVLGEPRPAELRTALVLARGAGGFNSAMV + VRAA" + aSDomain complement(34032..35090) + /aSDomain="PKS_KS" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_JK1GL000039_PKS_KS.1" + /domain_subtype="Iterative-KS" + /evalue="9.40E-31" + /label="JK1GL000039_PKS_KS.1" + /locus_tag="JK1GL000039" + /protein_end="401" + /protein_start="48" + /score="98.9" + /tool="antismash" + /translation="LAGQIEDFDAEELLPSRLLPQTDRVTRLALVAADWALADAGADPA + HLPEFDMGVITASAAGGFEFGQGELQALWSQGSQYVSAYQSFAWFYAVNSGQISIRNGM + KGPSGVVVSEGAGGLDAVAQARRQIRRGTPLIVTGGVDASICPWGWVAQLACGRLTTSD + 
EPDHAYLPFDRDANGYVPGEGGAILIAEDADAARARGVRPYGEIAGYGATIDPRPGSGR + EPNLAKAIETALADADVNAADIDVVFADGAGDPAGDLAEARAVSTVFGDRGVPVTVPKT + MTGRLYSGGAPLDLAAAFLALRDGVIPPTVHIDPCADYPLDLVLGEPRPAELRTALVLA + RGAGGFNSAMVVR" + CDS_motif complement(34539..34577) + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_JK1GL000039_0002" + /evalue="1.20E-04" + /label="PKSI-KS_m4" + /locus_tag="JK1GL000039" + /protein_end="232" + /protein_start="219" + /score="15.0" + /tool="antismash" + /translation="FDRDANGYVPGEG" + CDS_motif complement(34746..34769) + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_JK1GL000039_0001" + /evalue="9.90E+01" + /label="PKSI-KS_m4" + /locus_tag="JK1GL000039" + /protein_end="163" + /protein_start="155" + /score="-2.9" + /tool="antismash" + /translation="SGVVVSEG" + mRNA complement(35231..36484) + /locus_tag="JK1GL000040" + /note="beta-ketoacyl-acyl-carrier-protein synthase family + protein" + gene complement(35231..36484) + /locus_tag="JK1GL000040" + CDS complement(35231..36484) + /EC_number="2.3.1.-" + /EC_number="2.3.1.260" + /EC_number="2.3.1.235" + /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (1-389). E-value: + 9.4e-53. Score: 171.4. 
Matches aSDomain: + nrpspksdomains_JK1GL000040_PKS_KS.1" + /NRPS_PKS="type: PKS/NRPS-like protein" + /codon_start=1 + /db_xref="COG:COG0304 3-oxoacyl-(acyl-carrier-protein) + synthase" + /db_xref="UniProtKB/Swiss-Prot:P41175 Putative polyketide + beta-ketoacyl synthase 1" + /db_xref="UniProtKB/TrEMBL:A0A454W1H2" + /gene_functions="biosynthetic (rule-based-clusters) T2PKS: + t2ks" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1022:Beta-ketoacyl synthase (Score: 482.3; E-value: + 2.3e-146)" + /gene_functions="biosynthetic-additional (t2pks) KS (Score: + 773.1; E-value: 1.4e-235)" + /gene_kind="biosynthetic" + /locus_tag="JK1GL000040" + /note="GO_function: GO:0003824 - catalytic activity" + /product="beta-ketoacyl-acyl-carrier-protein synthase + family protein" + /protein_id="ncbi_JK1GL000040" + /sec_met_domain="t2ks (E-value: 7.1e-244, bitscore: 808.0, + seeds: 25, tool: rule-based-clusters)" + /transl_table=11 + /translation="MITGIEVIAPGGVGRENFWNLLSNGRTATRGITFFDPAPFRSRVA + AEADFDPYEHGLTPQEVRRLDRAAQFAVVASRGAVADSGLDIPSLDPHRVGVTVGSAVG + ATMGLDQEYRVVSDGGRLDTVDHTYAVPHLYDYMVPSSFAAEVAWAVGAEGPSTVVSTG + CTSGIDSVGYAVELVREGSADVVIAGSSDAPISPITMACFDAIKATTPRHDEPECASRP + FDKTRNGFVLGEGTAFFVLEELDSARKRGAHIYAEIAGYATRSNAYHMTGLRPDGVEMA + EAIDLALGEARLNPQSIDYINAHGSGTKQNDRHETAAFKRSLGDHAYRTPVSSIKSMVG + HSLGAIGSIEIAASALAMEYDVVPPTANLHTPDPECDLDYVPLVARDQLIDAVLTVGSG + FGGFQSAMVLATPERSLV" + aSDomain complement(35318..36481) + /aSDomain="PKS_KS" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_JK1GL000040_PKS_KS.1" + /domain_subtype="Iterative-KS" + /evalue="9.40E-53" + /label="JK1GL000040_PKS_KS.1" + /locus_tag="JK1GL000040" + /protein_end="389" + /protein_start="1" + /score="171.4" + /tool="antismash" + /translation="ITGIEVIAPGGVGRENFWNLLSNGRTATRGITFFDPAPFRSRVAA + EADFDPYEHGLTPQEVRRLDRAAQFAVVASRGAVADSGLDIPSLDPHRVGVTVGSAVGA + TMGLDQEYRVVSDGGRLDTVDHTYAVPHLYDYMVPSSFAAEVAWAVGAEGPSTVVSTGC + 
TSGIDSVGYAVELVREGSADVVIAGSSDAPISPITMACFDAIKATTPRHDEPECASRPF + DKTRNGFVLGEGTAFFVLEELDSARKRGAHIYAEIAGYATRSNAYHMTGLRPDGVEMAE + AIDLALGEARLNPQSIDYINAHGSGTKQNDRHETAAFKRSLGDHAYRTPVSSIKSMVGH + SLGAIGSIEIAASALAMEYDVVPPTANLHTPDPECDLDYVPLVARDQL" + mRNA complement(36499..36828) + /locus_tag="JK1GL000042" + /note="MULTISPECIES: TcmI family type II polyketide + cyclase" + gene complement(36499..36828) + /locus_tag="JK1GL000042" + CDS complement(36499..36828) + /codon_start=1 + /db_xref="UniProtKB/Swiss-Prot:P23159 hypothetical protein" + /db_xref="UniProtKB/TrEMBL:A0A399CJD3" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1225:Polyketide synthesis cyclase (Score: 161; + E-value: 1.3e-49)" + /gene_functions="biosynthetic-additional (t2pks) CYC + C4-C17/C2-C19 (Score: 199.8; E-value: 9.5e-62)" + /gene_kind="biosynthetic-additional" + /locus_tag="JK1GL000042" + /note="GO_process: GO:0030639 - polyketide biosynthetic + process" + /product="MULTISPECIES: TcmI family type II polyketide + cyclase" + /protein_id="ncbi_JK1GL000042" + /transl_table=11 + /translation="MHSTLIVARMAATSSNDVAQLFADFDATEMPHRMGTRRRQLFSYR + GLYFHLQDFDEDNGGELIEAAKADPRFVRISEDLKPFIEAYDPTTWRSPADAMATRFYS + WEASR" + mRNA complement(37086..37784) + /locus_tag="JK1GL000041" + /note="hypothetical protein" + gene complement(37086..37784) + /locus_tag="JK1GL000041" + CDS complement(37086..37784) + /codon_start=1 + /db_xref="COG:COG2329 Heme-degrading monooxygenase HmoA and + related ABM domain proteins" + /db_xref="UniProtKB/TrEMBL:A0A454W1H6" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000041" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000041" + /transl_table=11 + /translation="MPIISAEDKHLTVLNLFTTDTPEKQAKLIEEMTKIVNAAAYEGWM + SSTVHSGVDGYGTLNFIQWRSGEDLEKRYAGEEFKHRTLPVFGEITTSIRLMQNEVAHT + LTSDALGGKIEIGPDRDDYTVFTLFPVTPEGQDEAVDALGPGQAFLADVPGFRAHVVLK + GLRARGLEGSFVISYSQWDSKEAFEVYRDQAPEEQADARKAAVARVRAVVTGEPYLNTY + RVVHTRSAGE" + mRNA complement(37841..39313) + /locus_tag="JK1GL000043" 
+ /note="MULTISPECIES: monooxygenase" + gene complement(37841..39313) + /locus_tag="JK1GL000043" + CDS complement(37841..39313) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A454W1G7" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1050:monooxygenase FAD-binding (Score: 529.6; E-value: + 1.4e-160)" + /gene_functions="biosynthetic-additional (t2pks) OXY + (Score: 512.5; E-value: 2.7e-156)" + /gene_kind="biosynthetic-additional" + /locus_tag="JK1GL000043" + /note="GO_function: GO:0071949 - FAD binding" + /product="MULTISPECIES: monooxygenase" + /protein_id="ncbi_JK1GL000043" + /transl_table=11 + /translation="MEFYDSDVIVVGAGPTGLMLAGELRLAGVSVVVLDKLSEPIQESR + ALGFSARTIEEFAQRGLMDRFGEVGVIPVGHFGGVPLDYRVIEGGSYGARGIPQARTEG + VLGGWARELGADIRRGCEVTGIEQTDASVTVTAAGADGPFSLRARHVVGCDGARSIVRK + LAGIGFPGTEPAIELRFADLAGVALRPRFSGERVAGGMVMVIPMGPDRCRVIYFDSSEP + LRTSPDPITFDEVAQTWQRLTGEDVSGATPLWVSSTTDVSRQADRYRHGRVFLAGDAAH + IHLPIGAQGMSAGVQDAVNLGWKLALDIKGQAPEGLLDTYHAERHPVGARILTNTLAQR + ILYLGGDEITPMREVLAELMGAHESVQRHLAGMVTGLDIRHDVGEGDHPLLGRRLPDRE + LVVDGEKTPFYALLRTARPVLLELGGDHGLRTAAAGWADRVDLVAAEFDGCEAPVDGIL + VRPDGYVAWVAGLGAGPDGLTAALGRWFGPTA" + mRNA 39480..39962 + /locus_tag="JK1GL000044" + /note="MULTISPECIES: nuclear transport factor 2 family + protein" + gene 39480..39962 + /locus_tag="JK1GL000044" + CDS 39480..39962 + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A399CRN6" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000044" + /product="MULTISPECIES: nuclear transport factor 2 family + protein" + /protein_id="ncbi_JK1GL000044" + /transl_table=11 + /translation="MTSSLTTDQSASVSAAESSAQVAGLLHRYLVSLDDERLDDAWTAG + LFTEDAVVAFPVSRHEGADGMAEYHRSALSAFAATQHLGSPAVVDVDGDRAVFRANLIS + THVHHPRHTPPEGDLPPLFATGTFVNGEARRTARGWRLSLLAFRLLWADGSPPPAR" + mRNA complement(40155..40571) + /locus_tag="JK1GL000045" + /note="MULTISPECIES: pyridoxamine 5'-phosphate oxidase" + gene complement(40155..40571) + /locus_tag="JK1GL000045" + CDS complement(40155..40571) + /codon_start=1 + 
/db_xref="UniProtKB/TrEMBL:A0A454W1F9" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000045" + /note="GO_function: GO:0048037 - cofactor binding" + /product="MULTISPECIES: pyridoxamine 5'-phosphate oxidase" + /protein_id="ncbi_JK1GL000045" + /transl_table=11 + /translation="MPSMPRPDAVTVPDSVQAFLTGTALVAAFTTMRPDGTPHVAPVRF + TWDADAQLARVMTVSSSRKARNLLATPGAPVALCQVDGFRWVTLEGTGTVVTDPERVAL + GARLYAKRYWSAPPTPSDRVVIEIAVDRVLSLNA" + mRNA complement(40814..40960) + /locus_tag="JK1GL000046" + /note="hypothetical protein" + gene complement(40814..40960) + /locus_tag="JK1GL000046" + CDS complement(40814..40960) + /codon_start=1 + /locus_tag="JK1GL000046" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000046" + /transl_table=11 + /translation="MHEGDDERHEGDTARCARAVHGGPPPLRLAGAEEREDEDGRVIVR + SID" + mRNA complement(40995..42485) + /locus_tag="JK1GL000047" + /note="hypothetical protein" + gene complement(40995..42485) + /locus_tag="JK1GL000047" + CDS complement(40995..42485) + /NRPS_PKS="Domain: Condensation_DCL (38-314). E-value: + 1e-48. Score: 157.8. 
Matches aSDomain: + nrpspksdomains_JK1GL000047_Condensation_DCL.1" + /NRPS_PKS="type: NRPS-like protein" + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A454W1I0" + /gene_functions="biosynthetic-additional + (rule-based-clusters) Condensation" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1127:condensation domain-containing protein (Score: + 260.3; E-value: 6.5e-79)" + /gene_kind="biosynthetic-additional" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000047" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000047" + /sec_met_domain="Condensation (E-value: 7.1e-28, bitscore: + 96.2, seeds: 42, tool: rule-based-clusters)" + /transl_table=11 + /translation="MAWHSRPRALRGPGTARPPGVPALWPHLDLLGDFGGRRGAGRHVE + QLVWRWHGPLDTERFAAAWQSVVDRESVLRAALAPGPRPHLVLHEHAHGDVVRHRAGGA + GWDRLLERDRRRGLDPSRPCPLRVTLVERTDDPAGAGPVTRVVLTFHHALLDAWSVCLL + MQELCRAYLAGGELPGGERRPDLRDWAGWLQRQDPAGARDFWRGAVPDGPVAVLPARPG + PRTRQRGRGRTEVRLSPAEAERLHRWAALRAVPDSSALETVWALLLYRAAGPGGAATVG + FGVTVSGRGITLDCAERLPGPLRNCLPMVVRVDPGETVGRLLTALRDRALDMAAYEWVS + TRRIHRWTGRCPDGELLQSVVSVDSLPRPPGNLRNELADAGIALEPEPAHGACPDLPVA + LLVRPGGDGRLTFCVDHDRNRISDADARLLAGHCARLLRHLPGTDEATTNGAVLDVLAG + EALPRIAPRPSRPRPAGSWLRPRSTSFGAAVDRAASHP" + CDS_motif complement(41508..41567) + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_JK1GL000047_0004" + /evalue="3.90E+01" + /label="C2_LCL_024-062" + /locus_tag="JK1GL000047" + /protein_end="326" + /protein_start="306" + /score="-3.2" + /tool="antismash" + /translation="LPMVVRVDPGETVGRLLTAL" + aSDomain complement(41544..42371) + /aSDomain="Condensation" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_JK1GL000047_Condensation_DCL.1" + /domain_subtype="Condensation_DCL" + /evalue="1.00E-48" + /label="JK1GL000047_Condensation_DCL.1" + /locus_tag="JK1GL000047" + /protein_end="314" + /protein_start="38" + /score="157.8" + /tool="antismash" + 
/translation="GAGRHVEQLVWRWHGPLDTERFAAAWQSVVDRESVLRAALAPGPR + PHLVLHEHAHGDVVRHRAGGAGWDRLLERDRRRGLDPSRPCPLRVTLVERTDDPAGAGP + VTRVVLTFHHALLDAWSVCLLMQELCRAYLAGGELPGGERRPDLRDWAGWLQRQDPAGA + RDFWRGAVPDGPVAVLPARPGPRTRQRGRGRTEVRLSPAEAERLHRWAALRAVPDSSAL + ETVWALLLYRAAGPGGAATVGFGVTVSGRGITLDCAERLPGPLRNCLPMVVRVD" + CDS_motif complement(41559..41645) + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_JK1GL000047_0003" + /evalue="6.10E-06" + /label="C5_DCL_263-294" + /locus_tag="JK1GL000047" + /protein_end="309" + /protein_start="280" + /score="18.7" + /tool="antismash" + /translation="GFGVTVSGRGITLDCAERLPGPLRNCLPM" + CDS_motif complement(41973..42038) + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_JK1GL000047_0002" + /evalue="4.90E-08" + /label="C3_DCL_135-156" + /locus_tag="JK1GL000047" + /protein_end="171" + /protein_start="149" + /score="25.5" + /tool="antismash" + /translation="FHHALLDAWSVCLLMQELCRAY" + CDS_motif complement(42255..42356) + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_JK1GL000047_0001" + /evalue="3.80E-10" + /label="C2_DCL_024-062" + /locus_tag="JK1GL000047" + /protein_end="77" + /protein_start="43" + /score="32.1" + /tool="antismash" + /translation="VEQLVWRWHGPLDTERFAAAWQSVVDRESVLRAA" + mRNA complement(42690..43436) + /locus_tag="JK1GL000048" + /note="MULTISPECIES: 4'-phosphopantetheinyl transferase + superfamily protein" + gene complement(42690..43436) + /locus_tag="JK1GL000048" + CDS complement(42690..43436) + /EC_number="2.7.8.-" + /NRPS_PKS="Domain: ACPS (113-174). E-value: 6.1e-12. Score: + 37.3. 
Matches aSDomain: nrpspksdomains_JK1GL000048_ACPS.1" + /NRPS_PKS="type: other" + /codon_start=1 + /db_xref="COG:COG2091 Phosphopantetheinyl transferase" + /db_xref="UniProtKB/TrEMBL:A0A399CJU2" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1012:4'-phosphopantetheinyl transferase (Score: 140.4; + E-value: 8.9e-43)" + /gene_kind="biosynthetic-additional" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000048" + /note="GO_function: GO:0000287 - magnesium ion binding; + GO_function: GO:0008897 - holo-[acyl-carrier-protein] + synthase activity" + /product="MULTISPECIES: 4'-phosphopantetheinyl transferase + superfamily protein" + /protein_id="ncbi_JK1GL000048" + /transl_table=11 + /translation="MREDLFRHGNALVCTTWSEWLPSVLTTPRLRELLGDDWQRYRRTR + DAAVRYRFAASRMLIKYTAAAALAVPPEYLDLAYRLGGRPYLRGFDQIELSLSHTGDVM + AVGLSRIGRIGVDVEPAERPVRLDLLETQVFTPAEARELAELPEGERTAHALRLWTLKE + AYSKALGQGLRFGFKEFGFRQGRLSAPDGSRVTRDEWGFATYPVMDRFLLSVACHNAGL + STAGDTSVGTMLDQGFLSAMTDTGQQ" + aSDomain complement(42915..43097) + /aSDomain="ACPS" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_JK1GL000048_ACPS.1" + /evalue="6.10E-12" + /label="JK1GL000048_ACPS.1" + /locus_tag="JK1GL000048" + /protein_end="174" + /protein_start="113" + /score="37.3" + /tool="antismash" + /translation="IGVDVEPAERPVRLDLLETQVFTPAEARELAELPEGERTAHALRL + WTLKEAYSKALGQGLR" + mRNA complement(43588..45402) + /locus_tag="JK1GL000049" + /note="acyl-CoA dehydrogenase" + gene complement(43588..45402) + /locus_tag="JK1GL000049" + CDS complement(43588..45402) + /codon_start=1 + /db_xref="COG:COG1960 Acyl-CoA dehydrogenase related to the + alkylation response protein AidB" + /db_xref="UniProtKB/TrEMBL:A0A3R9SSA2" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1006:acyl-CoA dehydrogenase (Score: 155.1; E-value: + 4.6e-47)" + /gene_kind="biosynthetic-additional" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000049" + 
/note="GO_function: GO:0016627 - oxidoreductase activity, + acting on the CH-CH group of donors; GO_function: + GO:0050660 - flavin adenine dinucleotide binding; + GO_process: GO:0055114 - oxidation-reduction process" + /product="acyl-CoA dehydrogenase" + /protein_id="ncbi_JK1GL000049" + /transl_table=11 + /translation="MTAALDTAAGPTGQAPDPRSTTPTPAPEHTTPESQHITRAPEPER + AARLEAALGDPFDPVNPHGHLALVRADDTREAPHATEALLTEHGLSAEFVPHDLGGRLR + DLEELARVLRPLFRRDLALGYGFGITSLFAASSVWTAGDTHQRAALADVLLGGGRVAIV + HREVAHANAILRREVRAQRPAGGGFLLNGSKDAVMNADRTDTFVVYARTSAGSGSASHS + VLLLPGPPASGEVRRLARVEMPGMRGARFHGLRLADVRLPDSALVGSLGEGVTLALRSF + QISHCLIPGTVLAGVDSVLRLAVRAATENRPDGRPARRWHKALSGVFADLLACDAMAVT + GLRALSLVPQHAHLLAAAVKYTMPDLLREDLEELAAVLGARGYDRGPLYGGFQKLARDL + PVAGLGHSGTAVCQAVLVPQLPALARTAWFRTAEPSAALFLPGAPLPPLDHRRLTHSGT + DDPLTATLIGAAERLAARTGTQPLHAALAALARALVEELRVLRARCAALPAAGSTVFDP + LACALADRYALLLCAAACLGVWEGQADGDGFLADPAWAVLVLSRIGRRLGIAVPETPAD + AEQAVLAEALGRCRHGRSLDLYDTPLAG" + mRNA complement(45399..46259) + /locus_tag="JK1GL000050" + /note="MULTISPECIES: cyclase" + gene complement(45399..46259) + /locus_tag="JK1GL000050" + CDS complement(45399..46259) + /EC_number="4.2.1.-" + /NRPS_PKS="Domain: Polyketide_cyc2 (2-127). E-value: + 2.5e-11. Score: 36.0. Matches aSDomain: + nrpspksdomains_JK1GL000050_Polyketide_cyc2.1" + /NRPS_PKS="Domain: Polyketide_cyc2 (138-245). E-value: + 1e-07. Score: 24.3. 
Matches aSDomain: + nrpspksdomains_JK1GL000050_Polyketide_cyc2.2" + /NRPS_PKS="type: other" + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A399CG55" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1128:cyclase/dehydrase (Score: 266.8; E-value: + 4.2e-81)" + /gene_functions="biosynthetic-additional (t2pks) CYC C7-C12 + (Score: 256.3; E-value: 6.9e-79)" + /gene_kind="biosynthetic-additional" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000050" + /product="MULTISPECIES: cyclase" + /protein_id="ncbi_JK1GL000050" + /transl_table=11 + /translation="MLYGLIADATVWPLFFPPSVHVEQLDFDGTRERLRMWAVAGDRIS + SWVSHRRLDVGQRRVEFRQERPSAPVETMTGLWTVEPLGDGSRVTLEHAFTVVGDAPAD + AAWTERVTRANSRAQLQRLAWLAERWTRLDDLVMSFEDTVRVNVPAELVFDFLYRAGDW + PDDLAGTRPLTVQEDTPGIQVLALDGRSATGGEAVRISFPAAGRLVHKHTRTSGPLAAY + TGEWTIEPQPGAGLDVTVRHDVLLNDDAALDQDAARRVCDEVGRAGRRLLEHAVRHASD + AVRVL" + aSDomain complement(45525..45845) + /aSDomain="Polyketide_cyc" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_JK1GL000050_Polyketide_cyc2.2" + /domain_subtype="Polyketide_cyc2" + /evalue="1.00E-07" + /label="JK1GL000050_Polyketide_cyc2.2" + /locus_tag="JK1GL000050" + /protein_end="245" + /protein_start="138" + /score="24.3" + /tool="antismash" + /translation="SFEDTVRVNVPAELVFDFLYRAGDWPDDLAGTRPLTVQEDTPGIQ + VLALDGRSATGGEAVRISFPAAGRLVHKHTRTSGPLAAYTGEWTIEPQPGAGLDVTVRH + DVL" + aSModule 45525..46253 + /domains="nrpspksdomains_JK1GL000050_Polyketide_cyc2.1" + /domains="nrpspksdomains_JK1GL000050_Polyketide_cyc2.2" + /incomplete + /locus_tags="JK1GL000050" + /tool="antismash" + /type="unknown" + aSDomain complement(45879..46253) + /aSDomain="Polyketide_cyc" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_JK1GL000050_Polyketide_cyc2.1" + /domain_subtype="Polyketide_cyc2" + /evalue="2.50E-11" + /label="JK1GL000050_Polyketide_cyc2.1" + /locus_tag="JK1GL000050" + 
/protein_end="127" + /protein_start="2" + /score="36.0" + /tool="antismash" + /translation="YGLIADATVWPLFFPPSVHVEQLDFDGTRERLRMWAVAGDRISSW + VSHRRLDVGQRRVEFRQERPSAPVETMTGLWTVEPLGDGSRVTLEHAFTVVGDAPADAA + WTERVTRANSRAQLQRLAWLA" + mRNA 46599..46835 + /locus_tag="JK1GL000051" + /note="hypothetical protein" + gene 46599..46835 + /locus_tag="JK1GL000051" + CDS 46599..46835 + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A454W1G8" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000051" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000051" + /transl_table=11 + /translation="MRRFRPRRCVRGLWEGLVAYGRLCLAGETDRYDHPPRPRVRWHRP + PPGHPERVRDDMPLTDLERRLARELTDEDHDVR" + mRNA complement(47200..48465) + /locus_tag="JK1GL000052" + /note="ketosynthase chain-length factor" + gene complement(47200..48465) + /locus_tag="JK1GL000052" + CDS complement(47200..48465) + /EC_number="2.3.1.-" + /EC_number="2.3.1.260" + /EC_number="2.3.1.235" + /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (85-416). E-value: + 4.3e-25. Score: 80.3. 
Matches aSDomain: + nrpspksdomains_JK1GL000052_PKS_KS.1" + /NRPS_PKS="type: PKS/NRPS-like protein" + /codon_start=1 + /db_xref="COG:COG0304 3-oxoacyl-(acyl-carrier-protein) + synthase" + /db_xref="UniProtKB/Swiss-Prot:Q02062 Actinorhodin + polyketide putative beta-ketoacyl synthase 2" + /db_xref="UniProtKB/TrEMBL:A0A454W1F8" + /gene_functions="biosynthetic (rule-based-clusters) T2PKS: + t2clf" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1093:Beta-ketoacyl synthase (Score: 579.4; E-value: + 5.2e-176)" + /gene_functions="biosynthetic-additional (t2pks) CLF 8|9 + (Score: 582.6; E-value: 8.2e-178)" + /gene_kind="biosynthetic" + /locus_tag="JK1GL000052" + /note="GO_function: GO:0003824 - catalytic activity" + /product="ketosynthase chain-length factor" + /protein_id="ncbi_JK1GL000052" + /sec_met_domain="t2clf (E-value: 5.9e-170, bitscore: 564.0, + seeds: 26, tool: rule-based-clusters)" + /transl_table=11 + /translation="MTKATQAPEPARPAGAQGPRQTLVTGIGVAAPNGLGTRAWWDAVL + CGRTGLGPITRFDASGYPVRIAGEIPGFVDEDHIPSRLLPSTDRGTRIALVAAEEALRD + ANVSPADLPAYGAGVITASSAGGAEFGERGLAALWSKGAQHVSAYQSFASFHAAAPAQI + SIRHRLRGHGSTVVSEQAGGIDALARARRRIRDGACLMVTGGIDSTLCAWGWAAHLADG + RLSPATEPARAYRPFAATADGHAVGEGGALLVLEDARAAARRGATGYGVIAGCAATFDG + PDRPTLRQAAELALADAGLAPEHVDVVFADGAAERRADLVESQALCALFGPYGVPVTVP + KTMTGRLGAGGSALDVAAALLALREKVVPPTTGTGRVADDCPLDLVTGAPRELPRLRVA + LVLARGRGGFNSAAVLRAPQAQ" + aSDomain complement(47218..48210) + /aSDomain="PKS_KS" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_JK1GL000052_PKS_KS.1" + /domain_subtype="Iterative-KS" + /evalue="4.30E-25" + /label="JK1GL000052_PKS_KS.1" + /locus_tag="JK1GL000052" + /protein_end="416" + /protein_start="85" + /score="80.3" + /tool="antismash" + /translation="STDRGTRIALVAAEEALRDANVSPADLPAYGAGVITASSAGGAEF + GERGLAALWSKGAQHVSAYQSFASFHAAAPAQISIRHRLRGHGSTVVSEQAGGIDALAR + ARRRIRDGACLMVTGGIDSTLCAWGWAAHLADGRLSPATEPARAYRPFAATADGHAVGE + 
GGALLVLEDARAAARRGATGYGVIAGCAATFDGPDRPTLRQAAELALADAGLAPEHVDV + VFADGAAERRADLVESQALCALFGPYGVPVTVPKTMTGRLGAGGSALDVAAALLALREK + VVPPTTGTGRVADDCPLDLVTGAPRELPRLRVALVLARGRGGFNSAAVLR" + mRNA complement(48462..49733) + /locus_tag="JK1GL000053" + /note="MULTISPECIES: beta-ketoacyl-acyl-carrier-protein + synthase family protein" + gene complement(48462..49733) + /locus_tag="JK1GL000053" + CDS complement(48462..49733) + /EC_number="2.3.1.-" + /EC_number="2.3.1.260" + /EC_number="2.3.1.235" + /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (3-396). E-value: + 4.8e-49. Score: 159.2. Matches aSDomain: + nrpspksdomains_JK1GL000053_PKS_KS.1" + /NRPS_PKS="type: PKS/NRPS-like protein" + /codon_start=1 + /db_xref="COG:COG0304 3-oxoacyl-(acyl-carrier-protein) + synthase" + /db_xref="UniProtKB/Swiss-Prot:P16538 Tetracenomycin C + polyketide putative beta-ketoacyl synthase 1" + /db_xref="UniProtKB/TrEMBL:A0A399CKM9" + /gene_functions="biosynthetic (rule-based-clusters) T2PKS: + t2ks" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1022:Beta-ketoacyl synthase (Score: 423.8; E-value: + 1.3e-128)" + /gene_functions="biosynthetic-additional (t2pks) KS (Score: + 659.9; E-value: 3.3e-201)" + /gene_kind="biosynthetic" + /locus_tag="JK1GL000053" + /note="GO_function: GO:0003824 - catalytic activity" + /product="MULTISPECIES: beta-ketoacyl-acyl-carrier-protein + synthase family protein" + /protein_id="ncbi_JK1GL000053" + /sec_met_domain="t2ks (E-value: 6.8e-200, bitscore: 663.1, + seeds: 25, tool: rule-based-clusters)" + /transl_table=11 + /translation="MNRVVITGIGVVAPGAVGTAGFWDLLTVGRTATRRVTLFDACGYR + SRVAAEVDFTPAAHGFDLADTERLDRAAQFALVAAREAVADSGVADRIGRNPLRTGVSL + GSAIGCTTSLATQYAILSDCGTTWTLDHTEAAESLYDYFVPSSLAATVARDRGAQGPVA + LVSSGCTSGLDAVGHGADLIREGSADIVVAGGTEAPIVPIAMACFDRLRLTSSRNDDPA + TASRPFDRTRDGFVLGEGAAVLVLEELEHARRRGARPYAELSAVTAHSSAHHMTGLRPG + ALEMADAIRAALDQARLNPADVDYISAHGAGTRHNDRHETHALKESLGGSAHRVPVSSI + KSMIGHALGAAGALDLAASALAIRHDTVPPTANLHEPDPTCDLDYTPLFAREQRTSTVL + TVASGFGGFHTAAVLTRPQLKEAA" + 
aSDomain complement(48546..49724) + /aSDomain="PKS_KS" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_JK1GL000053_PKS_KS.1" + /domain_subtype="Iterative-KS" + /evalue="4.80E-49" + /label="JK1GL000053_PKS_KS.1" + /locus_tag="JK1GL000053" + /protein_end="396" + /protein_start="3" + /score="159.2" + /tool="antismash" + /translation="VVITGIGVVAPGAVGTAGFWDLLTVGRTATRRVTLFDACGYRSRV + AAEVDFTPAAHGFDLADTERLDRAAQFALVAAREAVADSGVADRIGRNPLRTGVSLGSA + IGCTTSLATQYAILSDCGTTWTLDHTEAAESLYDYFVPSSLAATVARDRGAQGPVALVS + SGCTSGLDAVGHGADLIREGSADIVVAGGTEAPIVPIAMACFDRLRLTSSRNDDPATAS + RPFDRTRDGFVLGEGAAVLVLEELEHARRRGARPYAELSAVTAHSSAHHMTGLRPGALE + MADAIRAALDQARLNPADVDYISAHGAGTRHNDRHETHALKESLGGSAHRVPVSSIKSM + IGHALGAAGALDLAASALAIRHDTVPPTANLHEPDPTCDLDYTPLFAREQRTS" + mRNA complement(49730..50509) + /locus_tag="JK1GL000055" + /note="MULTISPECIES: thioesterase" + gene complement(49730..50509) + /locus_tag="JK1GL000055" + CDS complement(49730..50509) + /NRPS_PKS="Domain: Thioesterase (15-242). E-value: 9.4e-38. + Score: 122.7. 
Matches aSDomain: + nrpspksdomains_JK1GL000055_Thioesterase.1" + /NRPS_PKS="type: other" + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A399CHI6" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1004:thioesterase (Score: 181.7; E-value: 2.1e-55)" + /gene_kind="biosynthetic-additional" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000055" + /note="GO_function: GO:0016788 - hydrolase activity, acting + on ester bonds; GO_process: GO:0009058 - biosynthetic + process" + /product="MULTISPECIES: thioesterase" + /protein_id="ncbi_JK1GL000055" + /transl_table=11 + /translation="MASRSRDREAGTARITLTCLAHAGAGVASYRGWSAAVGPGIDVAA + LPLPGRDSRRREPRLTERAGLLADFLPTLLQTARRGPYALYGHSMGALVGYTLTRALAD + SGLPPLFLAVGACPPPHTTTVLADAADLPDEDLLPLLDEIGSLPPGASASPGGLWRRTF + LPVLRDDLRLARSLRNAALDPVTGGPLDVPVLVFAGRDDPLAAPAALRHWQQWTTNLIE + LHTVAGGHFFASSSSLAQHVGRACRGHVTALPTGGGR" + aSDomain complement(49784..50464) + /aSDomain="Thioesterase" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_JK1GL000055_Thioesterase.1" + /evalue="9.40E-38" + /label="JK1GL000055_Thioesterase.1" + /locus_tag="JK1GL000055" + /protein_end="242" + /protein_start="15" + /score="122.7" + /tool="antismash" + /translation="TLTCLAHAGAGVASYRGWSAAVGPGIDVAALPLPGRDSRRREPRL + TERAGLLADFLPTLLQTARRGPYALYGHSMGALVGYTLTRALADSGLPPLFLAVGACPP + PHTTTVLADAADLPDEDLLPLLDEIGSLPPGASASPGGLWRRTFLPVLRDDLRLARSLR + NAALDPVTGGPLDVPVLVFAGRDDPLAAPAALRHWQQWTTNLIELHTVAGGHFFASSSS + LAQHV" + CDS_motif complement(50204..50272) + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_JK1GL000055_0001" + /evalue="3.80E-07" + /label="NRPS-te1" + /locus_tag="JK1GL000055" + /protein_end="102" + /protein_start="79" + /score="22.6" + /tool="antismash" + /translation="RGPYALYGHSMGALVGYTLTRAL" + mRNA complement(50767..51588) + /locus_tag="JK1GL000054" + /note="MULTISPECIES: AfsR/SARP family transcriptional + regulator" + gene 
complement(50767..51588) + /locus_tag="JK1GL000054" + CDS complement(50767..51588) + /codon_start=1 + /db_xref="COG:COG3629 DNA-binding transcriptional activator + of the SARP family" + /db_xref="UniProtKB/Swiss-Prot:P25047 Regulatory protein + DnrI" + /db_xref="UniProtKB/TrEMBL:A0A399CRP3" + /gene_functions="regulatory (smcogs) + SMCOG1041:transcriptional regulator, SARP family (Score: + 327.7; E-value: 3e-99)" + /gene_kind="regulatory" + /locus_tag="JK1GL000054" + /note="GO_function: GO:0003677 - DNA binding; GO_function: + GO:0005515 - protein binding; GO_process: GO:0000160 - + phosphorelay signal transduction system; GO_process: + GO:0006355 - regulation of transcription, DNA-templated" + /product="MULTISPECIES: AfsR/SARP family transcriptional + regulator" + /protein_id="ncbi_JK1GL000054" + /transl_table=11 + /translation="MEIKVLGALNAEFEGISVVPSAGKPRQILALLALYPGRVVPVPTL + MEEIWGTDLPQSSMTTLQTYILQLRRLLGTAMGPDVPGSAKDVLATRYGGYLLQIPAEA + VDAFTYERLVTEGRQAYEDGEDERAATVLRRALDLWDGPALVDVRVGPVLEIEAMRLEQ + SRLVARERRIDADLRLGRHVELIAELTDLIARHPQHEGLHSQAMVALYRSGRQAAALDV + YRRLRQRLIDELGVEPSPQLQRLHQAMLAVDPRLDIVAGPRRTSTFDLYAA" + mRNA 52329..53318 + /locus_tag="JK1GL000056" + /note="AfsR/SARP family transcriptional regulator" + gene 52329..53318 + /locus_tag="JK1GL000056" + CDS 52329..53318 + /codon_start=1 + /db_xref="COG:COG3629 DNA-binding transcriptional activator + of the SARP family" + /db_xref="UniProtKB/Swiss-Prot:P16922 Transcriptional + regulator RedD" + /db_xref="UniProtKB/TrEMBL:A0A454W7A1" + /gene_functions="regulatory (smcogs) + SMCOG1041:transcriptional regulator, SARP family (Score: + 320; E-value: 6.6e-97)" + /gene_kind="regulatory" + /locus_tag="JK1GL000056" + /note="GO_function: GO:0003677 - DNA binding; GO_function: + GO:0005515 - protein binding; GO_process: GO:0000160 - + phosphorelay signal transduction system; GO_process: + GO:0006355 - regulation of transcription, DNA-templated" + /product="AfsR/SARP family transcriptional regulator" + 
/protein_id="ncbi_JK1GL000056" + /transl_table=11 + /translation="MIRAGGCGIGCFPGKGEMEFRILGSVQIHDERFGVRVVPAGAKQR + ALLGALLVRAGQAVPAECLVEELWGGQPPVNAANALQAHVARLRRLLPAPGPGGPRHVW + LRTSPLGYTLSLGPAVTDAQRFHRLVGQGRELAATAPGRAVEVLREGLALWRGPALQGS + GQGPICSAEAALLEESRLRALEVLYDVCLRADRCAEITGELEELVAVHPLRERFHEQLM + TALHRCGRRAEALSTYDRARRRLARDLGIGPGQVLSRRREAILRSCEPAADSADRAGAG + TAGQGGDELGVLREELVRLRGHVELLRRQQRELSEQVARLTAHHPCGP" + CDS complement(53334..54149) + /codon_start=1 + /db_xref="COG:COG3629 DNA-binding transcriptional activator + of the SARP family" + /db_xref="UniProtKB/Swiss-Prot:P25047 Regulatory protein + DnrI" + /db_xref="UniProtKB/TrEMBL:A0A399CPF0" + /gene_functions="regulatory (smcogs) + SMCOG1041:transcriptional regulator, SARP family (Score: + 316.1; E-value: 9.8e-96)" + /gene_kind="regulatory" + /locus_tag="JK1GL000057" + /note="GO_function: GO:0003677 - DNA binding; GO_function: + GO:0005515 - protein binding; GO_process: GO:0000160 - + phosphorelay signal transduction system; GO_process: + GO:0006355 - regulation of transcription, DNA-templated" + /product="MULTISPECIES: AfsR/SARP family transcriptional + regulator" + /protein_id="ncbi_JK1GL000057" + /transl_table=11 + /translation="MDIEVLGALSVREHGVSVVPTAPKPRQVLALLALNADQVVPVAAL + VDELWGENPPRSARTTLQTYVLQLRELMAQALAHGPDERCTAKDILATVPGGYRLQTRG + GHVDYREFDQRAGLGYRAMDAEDYAGAARRLADALALWNGQALTDIQAGLRIDTEVKRL + EEARLCALDQRIEADLRLGRHRELLSELTVLVNQYRMHESLHGQFMLALHRSGRRGEAL + NVYQRLRSTLVHELGLEPSAALSRLQRSILMARPETPAAAGGSGRLVTR" + protocluster 53334..62701 + /aStool="rule-based-clusters" + /category="other" + /contig_edge="False" + /core_location="[70693:71686](+)" + /cutoff="20000" + /detection_rule="AfsA" + /neighbourhood="5000" + /product="butyrolactone" + /protocluster_number="2" + /tool="antismash" + proto_core 57418..58410 + /aStool="rule-based-clusters" + /tool="antismash" + /cutoff="20000" + /detection_rule="AfsA" + /neighbourhood="5000" + /product="butyrolactone" + /protocluster_number="2" + cand_cluster 53334..62701 + 
/candidate_cluster_number="2" + /contig_edge="False" + /detection_rules="AfsA" + /kind="single" + /product="butyrolactone" + /protoclusters="2" + /tool="antismash" + mRNA complement(53334..54149) + /locus_tag="JK1GL000057" + /note="MULTISPECIES: AfsR/SARP family transcriptional + regulator" + gene complement(53334..54149) + /locus_tag="JK1GL000057" + mRNA complement(54551..55162) + /locus_tag="JK1GL000058" + /note="helix-turn-helix transcriptional regulator" + gene complement(54551..55162) + /locus_tag="JK1GL000058" + CDS complement(54551..55162) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A454W7A3" + /gene_functions="regulatory (smcogs) SMCOG1057:TetR family + transcriptional regulator (Score: 65.9; E-value: 1.1e-19)" + /gene_kind="regulatory" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000058" + /note="GO_function: GO:0003677 - DNA binding" + /product="helix-turn-helix transcriptional regulator" + /protein_id="ncbi_JK1GL000058" + /transl_table=11 + /translation="MRTREALIRSAAEIFHDEGFHAAALTTISSRAGVSNGALHFHFAS + KAALADAVEEAAADVLRAVCGRWDGGPPGVLQCLVNATHELACALQNDVVLRAGFELSR + EAGRQPRTDLRLCWQNWVTDMVGRAGRGGELRESVAPESAVAAVVAATSGFEVLGMRNQ + AWLSRSTVAQFWLLLLPALAPAPHAGLWQAEGSWTGTATG" + mRNA complement(55195..56883) + /locus_tag="JK1GL000059" + /note="propionyl-CoA carboxylase beta chain" + gene complement(55195..56883) + /locus_tag="JK1GL000059" + CDS complement(55195..56883) + /EC_number="6.4.1.3" + /EC_number="2.1.3.15" + /codon_start=1 + /db_xref="COG:COG4799 Acetyl-CoA carboxylase, + carboxyltransferase component" + /db_xref="UniProtKB/Swiss-Prot:I3R7F1 Propionyl-CoA + carboxylase, carboxyltransferase subunit" + /db_xref="UniProtKB/TrEMBL:A0A2W6PRG9" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1059:acetyl-CoA carboxylase, carboxyl transferase, + (Score: 732.8; E-value: 3.8e-222)" + /gene_kind="biosynthetic-additional" + /locus_tag="JK1GL000059" + /note="GO_function: GO:0016874 - ligase activity" + /product="propionyl-CoA carboxylase 
beta chain" + /protein_id="ncbi_JK1GL000059" + /transl_table=11 + /translation="MRAELPEPKPHRWFVTVKRRPGRAMREGQIVTILNDIPRVALPAE + PADARGRVAELHGVRAQALAGPSEKATAAQHAKGKLTARERIELLLDAGSFREVEQLRR + HRATGFGLEARKPYTDGVITGWGTVEGRTVFVYAHDFRIFGGALGEAHATKIHKIMDMA + IAAGAPLVSLNDGAGARIQEGVSALAGYGGIFQRNTRASGVIPQISVMLGPCAGGAAYS + PALTDFVFMVRDTSQMFITGPDVVKAVTGEEITQNGLGGADVHAETSGVAHFAYDDEET + CLAEVRYLLSMLPQNNREFPPCTPCSDPQSRRSEALLDLVPADGNRPYDMARVIEEIVD + DGEYLEVHEGWARNIICALARLNGQVVGIVANQPQALAGVLDIEASEKAARFVQMCDAF + NIPLVTFLDVPGFLPGVDQEHGGIIRHGAKLLYAYCNATVPRISLILRKAYGGAYIVMD + SQSIGADLTYAWPTNEIAVMGAEGAANVIFRRQIAEAEDPDAVRARMVKEYRAELMHPY + YAAERGLVDDVIDPAETREVLIESLAMLRTKDADVPSRKHGNPPQ" + mRNA complement(56915..57121) + /locus_tag="JK1GL000060" + /note="MULTISPECIES: acyl-CoA carboxylase subunit epsilon" + gene complement(56915..57121) + /locus_tag="JK1GL000060" + CDS complement(56915..57121) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A454W782" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000060" + /product="MULTISPECIES: acyl-CoA carboxylase subunit + epsilon" + /protein_id="ncbi_JK1GL000060" + /transl_table=11 + /translation="MAEPERAVPAVRIERGRAGAEELAALTAVLYALTARRDEGPGGRE + RSGAAPWRPGHRAGAYRSPYCWR" + mRNA 57418..58410 + /locus_tag="JK1GL000061" + /note="2-oxo-3-(phosphooxy)propyl 3-oxoalkanoate synthase" + gene 57418..58410 + /locus_tag="JK1GL000061" + CDS 57418..58410 + /EC_number="2.3.1.277" + /codon_start=1 + /db_xref="UniProtKB/Swiss-Prot:P18394 putative A-factor + biosynthesis enzyme" + /db_xref="UniProtKB/TrEMBL:A0A454W7E0" + /gene_functions="biosynthetic (rule-based-clusters) + butyrolactone: AfsA" + /gene_kind="biosynthetic" + /locus_tag="JK1GL000061" + /product="2-oxo-3-(phosphooxy)propyl 3-oxoalkanoate + synthase" + /protein_id="ncbi_JK1GL000061" + /sec_met_domain="AfsA (E-value: 3.3e-24, bitscore: 83.5, + seeds: 34, tool: rule-based-clusters)" + /transl_table=11 + /translation="MATSAFPATHPALGQEPVLPAGTPRLRPSLFRYPNLTTTVPKELV + 
HRAAVAEVMLTDWERVDDTRFKVAAQWPRGHSFFTPIDGRYHDPLIAAETIRQVGSLLG + HAEFGVPFGHHYLLHDLSLRVDPHHLMIHQAPASLDLDVTCEDLKMRGGRLAALRYEAV + VRRDGHTAATGVFSFSCVSPTVYRRLRPPHVFADGHRPLPLTAPAAPQSVGRMSPADVV + LSPTEDPHRWQLRLDTQHPVLFDHPGDHVPGMVLLEAARQAAAGALGRTSLLPLGLTSE + LVQYAELDIPCIIEAAPHPTHSPGLTTVHITGHQRGQTVFTCTVTAADA" + mRNA complement(58433..59041) + /locus_tag="JK1GL000062" + /note="NAD(P)H-binding protein" + gene complement(58433..59041) + /locus_tag="JK1GL000062" + CDS complement(58433..59041) + /EC_number="1.3.1.113" + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A454W7B3" + /gene_functions="other (smcogs) SMCOG1199:NmrA family + protein (Score: 192.5; E-value: 1.8e-58)" + /gene_kind="other" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000062" + /product="NAD(P)H-binding protein" + /protein_id="ncbi_JK1GL000062" + /transl_table=11 + /translation="MRAAADAGVEHVVKLSAAAVEDAGADDLITRWQRESEELLRSSGL + AWTLLRPRSFMSNSLGWAAEVRAEGVVRELFGASLNACVDPGDVAEVAVRALTGPGHAG + RAYVLTGPEAVSAVQRTARLSCVLGRPLRFEELGWEEARARWGRRYPPAVVEALLRSAV + RQREGAKAGVDGTFARLVGRPARSFGQWAADHVAGFSGR" + mRNA 59436..60077 + /locus_tag="JK1GL000063" + /note="TetR/AcrR family transcriptional regulator" + gene 59436..60077 + /locus_tag="JK1GL000063" + CDS 59436..60077 + /codon_start=1 + /db_xref="COG:COG1309 DNA-binding transcriptional + regulator, AcrR family" + /db_xref="UniProtKB/TrEMBL:A0A454W784" + /gene_functions="regulatory (smcogs) SMCOG1057:TetR family + transcriptional regulator (Score: 89.2; E-value: 7.5e-27)" + /gene_kind="regulatory" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000063" + /note="GO_function: GO:0003677 - DNA binding" + /product="TetR/AcrR family transcriptional regulator" + /protein_id="ncbi_JK1GL000063" + /transl_table=11 + /translation="MPAQERAIRTRQNIMLAAATVFNERGYKAATIADILTTAGVTKGA + LYFHFPSKDDLAQEVLATQNRNLTIPERPSKTQELIDVVMLHTHRLQTDPMVRAAVRLT + MDQLSTEFDRTGPFRQWADLTRQRLEQARDQGELLPHVNPTETADVLVGAYAGIQSMSH + ALTDYTDLTTRANALLRHLLPTITLPSILTSLDLNENRGAHVYTEIHTTT" + 
mRNA complement(61157..62014) + /locus_tag="JK1GL000064" + /note="hypothetical protein" + gene complement(61157..62014) + /locus_tag="JK1GL000064" + CDS complement(61157..62014) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A454WJI8" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000064" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000064" + /transl_table=11 + /translation="MKAGAIVVAAVTGSVVLSGCGDGDGSQAKRDGVSPSASSSAGTQE + QGTVEVRAAYDKTAEAESARMTIKMKLAAEGKTITSDGKGVLDLAEGDSVMTLTVQDKT + IEQRVVDQVLYQKIPGEKALGGKPWIKIDLEKVAAQQGLSNQQIGDPAQTAAYARAITN + KDVTKAGTEEIDGANTTQYKVSVDVSKLPGGEQLSKQVGPTLPMHVWLDDKGRLRRQQI + EMTLKAPASASAKPEGSASPQQLQMSTVMEFSDFGTEVNAEAPPAGQVADMTDQSLQGS + QQHS" + mRNA 62297..62701 + /locus_tag="JK1GL000065" + /note="hypothetical protein" + gene 62297..62701 + /locus_tag="JK1GL000065" + CDS 62297..62701 + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A2A2DC84" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000065" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000065" + /transl_table=11 + /translation="MNVQVPADPSGRLLWASPALPGAVHDVRAAREHDIVRKLTDAGIT + CWTDKGYRGAGGTVRVPLGPSGDTSRGQKDVNRSHAKKWVLVEQAAATLNAWRLLRNLR + CSTSGVTSLVRSVVTVHLASTDGKGSMTTF" + mRNA complement(63194..66505) + /locus_tag="JK1GL000066" + /note="MULTISPECIES: Wall-associated protein" + gene complement(63194..66505) + /locus_tag="JK1GL000066" + CDS complement(63194..66505) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A429NJW2" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000066" + /product="MULTISPECIES: Wall-associated protein" + /protein_id="ncbi_JK1GL000066" + /transl_table=11 + /translation="MWRDRRTHRTALVSAITAAAVVIAAAPGLAATPKPELPEPESPWT + KPTKVEAPATPAGTVKAPTSEAEAKPSAEVAAWRAAQKARAAGAERAKTSASRSAAVDA + AVAGYVPEGQGEVPWHQILDTRLNDALVARVNVSNGNLMLAATDFDIAGVGQKLQLTRT + YNSLEAPWGKVSQRWWQAYERYLQINDGEVDVFDTTGSLLRFTANADGTYTTPTGYSKD + LKKNADGTYTLTDRKSGTKDTYNEHGTLTKVTDKNKGTITVDQHDEGAEHKGFKLTETR + 
SGRWIDLVKTDASQWQAKDHTGRTAVLDLDAAGNLAKVTDTTGKATAYEYDSSRRLTKV + TTPEGTVTLFTYDSHNRVTSMQRATGTSGSGHTGPTWRYDYTAATPSDAGTTTVTDPDG + DETIYTHNADGEVTKVTDPLGHSRHATYKNHLTQTAIDAMGTGTDGTGGNTTTYGWDDR + NNPVSQKLPMGATASVSAYQTIAGTDLPSDMTGANGRKDSFKYDTNGNTLSVTTSGTAG + TTREYTYNKDTPTCGGFEGQRCTAKDGNGKVTSFTYDDQGNLIKVTPPAPLGETTYTYD + ALGRVETVKDGRGITTVYAYDSRDRVHEVSSTNFTVTYSYDGDGNVKSRTDASGTTKWD + YDKLNRESVRTLQNGAQTALAYTPGGDVDFYTDPTGTTDYTWDKAGRLDYLTAPDGKKT + DFDYNNNDKRTKTVYPGGTTQTVTIDKNGRPQAIKTTSGTQTFVDLTYSYANAGKDTTK + IRTRTDNLTKLKTTYTYDSQDRLSYALEADAAGTRKASWLYCWDKAGNLTSRDGSKNTC + PGGTTYTYNDASELTGKNGSTTGWSYDKLGNETAAADNTPRTDESWTDYSQLSGITAGG + KTYDLVHAGTTNAERTKLGSTWFHHTALGLASTTTNGVDTGFIREPAGTLNSMTTGGKS + YYYLTDATGNVLGLADDTGKRTHTYTYGPTGLPRTTPTEAVPQPYRYAGAYADPTGLYK + MGHRYYDPTLGRFTQPDPSGQETNPYLYAAGDPINNMDPSGLGFLDSVSNFLEDTNDIW + GAVTGCVAGVGAAAETGIIAAASTFGPWGTAGAVVTSCAVGGVLGYNNAEIITYG" + mRNA 67026..67361 + /locus_tag="JK1GL000067" + /note="hypothetical protein" + gene 67026..67361 + /locus_tag="JK1GL000067" + CDS 67026..67361 + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A429NJP0" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000067" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000067" + /transl_table=11 + /translation="MKDAPAMSTPGRHTPCSRSSRHHVPAQRLTRFVQQAGRLLCWSLT + AGMTTAALDLLITPEAAWWHMMWPLPWYLTCLSAPLWATLRAHEKAAHQQAPEEDNDIP + CEWEQAA" + mRNA complement(67729..67908) + /locus_tag="JK1GL000068" + /note="hypothetical protein" + gene complement(67729..67908) + /locus_tag="JK1GL000068" + CDS complement(67729..67908) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A454W205" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000068" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000068" + /transl_table=11 + /translation="MQVAWRAGEMSGVTVVFVAACALWLVLWRRRTGRGCLAWPLVVLL + CGATGVLIMAAMAG" + mRNA complement(67919..68248) + /locus_tag="JK1GL000069" + /note="hypothetical protein" + gene complement(67919..68248) + /locus_tag="JK1GL000069" + CDS 
complement(67919..68248) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A1Y2PQM0" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000069" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000069" + /transl_table=11 + /translation="MDESKMPEETPLMGPDGKVVKEANGKTLMVKTRVEFSESEAPMFG + PRAGEKRSVSTDAEGRETEIIEAVPSVPPAQGRKELGSRTMMSRLLEAVCALTMRARCA + PRMGR" + mRNA complement(68739..68951) + /locus_tag="JK1GL000071" + /note="hypothetical protein" + gene complement(68739..68951) + /locus_tag="JK1GL000071" + CDS complement(68739..68951) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A1A9CFR1" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000071" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000071" + /transl_table=11 + /translation="MRLRAYAILCIYALMLVNGIPRIADAPFETVMACSSVGFGFAAAA + AVLFLLSARKDSSARTAGPVAPWEG" + mRNA 68965..69090 + /locus_tag="JK1GL000070" + /note="hypothetical protein" + gene 68965..69090 + /locus_tag="JK1GL000070" + CDS 68965..69090 + /codon_start=1 + /locus_tag="JK1GL000070" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000070" + /transl_table=11 + /translation="MRIHGGVHPASIATGIGSMSVVDTASAIQWYSGFPFIPTPS" + mRNA complement(69802..70122) + /locus_tag="JK1GL000072" + /note="hypothetical protein" + gene complement(69802..70122) + /locus_tag="JK1GL000072" + CDS complement(69802..70122) + /codon_start=1 + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000072" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000072" + /transl_table=11 + /translation="MAFNVYKAAQWAMESHKGKGLIAGNRLDQDEVIAPERIPGIDAEV + IKNFRTMSEATERGVGQVLDSSKWTILVNDAWLLGGAHYMAQVVETVYGRPRQSMVCAF + SR" + mRNA 70261..70440 + /locus_tag="JK1GL000073" + /note="hypothetical protein" + gene 70261..70440 + /locus_tag="JK1GL000073" + CDS 70261..70440 + /codon_start=1 + /locus_tag="JK1GL000073" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000073" + /transl_table=11 + 
/translation="MSALLGSVAFPADNRRHADIARTYVASVRPRPGGGEIVLKLGDSL + LKPGVLDAWAPSGQ" + misc_feature 70270..70272 + /note="tta leucine codon, possible target for bldA + regulation" + /tool="antismash" + mRNA 70614..71384 + /locus_tag="JK1GL000074" + /note="hypothetical protein" + gene 70614..71384 + /locus_tag="JK1GL000074" + CDS 70614..71384 + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A3M0I621" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000074" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000074" + /transl_table=11 + /translation="MPDAALEALGGWWGQNAVRLTDGTPGAHTVRYTPSRWAHITTWPS + MMASTFQAGDADVSRTQVASIVADALERGACEEALVATYVWGKGKGGSPAGSGPATLHK + ILLGTEGLNAILASVVNTLREQDAEAAYAELRGRIAGFGPSFYSKFLYFAGKSVRAASG + TQPLILDQVLARRMRSLAQAVGRETGYDPDGSIARWVWRDTNWSPHRYAIYLSFMQAAS + RQVAATHSWPSNATPDLLEYALFTTSWVESAEAT" + mRNA complement(72274..73149) + /locus_tag="JK1GL000075" + /note="SDR family oxidoreductase" + gene complement(72274..73149) + /locus_tag="JK1GL000075" + CDS complement(72274..73149) + /EC_number="1.1.1.340" + /NRPS_PKS="Domain: PKS_KR (8-160). E-value: 1.8e-07. Score: + 23.0. 
Matches aSDomain: + nrpspksdomains_JK1GL000075_PKS_KR.1" + /NRPS_PKS="type: other" + /codon_start=1 + /db_xref="COG:COG4221 NADP-dependent 3-hydroxy acid + dehydrogenase YdfG" + /db_xref="UniProtKB/Swiss-Prot:Q82IY9 + 1-deoxy-11-beta-hydroxypentalenate dehydrogenase" + /db_xref="UniProtKB/TrEMBL:A0A454WJJ0" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1001:short-chain dehydrogenase/reductase SDR (Score: + 168.7; E-value: 2.7e-51)" + /gene_functions="biosynthetic-additional (t2pks) KR (Score: + 103.5; E-value: 3.6e-32)" + /gene_kind="biosynthetic-additional" + /locus_tag="JK1GL000075" + /note="GO_function: GO:0016491 - oxidoreductase activity" + /product="SDR family oxidoreductase" + /protein_id="ncbi_JK1GL000075" + /transl_table=11 + /translation="MNWPTGEAALVTGAASGIGFGVAHALVAAGAKVALVDIDEARLAG + AEQSLRDAGGTVLALPFDISETDRWESMADRAEEALGPISILCNVAGVNGGTTVDRTPL + QVWRWVHGVNVDAQFASVAAFLPRFKSRGGRSHIVNTSSISGLIPMAGVAAYTSSKFAS + VGLSMALREELAGTHVGVSLLVPGAVATPINFNAGAAEAKLLGREMDAAVVEKNSALLL + QGADPGRVGEQVVEAMQQGQFMVVTHREWGPFAAHVHREIERAYEEFDGRHGPDPVATA + MAAGEETISS" + aSDomain complement(72670..73125) + /aSDomain="PKS_KR" + /aSTool="nrps_pks_domains" + /database="nrpspksdomains.hmm" + /detection="hmmscan" + /domain_id="nrpspksdomains_JK1GL000075_PKS_KR.1" + /evalue="1.80E-07" + /label="JK1GL000075_PKS_KR.1" + /locus_tag="JK1GL000075" + /protein_end="160" + /protein_start="8" + /score="23.0" + /specificity="KR activity: inactive" + /specificity="KR stereochemistry: C2" + /tool="antismash" + /translation="ALVTGAASGIGFGVAHALVAAGAKVALVDIDEARLAGAEQSLRDA + GGTVLALPFDISETDRWESMADRAEEALGPISILCNVAGVNGGTTVDRTPLQVWRWVHG + VNVDAQFASVAAFLPRFKSRGGRSHIVNTSSISGLIPMAGVAAYTSSK" + CDS_motif complement(72676..72738) + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_JK1GL000075_0002" + /evalue="3.80E-04" + /label="PKSI-KR_m4" + /locus_tag="JK1GL000075" + /protein_end="158" + /protein_start="137" + /score="13.0" + /tool="antismash" + 
/translation="IVNTSSISGLIPMAGVAAYTS" + CDS_motif complement(73054..73122) + /aSTool="nrps_pks_domains" + /database="abmotifs" + /detection="hmmscan" + /domain_id="nrpspksmotif_JK1GL000075_0001" + /evalue="1.50E-03" + /label="PKSI-KR_m1" + /locus_tag="JK1GL000075" + /protein_end="32" + /protein_start="9" + /score="11.2" + /tool="antismash" + /translation="LVTGAASGIGFGVAHALVAAGAK" + mRNA complement(73386..73754) + /locus_tag="JK1GL000076" + /note="hypothetical protein" + gene complement(73386..73754) + /locus_tag="JK1GL000076" + CDS complement(73386..73754) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A454WJH3" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000076" + /note="GO_function: GO:0003677 - DNA binding; GO_process: + GO:0006355 - regulation of transcription, DNA-templated" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000076" + /transl_table=11 + /translation="MALRLTDASTPAVDAADLGAMLLLAQTYDPEHPHEDVRALARLDR + RSADVLRTLVEADSVRSAAAELGMHHSTVQARHEALTHTLGYDPRSNVGRMRYIAAALL + LRLTDPVPPTRPGSPWNT" + mRNA complement(73739..74398) + /locus_tag="JK1GL000077" + /note="hypothetical protein" + gene complement(73739..74398) + /locus_tag="JK1GL000077" + CDS complement(73739..74398) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A454WJI3" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000077" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000077" + /transl_table=11 + /translation="MHQLVGRLNSLDPQAGETLRIVSYFDVLITRGAGLDGLLRGAAVL + SGTVAGAKIRGRVTRRDPDGHPVTDDADRRRHSSRRSHADWTVWLERDGEPEPADEMIV + ERLALGVELLDARRSPERGLDAIVDQARSVAERTALLAKRRIDPATPVRVLATAADAPE + ISEAPSAIVPTRYGLLRATLDLSGTIRRPPEPVGFGTRYEPTGPPNPGRRRSWRSD" + mRNA complement(74528..75133) + /locus_tag="JK1GL000078" + /note="acetyl esterase" + gene complement(74528..75133) + /locus_tag="JK1GL000078" + CDS complement(74528..75133) + /EC_number="3.1.1.-" + /codon_start=1 + /db_xref="COG:COG0657 Acetyl esterase/lipase" + /db_xref="UniProtKB/TrEMBL:A0A0N0YWT6" + 
/gene_functions="biosynthetic-additional (smcogs) + SMCOG1066:alpha/beta hydrolase domain-containing protein + (Score: 140.4; E-value: 1.1e-42)" + /gene_kind="biosynthetic-additional" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000078" + /note="GO_function: GO:0016787 - hydrolase activity" + /product="acetyl esterase" + /protein_id="ncbi_JK1GL000078" + /transl_table=11 + /translation="MVSGDQFSGLVQALPWVIEHDAVLVTVDYRLAPEHPDPYPVEDCY + AGLLWTAEHARELGMDPDRLIIAGQSAGGGLAAGVALMARDRQGPALIGQVLMYPMLDD + RDRTVSSAQFDAVGVWDRGSNVMGWTALLGERRGTDDVSAYALPHAPPISRDCHPRSST + AARPRCSGTRTSLTRRPCGTRAYRPNSTSGPVASTGSA" + mRNA complement(75120..77789) + /locus_tag="JK1GL000079" + /note="hypothetical protein" + gene complement(75120..77789) + /locus_tag="JK1GL000079" + CDS complement(75120..77789) + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A2R2WDT7" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1066:alpha/beta hydrolase domain-containing protein + (Score: 200.2; E-value: 7e-61)" + /gene_kind="biosynthetic-additional" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000079" + /note="GO_function: GO:0008270 - zinc ion binding; + GO_function: GO:0016491 - oxidoreductase activity; + GO_function: GO:0016787 - hydrolase activity; GO_process: + GO:0055114 - oxidation-reduction process" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000079" + /transl_table=11 + /translation="MPTHPRPPFHPEAEAALTALAEPMPAVTPGAIPVLRQAALPVVSD + KTLLAAGVTRRDVTVPGHHGAELVASVIARSGHTGTGPGIYHIHGGGMIAGERVIGVSQ + ILPWIVEHDAVAVTVEYRLAPEFPDPCPVEDCYAGLVWTAEHAAELGIDPGRLIIAGAS + AGGGLAAGTALLARDRKGPALIGQVLICPMLGDRDRTVSSPQYEDAGRWVRESNRTGWA + ALLGDRCGTDEVSVYAAPARASDLEGLPPAFIDCGSAEVFRDEDAAYANALMELRRAGR + AACMARRLPRIRHARAGLRHRTGSDRGPERMSRPHSRRTVSGHERAVSRAVASAVLDRT + ERGVGTPGGARRDGPRRQERPPVTGGHGTGKRRRNMKAARFYGREDIRIEEAAEPSPGP + GQVKLRNAFAGICGSDLHFFFYPESLPFSLDEPHPLTGATLPQILGHEFSGTVVETGEG + VTDVRVGDRCAVFPLAVSCGKCAACRRGLPFSCPLMGSLGSNVEGGGLSEFTVCEASKV + 
HVLPDGVDLRMGALVEPMAVGWHAVARSGVRPGGSALVAGAGPIGIGTWFAFKARGVEK + VLVSEPSEDRRAIMAALGARVIDPVNEDLADAVASLTDGDGVDAAVDAAGAGAAVTSAM + AGLVPGGRLVVAALHEHTMDFQPTRLMMGETEIVGAVGYRPEEFDEVIAAMADGFYTPP + AGCGNCRWRALSTPSTRCATASAGRPFCAWAEAPEHSGTDGSRVLSVPGCARPVRTRRA + SGGGHGPRLRRSAVRHEAAHPARLMYTATMRCGRTRSSHVQQRSAPPVRPGARGRTRGP + RGPDPADPDRGHDPRHAPGGTGRGHRRDARDLRSDPTRRHDPGVPGRRNHRLCDRPGGS + SGARAGDLPHARRRHGLR" + mRNA 78186..78578 + /locus_tag="JK1GL000080" + /note="MULTISPECIES: SDR family NAD(P)-dependent + oxidoreductase" + gene 78186..78578 + /locus_tag="JK1GL000080" + CDS 78186..78578 + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A454WJI7" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000080" + /product="MULTISPECIES: SDR family NAD(P)-dependent + oxidoreductase" + /protein_id="ncbi_JK1GL000080" + /transl_table=11 + /translation="MALADIDEERLDDDAKKPAGAGGTAMAVPLDVSDADSSAAAADRA + EEALGPISILRSNPAAPTSRSEPASSTFARMKGILRDFRLKGNSAHYAMLSIARLHNLA + LTGERTLRTAGHLTRVHWEIISGTAL" + mRNA complement(78575..79306) + /locus_tag="JK1GL000081" + /note="MULTISPECIES: class I SAM-dependent + methyltransferase" + gene complement(78575..79306) + /locus_tag="JK1GL000081" + CDS complement(78575..79306) + /EC_number="2.1.1.156" + /codon_start=1 + /db_xref="COG:COG2226 Ubiquinone/menaquinone biosynthesis + C-methylase UbiE" + /db_xref="UniProtKB/TrEMBL:A0A454WJJ2" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1248:methyltransferase (Score: 127.7; E-value: + 8.5e-39)" + /gene_kind="biosynthetic-additional" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000081" + /product="MULTISPECIES: class I SAM-dependent + methyltransferase" + /protein_id="ncbi_JK1GL000081" + /transl_table=11 + /translation="MYEWLIGDDRLTPAKAAAVYYSDVVGSVPPSARVLDCACGTGQLA + VGLASLGLDVVAADASDGMVRRTEKAADEQGVSLRALHARWDELPDHLEDSTFDLVFCV + GNSLGHAEGAAGRLAALAAMSRLLKPGGRLVLHSRNWELVRSAGSRVDVRDRLVRRNDR + DAVVSYYWQIEQRWEQEHFLEIVVAQIEPDGAVRACSERLSIWPYRYEDLVVQLRSVGL + RVESTTFDPESDGYLMVASRD" + mRNA 
complement(79932..80435) + /locus_tag="JK1GL000082" + /note="MULTISPECIES: GNAT family N-acetyltransferase" + gene complement(79932..80435) + /locus_tag="JK1GL000082" + CDS complement(79932..80435) + /codon_start=1 + /db_xref="COG:COG3153 Predicted N-acetyltransferase YhbS" + /db_xref="UniProtKB/TrEMBL:A0A454WJI5" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000082" + /note="GO_function: GO:0008080 - N-acetyltransferase + activity" + /product="MULTISPECIES: GNAT family N-acetyltransferase" + /protein_id="ncbi_JK1GL000082" + /transl_table=11 + /translation="MVRLAQYTKADQEEILGNSDDPFGVAWTGLTWLPKEEHFGIRHHG + RLVAHAGLLRLPVAISDAETEVVGVGGVAVSPAMQGQGFARLVVTAALEHARTMGPQHA + LLFCRPPLVSLYQRLGWHPLDKDVLVEQPEGRLVTMPLRTMVTPLLDDARWPSGPVRLF + SLPM" + mRNA 80441..81022 + /locus_tag="JK1GL000083" + /note="hypothetical protein" + gene 80441..81022 + /locus_tag="JK1GL000083" + CDS 80441..81022 + /codon_start=1 + /db_xref="COG:COG1309 DNA-binding transcriptional + regulator, AcrR family" + /db_xref="UniProtKB/TrEMBL:G2GK72" + /gene_functions="regulatory (smcogs) SMCOG1215:TetR family + transcriptional regulator (Score: 94; E-value: 2.1e-28)" + /gene_kind="regulatory" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000083" + /note="GO_function: GO:0003677 - DNA binding" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000083" + /transl_table=11 + /translation="MPQWTGSQTYPHDDLSADHWPECRARDGSPGSLAAVTAGLVGLRL + IQAHAGRLFTDHGYDAVTVADVAKAAGVSSMTVYRNFPTKGDLVLIDQPAQLIAEHVAA + SSATQPLVRRIGSALIDAATASTSGNGDEQAADERFLLDCLRLMVSTPALRPRHLDSQY + ALQQAIVEALGKDAADPDAAFRAEARERHR" + misc_feature 80567..80569 + /note="tta leucine codon, possible target for bldA + regulation" + /tool="antismash" + mRNA complement(81216..81332) + /locus_tag="JK1GL000085" + /note="hypothetical protein" + gene complement(81216..81332) + /locus_tag="JK1GL000085" + CDS complement(81216..81332) + /codon_start=1 + /locus_tag="JK1GL000085" + /product="hypothetical protein" + 
/protein_id="ncbi_JK1GL000085" + /transl_table=11 + /translation="MRARVAAGMICAVACRRPRSGRISITQKMPRKAPPPWS" + mRNA 81456..81854 + /locus_tag="JK1GL000084" + /note="hypothetical protein" + gene 81456..81854 + /locus_tag="JK1GL000084" + CDS 81456..81854 + /codon_start=1 + /db_xref="UniProtKB/TrEMBL:A0A101MYS4" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000084" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000084" + /transl_table=11 + /translation="MVRRRRRPAGAAPRPPARTPVGSEGQLAGNWRGADGSVLQLAPGG + QAELTRVPAHNDVDEDGDFSLCDGTGTWTREEGNDFQNTDRDGVLVHLDDECGQETYWT + IGGTELKPELFVLFGDPDTGELRILTQP" + mRNA 82128..82394 + /locus_tag="JK1GL000086" + /note="hypothetical protein" + gene 82128..82394 + /locus_tag="JK1GL000086" + CDS 82128..82394 + /codon_start=1 + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000086" + /product="hypothetical protein" + /protein_id="ncbi_JK1GL000086" + /transl_table=11 + /translation="MPWNGYGEQRAMADLTPRHHRGRSAHRQSAQVVVCPGAAPAVGVE + DRAVQGEAVAGVGGLGVVEQDQVQPVTPELLVVVRVGGSGPGR" + mRNA complement(82569..83279) + /locus_tag="JK1GL000087" + /note="MULTISPECIES: alpha/beta hydrolase" + gene complement(82569..83279) + /locus_tag="JK1GL000087" + CDS complement(82569..83279) + /codon_start=1 + /db_xref="COG:COG0596 Pimeloyl-ACP methyl ester + carboxylesterase" + /db_xref="UniProtKB/TrEMBL:A0A454WJG9" + /gene_functions="biosynthetic-additional + (rule-based-clusters) Abhydrolase_6" + /gene_functions="biosynthetic-additional + (rule-based-clusters) PF00561" + /gene_functions="biosynthetic-additional (smcogs) + SMCOG1036:alpha/beta hydrolase fold protein (Score: 90.9; + E-value: 1.9e-27)" + /gene_kind="biosynthetic-additional" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000087" + /product="MULTISPECIES: alpha/beta hydrolase" + /protein_id="ncbi_JK1GL000087" + /sec_met_domain="Abhydrolase_6 (E-value: 2.4e-16, bitscore: + 59.7, seeds: 455, tool: rule-based-clusters)" + /sec_met_domain="PF00561 
(E-value: 5.3e-13, bitscore: 47.9, + seeds: 48, tool: rule-based-clusters)" + /transl_table=11 + /translation="MFLHYWGGSARTWDLVVDRLSGRDVLTVDFRGWSRSSALPGPYTL + GQFADDTLAVLADAGITDYILVGHSMGGKVAQLVAAARPAGLRGMVLVGSAPARPAAQV + TPEYQQALSHAYDCAESVAGARDHVLTATELPEPVKAQIVTDSRTVTDAARTEWPLHGI + TQDITEHTRTVSVPVLVVAGEHDQVEPVGVLRDNLVPYLSHADFVVIPHTGHLIPLEAP + ANLVDAITAFAPTA" + mRNA 83457..84281 + /locus_tag="JK1GL000088" + /note="MULTISPECIES: AraC family transcriptional regulator" + gene 83457..84281 + /locus_tag="JK1GL000088" + CDS 83457..84281 + /codon_start=1 + /db_xref="COG:COG2207 AraC-type DNA-binding domain and + AraC-containing proteins" + /db_xref="UniProtKB/TrEMBL:A0A454WJH6" + /gene_functions="regulatory (smcogs) SMCOG1260:AraC family + transcriptional regulator (Score: 44.3; E-value: 2.8e-13)" + /gene_kind="regulatory" + /inference="similar to DNA sequence:INSD:" + /locus_tag="JK1GL000088" + /note="GO_function: GO:0003677 - DNA binding; GO_function: + GO:0003700 - DNA-binding transcription factor activity; + GO_function: GO:0043565 - sequence-specific DNA binding; + GO_process: GO:0006355 - regulation of transcription, + DNA-templated" + /product="MULTISPECIES: AraC family transcriptional + regulator" + /protein_id="ncbi_JK1GL000088" + /transl_table=11 + /translation="MSVIRQMTYQPAGRPATSVEVMTFGRLRELNDGGTQRADFHVLAV + VDAGPGSVTVDFRHYPLQDRSAVWIPPGAVHRWDDIADVAGHLVLFVPTAPVTHATREL + AASPDPAAHWGIPDADWPFVDTARSHLLFEASAPPSESRTELPEILLSALITRLHPPHA + EALTPQVFRLFRSSVEAHFRRHHDADYYARALGYAPRTLSRAVQQATGRTAKAYIVERI + VLEAKRLLAHDRLTAARCADVLGFPDASNFSAFFRRATGMRPGAWQAMMAAE" +ORIGIN + 1 gtggcggtga ccgccgacgc gacgacagtg aactggaaca tctggggcga cgtggcggtg + 61 gcggtgctgc cgcagccgta tctggacaag gtgacgcagg cgggcggcgc cccggtgctg + 121 ctgcccccgc tcgtggaggc ggtggagtcc gtgatggagc gggtggacgc cctgctgatg + 181 agcggtggcg cggacatcga cccggccctg tacggcgccc ggcccggtga gttcgtcttc + 241 ccgccgcacc cggcgcgtga cgcggcggag ctggccgccc tggccgtggc ggaacggcgg + 301 ggcatccccg tcctcggggt ctgccggggt ctgcagctga tctcgatcac 
ccgcggcggc + 361 accctcgacc agcacctgcc cgagcactcc cccgccgtgc ccggccgtta cgagccgcgc + 421 accatccggg tgaagcccga ctcgctgctg ggcggcgcgc tcggaccgtc gccgaccgtg + 481 tactgccacc accaccaggg catcgacaag ctcggcgccg ggctggtggc caccgcctgg + 541 tcggacgacg gcgtcatcga gggggcggag gccgaggacc cgtcggcgcc cttcctggcc + 601 ggtctgcaag cccacggtga actgggcgag gacaccgtcg cgctgttcga ggcgttcatc + 661 gaggcggcga aggccggacc gcgccgctga ccggccttcg ccgccggccc cggccacagc + 721 acgtgacggc cgccgcccgc ggccccgctc gatgcggggc cgcgggcggc ggccgtctgc + 781 ggtcgtcccg tgcccgggcg cgggacgccg gcgaagaccg gtccggtctc cagtgagcca + 841 ccgcaccgcg ccggcggcgc gggggatgtg accgccgcac gatgcggtgg cggcaccgga + 901 tgggacccga ccctcatctg tctgacgacg cgcgggcctc gtgtgtgacg gggcgggcga + 961 aaccggtgcc ggaccggtgt gcgccggctg gtcagacgcc ggccgcgccg acggcgtgcg + 1021 ccctgctgcc ggcggtgtcc cggccgcggc cgaaccagcg ctccagtgcc cgcccgagca + 1081 gttccacgcc gtccggggcc gcccaggcga catggccgtc ggggcgcagc agcaccgcag + 1141 cgggacggtc cccggtcacc ggctcggccc actcccccac gaccgtgcgg acccggtcgt + 1201 cccagccggc ggcggccccg cggacgcgcg cggcgtcgtc cgccgcgccg gtgaccagga + 1261 gtacaccgcg cgccgggtgg agcagttcgg cgacccgggt gcggccgccg tcctcgagca + 1321 gcagctcgtg gccgggagcc agccgcagac cgagcagcgg atggtcgccg ggacccatgt + 1381 cgtagcggat gtcgacgccg ctgacgatcc cggccaggtg ccgggcggcc tcgggcagtt + 1441 ccaccagttc acgcatgacg gcgcgcagcg gctccatctc gtcgccggtg aggtagaggc + 1501 gggtctgggc gcgggtgttg cgcatcagct tctcgccgac cgggtgccgc tcgctctcga + 1561 aggtgtcgag caggccttcg ggtgcccagc cgttgatggc cgcggccagc ttccagccga + 1621 ggttggcggc gtcctggacg ccgacgctca tgccctgtgc gccggccggc atgtggatgt + 1681 gggtggcgtc gccggcgagg aagacccggc cgctgcggta gtgctcggcc tggcgggtgg + 1741 tgtcggtgaa ggagctgatc cagcggacct ccgcgtggtg cagcgactcg ccggtcatgc + 1801 gctgccaggc gtcggcgatg tcggtgaacc tcagggcgct cttgtcctcg ggcgggcgca + 1861 ggttctcgtc gtggatgacg atccggtcca cgccgttctc caggttgaac gccatcacca + 1921 tgccgcccgg caccttctcg ccgatgggcc gctgccgcac cccggcgccg accaggtcgg + 1981 ccatgtacat gccgcgggtg 
gcgccccagc ccttgaagtc gatgcccgcc agggtccgca + 2041 ccaggctgcg tgccccgtcg cagcccacca ggtactgcgc ggtgtcctca ccgtgcccgt + 2101 ccgggccctc gtactcgacg acgacgccgt ccggcctctc ccggtagccg gtcacctcgt + 2161 ggttgcgcag gacgggcacg cccagttcct tgagccagtt ctcgaggatc tcctcggtgc + 2221 ggaactgggg tacgccgcgg acgctgaagt gattgtcgtc cagcttgccg aaatcgatgc + 2281 gtacgccgcc gaagtggccc tgggcccatt cgacgtcgcc gaagcgttcc agcagaccgc + 2341 gctgctcgaa cacctcggcc gcccggcggg tgaagccgac gccgcgcgac tccccgctgg + 2401 gtccgggcag cttgtcgtag accaccacgt ccacgccgcc gagccgcagt tcaccggcga + 2461 gcatcagccc gaccggaccg gcgccgacga cgatcgcgcc ctttgccatg tcgtactcct + 2521 catgcagatg gatggcgtga gtcagccgaa gaagtcgagc agggccccgg cgacgacctc + 2581 gggctcctcc tcgggcaggt agtgcaccga cttcgacgcc cgcaccatgc gcacgtcggt + 2641 ggcctgcgcg gtgagcttgc gctgaaggtc ctcgtaggtg aagttgccgc cgatgccgag + 2701 tacgggcatg gtcagcctgc cgtagccggc caggtcggcg atgtcctggt ggcacgcctg + 2761 gtaccagccg gtgccggccc ggatggcctg cgggctgttg taggcgtgcg cgtagatctc + 2821 gcggtcggcc tcgccgacca ggttctggtc ggcgagggag tgggcgaaca gccagtcgat + 2881 cacgtggcgc atgcggccgc acatcagctg ttccggcagc tgctggagct ggttgaccgc + 2941 ccaccaccac agggcggttc cggtcccggg ccggtacagc agccgcaggt cgtactcgct + 3001 ctcgtcgggg tgcggggtgt ccagcagtgc cagcctgcgg gtcgcttcgg ggtggttggc + 3061 ggcgaaggcg aacgccacca tggccccgat gtcgtgtccg gcgatgtcca cctgccggtg + 3121 gcccaggtgc cgcaccaggg cgtgcaggtc cgccgccatc gtcttcttgt cgtagccgcc + 3181 cgcgggcttg tccgagccgc ccatgccgcg caggtcgacg gcgatgacgc ggtgggtgcg + 3241 ggcgagctgg ggcatgacct tgcggtacgc ccaccaggtc tgcggccagc cgggcacgag + 3301 cagcaggggc cgtccgtgcc cgccggtcac gtagtgcagg cgcacgccgt tgaccgtggc + 3361 gcagcggctg cggaaaccgc cgggcaggga gcgggccagt tcgctgtcgg agggcacgga + 3421 gccggtgtgt tcgcgggcgt gggcggcagt ggcggtgccc gtcatggcga gggccgtcgc + 3481 tcctgtgccc agggcgagca tcgtgcgtct gttcagcgtc atctacccaa gtcctcgtcg + 3541 cttcgtggcc ggtgggccaa tcaggcgcgg aaggcgccgg cgtgctggtc cgcccatacg + 3601 gtgaaggggc gggccgggtg tccggtgagc tgctcgacgt 
ggtcggtgag cggcaccggc + 3661 gccgtgctgg ccgcccacag cttcagcagc gcgtcggcga tgtcgtccgg catgaagtcc + 3721 ggcttgttgg cccgccacac ctgcgggggg atccgctcga cggggatgtc ccggcccgcc + 3781 gcggccgcga tgatcgcgac gtgctcggcg aaggtgaggg actgcggccc ggtgaggtgg + 3841 tacgaccggc cgcgcagcgc ggggtcggtg aggaccgcgc acgccgcttc cgcgatgtcg + 3901 cgctcgttga ccggatcggc gtggctgtcc gggtagggca ggcccaccgc gccgcgcgcc + 3961 ttcagcgacc acgcccaggg cagggcgttg ccggccagtg cgccgcagtt caggggcgtg + 4021 gaggtgaggg acgacgcggc gagggcctgc tcgacggcga ggtggggggc ggcgatcggg + 4081 tcgtcggcgg ctgaggggcg cagcacggcg tcggcggaca tgatcacgac gtgttccacg + 4141 ccggctttct cggcctgcgc cacgaaggcg tcgaccgccg ccggctcggc gtacaggaag + 4201 acggagtcga caccgtcgag ggcggcggcg aaatcggccg gggtgtcgag tgcgagccgt + 4261 accgactcgg tgcccgcggg cagggacagc ttctcggggt tgctggaacc ggcgcggacg + 4321 gcgacgccgc gttcgtgcag tacctgcacg agcagggagc cgaccttgcc gcggctgccg + 4381 gtgacgagga cggtcatgac agtggccttc cgggggtctg ggggcggggt gaggggcccg + 4441 gcggggtgcc ggcgcggcct gcgcggcgtc gccggtggcg gggagttcgg cggtggcggg + 4501 gtgttcggcc gtggcggggt gttcggccgt ggcggggtgt ccggcggctg ccgggcggtg + 4561 ccgccgggcg gtcggcctgc gggtggcggg ccccggtgtg cgagacggcc ggggcccggc + 4621 gggcctgcgc cggtgtcaga ccgcggccgc gccgaaccag cgggtgaggg cgtcggtcac + 4681 atcgccgccg tccggggccg cccagacgac atggccgtcg ggacgcagca gcaccgcttc + 4741 ggggccgccg tcctccgccc aggtgccggc gacgacgtcg acccggtcgg accagtcggc + 4801 ggcggtcttg tggacggtgg aggggtcgcc ggtgacgatc agcacgcccc gggcctcgtg + 4861 cagcagttcg gcgacccgga cgcgggtgcc gtcggcgcgt tgcagcgcgc gctgcagcgg + 4921 caggcgcagg cccagcagcg ggtgttcgcc ggctccgacg tcgtagcgga tgtgcaggcc + 4981 gctgacctgg ccggccagat agcgggccgc gtcggggatg cgcacgagtt cgcgcatgac + 5041 cgcgcgcagc ggctccatct cctcgccgct gaggtagagc agcgactggg cgtggacgtt + 5101 gcgcagcagc tgctcgccga gcgggtgccg ctcggcgtgg taggtgtcga ggaggccgtc + 5161 gggggcccag ccgttgatcg tcgcggccag tttccagccg aggttgacgg cgtcctggag + 5221 gccgacgctg acgccctgcg cgcccagcgg cgcgtggtcg tgggcggcgt cgccggcgag + 5281 
gaggacgcgg ccgctgcggt actgctcggc gaggccggtg gcgttggtga gggcggtcat + 5341 ccagcgggtg tggccgtggt ggatggactc gccggtcatg cgctgccagg cgtcggccac + 5401 ctcggtgaag gtcagcgtgc cctcgccgtg gtgggggcgg acgccgggct cgtggatgac + 5461 gatccggtcg tagccgtcgc ccaggccgac cgagaggacc atgccgccgc cctcgacgcg + 5521 ctccccgatg ggccgcggcc ggatgtcggc gccggtgacg tccgccaggt acatgccgcg + 5581 cgtcgcctcg tcgcccggga aggcgatgcc ggccaggcgg cgcacggtgc tgcggccgcc + 5641 gtcgcagccg atgaggtact gcgcgtggtc ctcgccgggg ccgtcggggc cgtcgtagcg + 5701 gacgacgacg ccgtcctcgg tctcctcgaa gccggtgacc tcacggccgc ggagcacggg + 5761 cacgcccagg cgggccgtcc agtcgccgag cagctgctcg gtgcgggact gggcgagccc + 5821 catcactccg aagtggctct cctccagcag ggtgaagtcg atgcggacgc cgccgaagtg + 5881 gccgtgccgg ccccagcgga attcccccag ctcgtcgagg agcccacgct ggtcgaggac + 5941 ttcggcggtg cggctggtga agccgaggcc acgcgattcc ccgctgggcg cgggcagttt + 6001 gtcgtagacg accacgtcca cgccgccgag ccgtagctca ccggcgagca tcagtccgac + 6061 cggcccggcg ccgacgacta tcgcgccctt tgccatgaag tactcctcac gcagatcgtt + 6121 ggtgaaccgc tcccgtgtgc gcggcggcag ccaggcacca ggaaagacct caccgatcga + 6181 gcggcgctgc agccggagtg cagggcctct caaaagcggc ccgccccgcc gcgggccggg + 6241 tccggggcgg ggtggcgcgg gcggtggcgg cggggcgtgt gaccaggtgt ccgtgcccgc + 6301 gggcggccgg ggtgcgggcg ccgcggcggc cgagcggggt cggtgacggc ggccgagccg + 6361 ggtcggtgac ggctccagcc ggcggcgagc ggatgccgag ccggccgccg tcaccgagcc + 6421 ggccgccgtc accgggcggg ggcgcggagg cgggcggggc ggggcggcgg gggcgccggg + 6481 gtgcgggcgc ggaacggccc cgccggttcg ggggacgacc ggcggggccg tggactgtgg + 6541 gtccggtgcc gcccgggaaa cgcccgggcg cggtggtgct acttctccgc gtcggccttc + 6601 accagggcgg ggccttcgcc cgcctcggcc ggggccgagc tcatggactg cttgccgcgg + 6661 ggcatcagga aggtgaccac cagcagcgcg accgtgccga gcatggcgcc cgagaggaac + 6721 gcgtcgtggt tggccgcctc gtggacctcg gcgatcagct cgggcttgcc gcccgtcgcg + 6781 gccatctcgg tgctcatgcc gctgtaggcg atggtcgcca cgacggccag gccgagggcg + 6841 ccgccggctt cctggctggt gttgatcagg ccggcgccca ctcccgcgtc ctcgtcggtg + 6901 actccgacga acgcggcgat 
ctgcagggtc acgaagacca tgccgcagcc gaggccgagc + 6961 aggatgaacg gggccagcag gtcgaccacg tagctgccgt cggcgggggc ccgccacatc + 7021 agcagcagac cggcgacggt gagcgtgaga cccatcatca cgaccggacg ggccgccatc + 7081 ttggtgacca ggccggaggc gatgcccgcg ccggccgcga cggagaacgc gagcggcacg + 7141 taggcgaagc ccgccttgag cggcgagtag ccgaacgcct gctgcatgaa gaggctggcg + 7201 aagaagaaca gcgagccgaa ggtgccgaag accagcacgg cggagatgtt cgcgacccgc + 7261 atggtcttca gccggaagat gcgcagcggc atcatcggcg aggcgacctt ggcctcgatg + 7321 acgacgaagg ccgtcagcag cgcgaccacg ccgaccagcg aaccgatggt gcggaaggtg + 7381 tcccagccga cggtggtggc ctcaccgagc gtgaagatca gcagcagcag gccggcggtg + 7441 agggtgaccg ctccgagggt gtcgaacttg ccccgctcct cggccttgct ctcgggcagg + 7501 atgcgcggtg ccagcacggc ggcgcccaga ccgatcggca cgttgatcca gaagatccac + 7561 tcccagcccc aggtgtcggc gagcacaccg ccgaggatca caccgacgat ggacgcgata + 7621 ccggacagcg agccccacac gcccagcgcc ttgttgcgct cgggtccctc ggcgaaggtg + 7681 ttggtcagga tcgccagggc ggcgggggtg atcagtgccg cgccgaagcc ctggacggcg + 7741 cgcgaggcga tgagcatcgt gccgttctcg gcgagaccgg aggtcagcga cgccagcgcg + 7801 aagatcacga agccgatctg gatcagccgg cggcggccga aggtgtccgc cagccgcccg + 7861 cccagcagca ggaagccgcc caggacggtg gcgtaggccg tgacgatgta gttcaggctg + 7921 acctcggaca tgccgaggcc ctcctggatg gagggcagag cgaggttcac gatcgacacg + 7981 tcggtgaaga ccatgaactg gcccatgcag acgaatgcca ggatcagccc ggggctcagg + 8041 cccgcccctg atgctgaccg ggccgtggtg gcgtcggagg cagccatcga ttactcctca + 8101 gaaggtgcag gatcgggtca tcgaacgcgg cccgcgccgg atggggccgg cgggaaccgc + 8161 tgggacagcc gccgggaggg actcggcggc cggagtgggt ccgtcgcagc tatgacgacc + 8221 ggggaccggc ggatgtgacc ggtcggcccg aatcgtctcc gggaccgccc cgcagtccct + 8281 ggatgccggc ctcgtactgg ctgatcagcc ggggtccggc ggcacgcagc tgcggcggga + 8341 agttctccgt cagcaggtcc cggccgcgcg cgggctcggg gtcgtcgagc aacccgaaca + 8401 tgaagtgcag accgaaacgc ggggagccct ggacgaacgc ctcgcgcagc cggtcgatgt + 8461 cgtccgcggg gaccccgggg aacaggtctt ccaccacggc ctcctcggcc gtgaggtgtc + 8521 cgtcgagcac ctggtggacc tgccgggcgg cctcggcgcc 
cgcccgggcg ccgtccgtcc + 8581 cgccggtggc ccgtgcggcc tgcgtcgcct cgtcgagggc gtcgatcgcc gtctccaggg + 8641 cgttcagcct ccggtcgagg accacgtggt cgtccgacag ttccttgagc tgtgcccgcg + 8701 cgtcggggta gagcgcctcc agcacgggcc agaagaggtc gtcctccgcc ttgtggtggg + 8761 cgtgggtgaa cgcgagcagc caccggcccg cgtcgaccag cgtcgcggtg tctgtgtcgt + 8821 ggccgtcggc cagccgctcg taggcgtcca ccaccaggcg cgtgccgcgc cgcagcaccg + 8881 cgtggatcgc gacgaactcc tcgtacatgc gggcgcccgg gctctgggcc ggatcgctca + 8941 tggacactcc cgtttcgcag tggcagggcc gtggccggac acgggtgccg gtgcggtccc + 9001 gtgggccgcg gccagtacac acgggcccgc acgaagcagc ctcgaggaat gctggaggcc + 9061 cgctcccgcc aggccgggca cgctcgagga atgcttgacg ggaagggccc gcccggcgct + 9121 tgccgtcagt ggccgcccgg cgcacgggaa acggccggcc gtgcggtgtc ctggcccgcc + 9181 ctgcgcagcg cgacctcccg cacgagcagt cccgcgccca gcaccgcggc gccgacaccc + 9241 gcgcagagca ggaacgcgac gtgggtgccc gcggcggtcg cgtgccggta ggcctcgtgc + 9301 agggcgggct ccaggcgctc aaggctctgc gcgtccagcc gggcgttgtc cagcgcgggg + 9361 acgccgggtg cccgctcggc cgtcacccgc agcacctcgc ggttgaacag ggtgcccatc + 9421 acggcgaccc cgaagcagct gcccagggtg cggaagaggg tgacggccgc ggaggcggca + 9481 ccgatgtcgc gcagttccac gctgttctgg gcgaccaccg tcacggtctg cgtcaggcag + 9541 cccagccccg cgcccagcac cgccatggac agggccgccg tgggccgcga ggtggaggtg + 9601 tccatccgcg acagcagcca ggccccggcg cacagcaggg caccgccggt caccgggaac + 9661 accttgtagc ggccgctgac cgtggtgacc ctgcccgcca ccagcgacgc cgcgatcagc + 9721 gcggccagca tcggcagcag cagcaggccg gagttggtcg ccgaggcgcc ctggacggcc + 9781 tgctggtaca gaggcaggaa gagcagcacc ccgaacatca cgaagccggt gaggaaaccg + 9841 atcaccgaca tcagcgtgaa gttgcgtacc tggaacatgt ggagcggcat gatcgggtcg + 9901 gcggtgcgcg cctgccgccg gacgaaggcc cacagggcgg caccggccgc cgcggcgagg + 9961 agcacgacgg cggcggagtc ccaggcgtag cgggtgccgc cccaggtggt gagcaggacg + 10021 gtggcggaga tcccgaccgt cagcagcgcc gcgcccaggg tgtcgacgcg ggccacccgg + 10081 ctccgtcggg gcagccgcag cagccgccag atcatcgcca gggcgagcgc gccgagcggc + 10141 aggttgaggt agaaggccca gcgccagccg aggtggtcgg tgaccgcgcc gccggccatg + 
10201 gggccgccga tcatggcgac cgccatcgcg ccggagatca ggccctggta ccggccgcgt + 10261 tcgcggggcg gcaccagctc ccccacgatc gccatgacgc cggccatcag accgccggcg + 10321 cccagtccct gcacggcccg gaacccgatc agctggccca tgtcctgggc cgctccgctc + 10381 agtgccgagc cggccaggaa gaccacgatc gcggcgagca ggacgttctt gcggtcccgt + 10441 acgtccccga gccggcccca cacgggcgtg gagacggccg tggccagggt gtaggcggtg + 10501 acgacccacg acacgtgctc caggccgccg agttccgcgg tgacggtggg cagggccgtg + 10561 cccacgatca tggtgtcgag ctgggacagc atcatcgccg ccaccagcgg gatcaacagc + 10621 acccgtacgg acgtgccggc gggccggccc tgggcggcgg acgccgggtc ctcgacggtc + 10681 gtcatcacgg ctcccggctc gtacgcccgt ggagcgccgg gactatccgg cgcccagttt + 10741 gaatccgacg ccccgcacgg tcacgatcca cccgctgccg cccagtttgc cgcgcaggct + 10801 gctgacgtgg gtgtcgaccg tgcgctggga ccaggagtcc ccccagacct gcttgagcag + 10861 gtgcttgcgc gggatgacgg tgtcggggtg cgaggcgagc aggcacagca gatcgaactc + 10921 cttgcgggtc agcgcgacac cgctgccgtc cacggtgacc tcgcgggagt cgacgtcgat + 10981 gtgcagccgt ccgcggcgga tgtagcggcg ggcggccggc tgccagtggg tgcggcgcat + 11041 gacggcctcg atgcgggcca tcagttcgcg cagcccgtag ggcttggtca cgtagtcgtc + 11101 ggcgcccgcc tggaggccca ggacgcagtc cagttcggac tggcgggcgg tgacgatgac + 11161 gacgggcacc cggctgaccg cgcggatggc ccggcacacc tccagcccgt ccaggtccgg + 11221 cagttccagg gcgagcagca ccagatcggc gtccgcgtgc gcctggaggg cctgtccccc + 11281 gcactgcacg gcgacgggct cgtggccgta tcggcgcagc tgggtgacga gggagtcgcc + 11341 ggggccgacg tcggcgtcca cgacgaggat gcgccgtccg ccgggtgccg gcgcggcggg + 11401 cgcgggcgcc gtgccgtcct ggaccagccg gatgagctgg gacgtggatg tgcggagttc + 11461 cggcagcgtc tgtgccgaca tctgactcat gcctccccca gaggtcctgc acggtccgtg + 11521 gggcgtgggg agcgtcggcc ctatcctgcc gggccggctc ccgccgtgcg ccccgcccca + 11581 cggtaggaac cggtggtcga gccccggtac agcgccgggc cggacggcgt cgagccggtc + 11641 cggtcgcggc gcggccttgg cccggttacg ggttgagcac ccacgccgag ttgtgctggg + 11701 tgaatccgat gtgggggtag taggcggtgg ccgcgggcgc cgacagcagc acgatcttgg + 11761 cggtgggcgc ctccttgcgg gtggcgtcga tcagggcccg gccgatgccc gagcgctgga + 
11821 gccggccgtc cacggcgatg tcggacaggt aggtgacgta ggagaagtcg gagacgctgc + 11881 gggcgatgcc gatcagggcg ccgtcgccgt cgcgggcgac cagtaccagg ttggcgccgg + 11941 tcagcatcgc cttcatgcgg tcgcggtcct cgacgggccg ccgctcaccc agtccggacg + 12001 agcggtagac ggcgagcacc tcgtccaggt ccaggtcctt gccctcggca cgctcaatcg + 12061 tccagttcac gaagggtctc caatcgggtg cgaatcacgt cgtggcgggt gaggaagcgc + 12121 tcgggttcga ggctttcgac gtcgatgccc tcgcgggcca ggccggcggc gaagtgttcg + 12181 ccggtggcga gggtgtggtc ggcggcggcc tggacgccac ggtaggcgcg ttcgcgttcc + 12241 acgccgcggg cgaggaggtc ggccaggacc gcggagctgt ggatgaggcc gtcggtggtg + 12301 tcgatgtggg cgcgcatccg ctcggggcgc acggtcaggg agtttatgag gtcggcggcc + 12361 atcactgtct ggaagtgtcc cacggacagg ctgtcgggca ggatgacccg ttccacggac + 12421 tggtgggcga ggtcgcgttc gtgccacagt gccacgttct ccagggcggt gtcggcgtag + 12481 ccccgcagca gccgggccag tccgcacagc cgttcgctgg tggtggggtt gcgcttgtgg + 12541 ggcatggcgc tggagccctg gtaggcgccg gtccggtgtt cctcgacctc gcggacctcg + 12601 gtgcgctgca gcagtcgcag ttccagggcg atctgttcga tgcaggcgcc cagcgcggcg + 12661 accgcctgca tcagctgggc gtgccggtcg cgggcgacga cctggctggg caccggttcg + 12721 acgccgaggc cgagggcgtc gcagacgtgg cgctcgacct cggggtcgat gagcgcgtag + 12781 gtgcccacgg agccggagac ggtgccgacg gcgacggcct cgcgggccgc ggtgagccgg + 12841 gtgatggagc ggtcgacggc gaaggcgtgg acgccgagct tgtgtccgaa ggtggtgggt + 12901 tcggcgtgca cgccgtgggt gcggcccacc atgacggtgt cccagtgttc cagtgccttg + 12961 ccgaccagtg tcgcgcgcag gcggcgggcg gccgccagga gcaggtcggt ggcgcgggcc + 13021 agggtgtggc ccagggcggt gtcgacgagg tcgtagctgg tcatgccgag gtggacccag + 13081 cgtgcggagt cctcggggat gtcctcgcag tacgcggcga ggaaggacag cacctcgtgg + 13141 tcgcgttcct tctcgatctc ggcgacccgg gcggccagcg gcacccgcgc gcgccgcatg + 13201 tcctccaccg cggcggcggg tacccggccg agcccggcct gtgcctcgga ggcgaggatc + 13261 tcgaccttca cccaggtcgc gtagcgggac tggtccgcga acaggtcggc catctcgggc + 13321 agcgtgtagc gaggaatcat cggtcggcct tcgtcgaggg gggtggggtc ggggacggcc + 13381 gtgcgggcac gccggacgcc gccccggtga ggggggtgtt cggggtgccc gcgccgtcag + 
13441 tacacgccga agtactcacg ctgctcccag tcggtgacct gaccgggcgc gggcgcggtc + 13501 tgtgagctcc atgccgtgaa gcggcccagc tcgctctcct tgagcttggt catgcaggcc + 13561 gcgaggggcg cgccgagcag ctggtccgcg cggcccgtgc ggaaggcgtc cagggcctcg + 13621 gcgagggtct gcgggacggt ctgcggctgt gtctcggtgg gcgcctcgcc gcggggtgcg + 13681 gtctgcgggt cggcgggctg ggccgtcagg ccctccaggc cggcgaacag ctgggcggcg + 13741 atgttgaggt aggggttggc gcagggctcg cccacccggt tctcgatgtg ggcgccggct + 13801 ccgctgccga cgacccgcag catcgcggtg cggtcctcga agctccagcc gagccgggtg + 13861 ggggcgagcg cgtgttcggc ggccaggcgg cggtagccgt tgacggtggg cacggacagc + 13921 aggaacagtt cccgtgccca cgtcagcagg ccctccgcgt aggcctttcc gttcggtgac + 13981 agcccgcccg acaggccctc ggcgctgaac aggttgcggc cggtggccag gtccacgacg + 14041 gactggttca ggtgccagcc gctggggtcg gcggcgtcga gccgcggctg ggacatgaag + 14101 gaggcgtggt ggccgcggcg ggcgcagaac cgtttggtga cggtgcggaa cagcagcatc + 14161 gcatcagccg tgtcgagggc cgtcatcggg ctgaaggtgg tctccacctg gccggggccg + 14221 gactcgtgtt ccatcgagcg cagcggcagg ccgagctttc gcaggtggag tccgagcggg + 14281 ccggtgatcg gggcgacggt gtcgtaggcg gcgtcgaggt tgaactggta gccggcgttg + 14341 acggcggtca cgcgcggtgc ctggccctgc agcccgaagc cgttgccctg gttgccgggc + 14401 tcgtcgtcca ggcgccgggt gaggtaccac tcgacttcca ggcccagtac gggctggagg + 14461 ccgagtgcgg cgtagcggtt gacgacgcgg cgcagcacgg cccgggagga cagcgggtgg + 14521 ggggtgccgt cgcgcaggta ctcgtcgccg agcacccagg cggtgcgggg gccgcgttcg + 14581 ggcagcacct ggaaggtgac cgggtcgggc acgaggacga agttgcccgc gccggcgatc + 14641 tcgtcgacgc cgatgccgtg gtcgccgagg aagtcgacgg ccacggcgtg gccggtgtcg + 14701 aacaggaacg ggcccgggct gaagttcatg ccgttgcgca gcaccgagcg gaacgcgtcg + 14761 gcggtgaggg tcttggagcg ggccaggccg tgcgggtcgc cgaagacgag ccggacgaag + 14821 tcgacctcgt ccagggcggc ctcgacgcgt tcggcggcgg cgacgcgttc gtcgtcccac + 14881 agcccgtggt cggtgacgaa ggagggccgg ccgacgctgc cgtccggggc gggtgaggac + 14941 caggaccggg catacatggt ttcagaacgt cctttcgccg gtggtaccgg tggaggcggc + 15001 gaccggaggg gccgcgggcg gctggggcag cggcggcagc atcgcctcca ggcggcgggc + 
15061 caccgtcagt acgaggtcgt cggcgccgac cgggccgacg agctgcactc cggccggcag + 15121 tccggaggag gtcaggccgg cgggcaggga ggcggcgggc tggccggtca tgttgtacgg + 15181 gtacgaggcg ggtgcccagg ccagccacag caggtcgcgc acgtcggcgg cccagtcggg + 15241 gcctatggcg ccggcgtcga agggttcgac gggcacggtg gccatggcga gcaggtcgta + 15301 gtcgtccatg accgagcgca gggtggcgcg caggttctgg cggatctcct ccgcctggat + 15361 caccgcgacg ccgctgaggg tgcgtccgtg ccggacgacg tgcaggcggc cggggtcgat + 15421 gagttcctcg tcctcggggc gggtgccggc cgcctcggtg gcggcgagga tgtcgacgac + 15481 ggccgggtag aggttgtggc agcgcacctg gacctcctcg accaggtggc cctcgtcgag + 15541 gagtacgtcg cgggccgctt cggtgacgcg gcggatctcc gggtcggtgc cttcgtactc + 15601 gatccagccg atgcgcaggg agcgcatgtc gcgcggggag tccagggagc cgagtccgga + 15661 gtcggggtcg gtggggtgcg ggccggcgat gacctggccg agcagggcgg cgtcggcgac + 15721 ggttgcggcg atggggccct ggtgggcgag gcggtcggcg ccgttggggt agtagggcac + 15781 ccggccgaag gagggcttgt agccgacgac gccgcagaac gcggcgggga tgcggatcga + 15841 tccggagccg tcggtgccca gcgccccctc gcacagtccg gccgcgacgc tcgccgcggc + 15901 accgccgctg gagccgccgg cggagcggct cgggtcgtag gggttgcggg tgggcggggc + 15961 gagccggccc acggtggagg cgctccagcc gaactcggag gtggtggtct tgccgacgac + 16021 gatcgcgccg gccgctcgca gccgggccac ggccggggcg tcctgtgcgg gccgcccgtt + 16081 gggcagcagg gagcccctgg tggtgggcag gtcccgggtc tgcagcaggt ccttgacgga + 16141 gaccgtcacg cccagcagcg ggaggtccca ccatgcctcg cggccgcggt cgcggatcag + 16201 ttcgtccgcg cgggcggccg cccggatcgc ctcgtccccc gcgaccgcga cgtaggcgcc + 16261 caggtggtcc cgttcccgga cggcggccag cacgtcctgg acgtgctcga cgacggtgag + 16321 ctcccggcgg gacagcagtt ccttggtccg gcggatgccg cgggcggtca tcgctcactc + 16381 cttccgctcc tggtccttcc tcacgggggg tcaggagcgc tgctgacggt gcgggacggg + 16441 atggtgcgcc cggcgggacg ggggatgacc cgccgggcgg ccgtgggggg tcaggacgcg + 16501 cgggtggcgg ggtcggcgcc gccggtgacg gccgaccagt gccacgggga gtcgaacgcg + 16561 gtgacctcga tctgttcgcc cgccgcggcc agttcggcga ccaggcccgt ggcccgcgcg + 16621 gtgaacgcgg acacgcggtg cgcggcgagc aggtcctgct cgccgaacgg ggcgccgtcg + 
16681 cagcgcagca gccgcaggtc gacgaaaccg ttgaagcgcc gtccgtcgac cacgacggac + 16741 tgcggcgaac ggatggagaa ccgcacgttg ttgttgacgt gcccgtggtg gtgctggtcg + 16801 gagtagaagg cgacgtccgg gatggtgggc gggacgaagt ggtcgcggtc gaccacctcg + 16861 ggggccttgg gcaggttgcc ggcgatgaag tgccaggagt tgtactgcat gcgcgaggac + 16921 atcgcccagg ccgcgtcggc gagggcggcg gtggagtcgc cgaagtgccg ggcggcagag + 16981 gggtcgggca ccacgcagca gaagaagcgg gtgatctccc agtcgcagat ctccgcccag + 17041 cgttcctcgc gcagcgccgt gatcaggtcg ggcagcgagc gcatgccgcg gctcatcgcg + 17101 aagtcggcct cgaacgcctc ggtggcggcg gcggccgact cgtacaccag ggcctcgagc + 17161 ccggtggcga agtcgccgtg cggagcggcg agccaccccg gggccgcggc gagggcctcc + 17221 cccagctccg cgaggttgtc gccgcgcagc ggcagccggg acgtcagccg tgccgtcacc + 17281 gcgtcctcac gggcgcgggc caggtccgcg cagggaccgg cgaccttctc gatcttgtgc + 17341 atgagagcgc cgtggatctc gcggtacagc tgggcctcgc gggcgacctc gccgcggtgg + 17401 gagcgcagtg agacggccag ttcgtgcagg tcggcgaccg tcgcggacgc ggcgggcggc + 17461 acctggtcac ggcccagggc ggcgttgtag ccgactcgga tgcgctccag catgtgggcg + 17521 acgtggtcga cggtgagctg ggtgccgttg gcctcctcga cccggccggg gccggccgag + 17581 cggatcagca gggtgaggca caccaccagc tgcacgtcgt ggtcggacca cagttccagc + 17641 ggcaggtcct gaagactgct gagggcgcag tcgggatgcc cgggccacag cgtctttccg + 17701 gtgagggtgt tgtggtcgcg gaagttcgtg tactgcctgc cctgctggta gagcacgaag + 17761 ggcgcggtgc gcagcgccgc ctccttggcc tgctccagca gttcaccacg cccttcggcc + 17821 ccctgctcgg cgagccagcc gcggcagtcg gcgacggtcc gggcgacccg gtcctcggca + 17881 cgacgcagct gcgcccggta ggcgtcgagg gtggcccggg tccacggcac ccgccgcaca + 17941 ccgccgacca gtccgtcggc cttcagcggg gccgcggagg ggacgcgcag gacgatgcgg + 18001 ccgctggtgg cgagcgcgat ctcgccggag aagacggtct cctcggcgtc accggacgtg + 18061 ccgtcgccgg gagcagcggt cgcgggagcg gcgtcgccgc gagcggcggg ggcggcggtg + 18121 gcggtagcgc gccagctcag accgcacagg gccgccaggg cggcctcctc ggcggcgctg + 18181 agcgcgcgca gctgcacatc ggcggggacg tggccgtcca gggtgagcag cacctcgacg + 18241 aacgacctga ggtcctcggt ctgttcggcg cgccgccaga cccgcttgag cagtcccggg + 
18301 aatccggcgt cggcttcacg cacccggtcc ggcttgagcg tggcgccggc gaccaggccg + 18361 aggcgactgg ggcggcggct gatccgcttc cgggcgttgg cggcgcggcg ggattccccg + 18421 cgttcgggca aggcactcat cacgcaccct ttgcggtgag ctcgatgtgg ttccacatgg + 18481 cgtcgtcggt gggcgtccag tcctcgtcga cgtagatgca gtcgacgggg cactccagga + 18541 cgcacgccgg gcagcccgag cacagctcgg ggatgatcac tacgtccaga ccccggtcga + 18601 agatggcgcc gaactccgcg gggcagctgc gcaggcacgt gtcgcacgtg atgcactcgg + 18661 acttctcgat acgccgcggc ggcttcttcc agttgtcggg gcggtcacgc tgggcaattc + 18721 gctcgacccg cccagacagc gcggccgacg aagcgatctt cttcatgagc tcggaacccc + 18781 ttcgggtgag tcttcctggc cacaaccggg atgcatccga tggtccttcg gccttctcga + 18841 ccggccccgg agccgtgatg ggaatcgggt cgagcccgcg ctcccgatgg cttgtttcag + 18901 accgtcgtcc cggtgcgcgg ccgtggttcc tcgcgggcgg cggcggactc cagtccggcc + 18961 agtcggagca ggagttgttt cacgtcggtg gccgcgacgc ggtcgccgac agcgcggggg + 19021 atggagcaga tgaggagcgg accgtcgtcg tcgctcgcgg ggaggcggcc gtggctgcca + 19081 cgaacaggtg aggcgtccag ggggacgacc gccatgcggt agcgcatgcc gagcttcttg + 19141 cgggccaggg cggtggccgc cttgaccttc acgtaggggt cgagggggtc catgaacaac + 19201 tcgaccgggt cgtagccggg tttgcggtgg atctcgacca gctgcgcgaa gtcgggcgcg + 19261 cgggcgtcgt cgagccagta gtagtacgtg aaccaggcgt ccggttccgc gacggcgacg + 19321 agttcaccgg cgcggggatg gtcgaggtgg tgggccttct tgccctcgtc gtccaggagc + 19381 gtctcgattc cgggcagacc gtccagggcg gcgcgggtgg cgtccaggtc ctcggggcgg + 19441 cggacgtaga cgtgggcgat ctggtgatcg gcgaccgcga aggcgcggga ggccatgggg + 19501 tcgaggtatt ccatgccgtc ctgggtgtgg acctcgagca gaccggcgcg gcgcagggcg + 19561 cggttgatgt cgacgggccg gctgacgggg gtgatgccgt actcggagag ggcgacgacg + 19621 gtgcgtccct cggcgcgggc gtcgtccagg agcggggcca gggccgtgtc caggtcggtg + 19681 gccgccttgt gggagcgggg gtcgtcgggg ccgtagcgct ggaggtcgta gtcgaggtga + 19741 gggaggtagc acagggtgag gtcggggtga cgcgtatgca tgatgtggcg ggtggcgtcg + 19801 atgatccact ggctggagac caggtccgcg cccggtcccc agaagtggaa gagggggaag + 19861 gtgccgagtc tgtcggtgag ttcgtcgtgc agggcggcgg ggcgggtgta gcagtcgggt + 
19921 tccttgcggc cgtcggcgta gtagacgggg cggggggtga cggtgatgtc ggtgtcggcg + 19981 cccatggcgt accaccagca gatgttggcg acgctgtagc cggggtgggc gcggcgggcg + 20041 gcgtcccaga gtttgtcgcc ggtgaccagg ccgttgtgct ggcgccacag caggacgtcg + 20101 ccgagttcgc ggaagtacca gccgttgccg acgatgccgt gctcggacgg gtaggtcccg + 20161 gtgaggaagg tggactgggc ggcgcaggtg acggcgggca ggacggtgcc cagcggggcg + 20221 cgggagccgg actggccgag ccgtttgagg tggggcatgt ggtccaggag ccggggggtg + 20281 aggccgacga cgtccaggac cagcagcggc accggccccc cggaagatgt ggtgggggtc + 20341 atggcagctc cttcaggccg aggtcggtca gcaggtcacg ggcgagcatc agctccgcgg + 20401 cgatcccgtc ggtgagctgg gcccggcccc ggggccgcaa ctgggccggc aacgcctgcc + 20461 aggtgtaggt ctccacctcc agatgccggg tcaacggacg cgccccgccc accagccggg + 20521 acaaggccga cttcagcacc ggcagagtcg aggtgagcgg cgcggccgga tccgcgtgca + 20581 gggggacgtg gaagtgcgcc cgccagggcg ccgtgtcggg cagcggaccg ccgccggcca + 20641 gggcctcgtc caggtcatcc gtgccacgca gcccggccgt ggcggcggtg gtgcgggtct + 20701 ggtgcaggaa acgcggctcg gcgaaggccg ccagggcatc gcgtacttcg gggcgagaag + 20761 ggtgttcggc gtgcagggcg gcggagagct gcgacttgac gacggggacg cgggccgcgg + 20821 tcagggcgtc cagggcggtg tgcgggtcct cgaaggaggt ggcgaggtga caggtgtcga + 20881 cacagatacc gatgcggtcg tgtccgatgg cgcccagcgg ggcgatcgca tcatgtgtgg + 20941 tctccacgac gcagccgggt tcgggttcca ggccgatgcg gatggagcgg ccggtcagct + 21001 cgtggagggc gtccagacgc tcgccgagcg tggccagcgc cgcgcgcgcc ttgtcggcgc + 21061 gggtctcgtc ccaggcggtg cgccaggcca gcggcagggt ggagatgctg ccgtccgtga + 21121 cgtcgtcggg caagagtccg gcgaggacac gggccaggga cgtggtgtgc tccagacgct + 21181 ccgggtcggc ccagtccggc ttgtagacgc ggtacttgac ctcttcggcg ccgaagccct + 21241 cgtaagggaa gccgttgagg gtgacgacct ccagtccccg ccggtcgagt tcggtgcgca + 21301 gtccgcgcag cgcggagggg tcggtggcca gggcgtgggc ggcgtccttg gccagccaca + 21361 gcccgatgcc gagacggtcg cggcccaggc ggcggcggac cggctcgcag tggtcgcgga + 21421 gctgggcgag gaccccgtcg agggtttcgg cgggatggac gttggtgcag taggcgaggt + 21481 ggacggtgga gccgtccggg tgccggaacc gcaccgttca cgctcccgtc ggcagcggct + 
21541 cggcggccgg ggcgccgcgc aggacggagt tgccctcgtg ggtgggcgcg gtggccgtga + 21601 cgtcgaggtc gaggcgtccg ctgaggccgt agaaggcgac ggggttgcgc cacagcaccc + 21661 ggtccacgtc gtcctcgccg aaaccctcct cgagcatcag gtcaccgacc ttgcgggtct + 21721 tgagcgggtc gctcctgccc cagtccgcgg ccgagttcac cagcaccttc tccgggccgt + 21781 actcacgcag cagagcgacc atgcgggcct cgtccatctt ggtgtccgga tagacggaga + 21841 accccagcca ggcaccgctg tccttggcct ccttgaccgt ggtctcgttg aggtggtcga + 21901 ccagcacccg gtccgtgggc agcgcggact cgcgcaccac gtccagggtg cggcgcagcc + 21961 cggcgagctt gtcccggtgc ggggtgtgca ccagcgccgg caggccgtgg tcggcggcga + 22021 gctgcaactg ggcggccagc gcggtgtcct cggccggggt catcgagtcg tagccgatct + 22081 cccccaccgc caccacccgg tccttgacca gatagcgcgg cagctcggcc agcaccggag + 22141 tgcagcgcgg atcgttcgcc tccttcgggt tcaacgcgat cgtgcagtga tgggcgatcc + 22201 cgtactgcgc cgcacggaac ggctcccagc ccagcaacgc gtcgaagtag tcacagaagg + 22261 aggccggaga agtgcggggc tgccccagcc agaaggcggg ctcgaccacg gcacggacac + 22321 ccgcggcatg catggcctcg tagtcgtcgg tggtccggga cgtcatgtgg atgtgggggt + 22381 cgaagatgcg caagtcactg ctcctgggtc agggcgagca cgcggtcgag gtcggccggg + 22441 atgtctcggt gggcggcggt gcgctcggcg gcgtaggcgc gcagcattct ggccagttcc + 22501 gcgtccgcgc gggcgcgggc cgccaggttt gccacggtgg ccacgggcac gccggtgaac + 22561 aggcacttga gtacggcgtg ccgccattgg tgggcgtcca ggtgccgggc cgcgtagggg + 22621 ccgagggcgg cggcgagcag ggtggtgtcg ttggcgcgca gggcgtcttc gaccagcggc + 22681 agagcgtggg cgggttcggt gtcgagtccg tccagggcga gcaggaccgc acgccgttcg + 22741 gcggccgtcc cccggtggta cagcagggtc acggtctccg cgtcggggcg tgccgccgcc + 22801 agcagcagta cgcgggcggc gtcggcgtgt tcggtgccgc agcggcggcc cgcctcggcg + 22861 aagcgcagtt cccagtcggt gtcccgggcg gttgccgagg cgcgggcggc ggtgagccag + 22921 cggcgtgcgt cggtgccgag gccggcgaac tcgccgggca ggtccgcgtc cggcggggtg + 22981 tgtacgacgg tcatctcgtc cctccgttgc gcaggaaccg catcgactgt gcggccagtt + 23041 cgggtccggc gtgggagtgc cggggcagtt cgacgacggt caggccctgg tagccggtgg + 23101 cggcgagggc gtcgagcacc ggcgggaagt cgatctcgcc gtccccgaag gggaggtgtt + 
23161 cgtggacgcc gcggcgcatg tcctcgatct gcacgtgccg cagccagggc gcggcggccc + 23221 gtacgcagtc ggcgggcggc aggggctcca gacactggca gtgcccgatg tcgagggtca + 23281 gtcccagtgg ttcggggtcg cccagttcgg tgcgcaggcg gtggaagtcg gtcagtgtgg + 23341 ccagcaggtg gccgggctcg ggttcgaccg ccagggggac gccggtgtcc tccgcggcgt + 23401 ccaggacggg gccgagggcg tcggccaggc gtttccaggc ggtgtcctgg tccaggcccg + 23461 cgggccgtgg gccgctgaag cagtgcacgg cgtgcgcgcc gaggtcggcg gcgacgcgta + 23521 ccgagcggat cagcaggcgt acgcgtgccc agcgggcgtc cgggtcgtcg tcgagcaggc + 23581 tgggtccgtg cttgcggcgt gggtcgagga cgtagcgggc gccggtctcg acggtgaccg + 23641 cgaggccgag gcggtgcagt tgccgggcga cgtggcgggt gcgggccgcg aggtcggggg + 23701 cgagcgggtc gaggtgcatg tggtcgaggg tgagtccgac gccgtcgtag ccgaggtcgg + 23761 ccagcaggcg cagggcgtcc tccaggcgca ggtcggtcag cccgttggtg ccgtagccga + 23821 ggcgcagcgg gctcatgtgg tgctcacttt ccgggccagg tgcgcggcga ggggggccag + 23881 ggcggcggtg aggacgccgg tgccgggtgc gccggcccgg gccatcagtc cgctctgcag + 23941 ggcgatcgtg gcgcggacgc cggcgccgac ggcccgctgt gtcagttccg gggaggggtt + 24001 gagcgcggcg tgggccaggg ggcgggcgaa ggtggcggcg taggaagcgg ccagggcggc + 24061 gcgtacggcg cgggcggcct tgtcggccgg tggtgtcgcg ggagtaggtg cgccggtgct + 24121 ggcgtcgggc gcggggtggg cggtggggcg gccggcgagg acggtggtga gggcgcccgc + 24181 ggcggcgagg gccgtgaggg gtgcggtgct ggagccgccc tcggtctcgc ggcgggagac + 24241 gagggagacg gccagggtgt ggctgccgag gaacgccgcc gggacgatcg cccgtcgcac + 24301 ggcgcccggg ccggcggccg cgcccagcag caggtccagg gagcgggcgg cggccatcgc + 24361 cgcgggtccc gccggggtgt gtttcaggcc caggtcgtac gcccatacgg tggcggccag + 24421 ggggccggcg accgcgaggg cccgtcgtcc cgcgcatgcg gcgagggcca ggcccgcggc + 24481 ggagagcagg cccgcggcgg cgagggcggc gccgggccgg acgcggccgg acggcagggg + 24541 gcggtggggc cgggcggtgg cgtcctcctc gcggtccgcc cagtcgttga gtgccatgcc + 24601 cgcctcgtac aggcacagcg aggcgccggc cgcgagggcg gtgcgtccgg tgggccgtgt + 24661 gccggcggcc gcggtgccgg cgaggacgtc accggggacg gtgaacgcgg cgggggcgcg + 24721 cagcagttcg gcccaggcgt ggaggtgccc gtcgcgggcc gggccgtggg cgggccgctg + 
24781 agcgctcacc tggttcctcc gagccggccg gcgagggtga gcagtcgggt gtactgctcg + 24841 gccagggcgg agccttcggc gtcggggtcc ttgaagtaga agccgagttc gcccagcggg + 24901 ccggacaggc cccgctcgtg ggcgcgggcg agcaggcggg ccaggtcgag gacgagcggt + 24961 gcggcgaggg cggagtcgca gccctgccag atggtctgca ggaccatgcg ggtgccgagg + 25021 aagccgtcga aggcgacgtg gtcccaggcg gtcttccagt ccccgagggc ggggacgtcg + 25081 tcgatgtgca cctcgccttc gacccgggtg ccgagggtgt cggtgaggac gcgttccttg + 25141 ccggcgttct tcgccgcggc ggcggcgggg tcggcgaggg cggcgccgtc gccgccgccc + 25201 agcaggttcg tgccggacca ggcccgtacc gccagtgccc gctgggcgaa catcggcccc + 25261 agcaccgaac gcagcagggt ctgcccggtc ttgccgtcgc ggcccgcgta cggcaggccc + 25321 gaggcgcggg ccgcgcccgc cagctggggg tggctcagcc cggtcgacgg cgtgaagttg + 25381 acgtaggggc agcccgcccg cagggccgcc gcggcgtaca gggagctggc cggccacgcg + 25441 ccgtgtgcgg ggtccggttc ggtggaggcg acgttgacga cgaccgtgcg ggcgacgccg + 25501 gtggtgcggg cgaaggtgcg caggtcggtg gcgaagtcgg ctatcagctc ttcggtggcg + 25561 cgacggtcgc cgggtaccgg tcctccgggg cggatgtgtt cgtccgcggc ggccagttcc + 25621 ccctggacgg cggtcggcag ccagggcggc agtactcctt gggcggccag ttcctcggcg + 25681 cgtttgggca ggggggtggt cgccgtgtcg tggccgccga agacgaggga ggccagggcc + 25741 ggcaggccgc agtcggcgaa ggggggcgtc tcggtgacca tgccggtggg tggcagcagt + 25801 cctgccgcca gcgccgcgca gcccgacacc gccgtcgtgg cgaccgaacc gcgggctccg + 25861 acgagccaca cgccggtccg ggtctcgtcg gccgaggtca tggcatcttg cgtcacgggg + 25921 cagcctccct gagcgtcgaa tgtgttgtcc ggcaagtgga tgcccggcca ggatgccgag + 25981 ccgggctgtg cgggggcgtc gccctccgtc ggctgtcgag cggccgccga gcggattccc + 26041 atcggccgcg ggcgtccggc gccgggcaca gcgaggcccc gccggtcgca ggggtgcggg + 26101 accggcgggg cctggcaggg gggtgtgcgc ggcgcacccc tctgcggggg gtcagcggtt + 26161 gacgcggacc agctggccgt tggtgccgag cgtgttgttg gtgacgtaca ccttgccgca + 26221 ggggtcgacg gcgacgccgg tgggctgctt gagctggtcg ccggtgggga tttcggtgac + 26281 cgcgccgctg tcggcgtcga tctcgaacag ggcgccgggc tgcggcgggc cggccagcgc + 26341 ggcggcgctg taggacaggg cgatcaggtc gccgtcccgg tccaggtcca ggtcgatgag + 
26401 gttggtcatc ccggtggcga ggatctcggg ctgctggccc ggggcgatct tccagacgcg + 26461 ggaggcgccg acccggccgc cgctcatgtc ggcgacgtac acggtgccgt cggcggcctt + 26521 ggcgatgccg gtgggtacgg tctcggcggc gccggtgggc agttcgttct tgggcaggag + 26581 gtactcggtg gcggtggtgc cgtcggcgtt gccgcgtacg acggtgttgg cgcccgcgtc + 26641 ggtggccagg tagccgctgc cgctgcgcgt gagccgccac gggttggcgt gcacgtcgcc + 26701 gccgtcgggg ttcagtcgcg tctcgtggtc ggtgaggtcg gcgagcacct tgtggtcgcg + 26761 ggtgcggaag actgtgccca gggtctgggc gccctcgccc agcgcggcgc gcgactcggt + 26821 ggtgccgccg aggccgctga cgacgacgta gccgccgaac cggtcgggca cgacgtcgct + 26881 ggggccgttg gcggagatcg gggcgcccgg ggcgacgccc ttggccgtgg aggcgaggcc + 26941 ggtggcgacg cggccctgga agctgccctt gaccttgtag acggagccgg tggtgcccac + 27001 gcacgtctgg tcgaccgggc agtcggcgag tccggcgccg gcctcggcga ccagcacgcc + 27061 gccgtcgccc agcgcggtga cgccgcgcgg gttgttcagc tgggaggcca cgacggtcac + 27121 ggtcgcctcg gtacgggtgt gggtgtgggt gtgaccgtgg cggtgggcct ggggctgggc + 27181 ctggacgggg ccggcggtca gcgggacggc gacggcgccg gccgcgcccg ccgccagaag + 27241 tatcttcgtc caggagttac gcgagttcgc catttctctc ctcggtttcc aatgctcccc + 27301 ccttttcccg gagagcggat gcgaaatcag cgccacccta gggcagtcgc cggttttatt + 27361 gcgtcaaatt ttccgcagga aaaagtgggt gcacccgtga accagcggta ttcgagtctc + 27421 cctccaggag gcgtcgacct ttttccatat cgttgtagtc ccggtccctt ccggcggttg + 27481 ggacagactt ttgcgctcct gccatggagg aaactcatgc ccgaattgcc gcctccgcac + 27541 gtcgtacggg aagcggagaa agcacgagcg gatctgcagc ggcagagccg ggaactcgcg + 27601 cctccgccgt tcgctctgct ggaattgatc atgggtgtca tggtcacgcg tgcggtgcac + 27661 gtcgccgccg aactgaaggt ggccgaggcg ctcgccgagg gtccgctgtc cgccgacgag + 27721 ctcgccgggc gggtcggtgc ggacgcggac gcgctcggcc gggtgctgcg cctgctggcg + 27781 agcaacggtg tgttcgccac gcgcccggac ggtgccttcg agctgacgcc gatggcggac + 27841 gcgctgcgcg ccgaccatcc gatgtcgatg cggggcatcg cgctgctgat gggccacccg + 27901 atccactggg aggactggag cggcttcccg gagacggtgg tcaccggcga gccggcgctg + 27961 ccgaagctgc gcggcatgca cgccttcgag ttcctgacga agaacgcgga gtacggccag + 
28021 gtgttcttcc agggcatggg cagcatgtcc gcctcggaga cggagccgat cctggcggcg + 28081 tacgacttct cgcagttcgg gacggtggtg gacttctgcg gcggccaggg cgcgttgctc + 28141 gcgggcatcc tgggtgcggc gcccgggtgc gagggcgttc tgttcgaccc gcgggtcgag + 28201 gagaacgggg ctgcggagtt cctggccgcg cagggtgtgg ccgaccggac gaagcgggtg + 28261 gccggcgacc tgttcgacgt gccgccgggc ggcgccgacg cctacgtcct caagcacatc + 28321 gtgcacgact ggcccgagga gcaggccctg cggatcctgc gcaacgtgcg ggcggcgatc + 28381 aagccgggcg gcaagctgct gatcgccgag atggtgatac cggagcaggg tgaccagccg + 28441 cactccggga agctggtcga cctgtggctg atgctcctgg tcggtggccg tgagcgtact + 28501 cccggccagt acgccgatct cctggcccgt gccgggttcc gtctggagcg ggtcgtggag + 28561 acggcggcgg cgatctccct cgtggaggcc gtccccgtgt gaccaccgtg gagggagggc + 28621 cccgtcgcgt gatgagggaa cgcggcgggg ccctccggtg tgtgcggccg ggcagcggcg + 28681 gccgggtggg cgggggcgcc ggcgggcagg cccgcgggga gcgccgggcg gcggggggtg + 28741 ccgggcggcg gacgaaggcc cccggcgtgc gcgcacgccg ggggccgcta gagggggtgc + 28801 gggtcagcgg ggcgggccga accaccgttc cagggccgtt tccaggccct gcgcgcaggt + 28861 gcccgtccag gcgacgtagc cgtcggggcg gatcagcacg gcggtggcgc cggcgagggc + 28921 gtccgggccg tcggtgggct tggcgacggc ggtgaccacg tccacccggt ccgcgtggcc + 28981 ggccgcggtc gcgcgtaccg tctcgtcgtc ggcgaggtcg agcagcacgc cgtgcccggc + 29041 gtgcaggagg cgggcgatgc gggtttcgcc gtccgcgccg acgagcagcc gcggcggcat + 29101 ccggcgtccc agcagcgggt gggtggggcc ggtcgcggtg tcggcgaggt cgtagcggat + 29161 gtccaggtgg ctgacgatgc cggccaggtg gcgtttgacg tcgtcgtagc ggaccagttc + 29221 ggccatcagc tcgcgcagcg ggtcggactc ggcgccgccg aggaagacga tgccctgggc + 29281 gcgggtgttc atcagcagcc gggcgccgac cgggtggcgt tcggcgtggt aggtgtccag + 29341 cagttcccgg ggggcgtcgc cgcggatcac cgaggccagc ttccagccga ggttggcggc + 29401 gtcctgcacg ccggtgctca ggccctggcc gccggccggc aggtggatgt gggcggcgtc + 29461 gcccgccagg aagacgcggc cccgccggta ctcggaggcc tgccgggtgg cgttggtgaa + 29521 ggagctgacc cagctcgcgc cgccgtggct gatgtcctcg ccggtgatgt cctgccaggc + 29581 ggcggcgacc tcctcgaagg tgacggtccg ctcacggtcg tgcgcggggc ggccgtcggg + 
29641 gcagacgatg atgcgccaca cgccctggga gagcggtgcc gccatcacca tgccgttgtt + 29701 caggcgctct ccgaggaagc gcggggtcag ctccacaccg gtgatgtccg ccaggtacat + 29761 gccctgggtg gcgtcggttc cgaggaagtc gaacccggcc gccctgcgga cccggctgga + 29821 gccgccgtcg cagcccgcca ggtaggaggc gcgcagggtg cgttcctcgc cctgcggggt + 29881 gcgtacggtg atctcgacgc cgtcgccgtc caggaagccg tcggtgaggg agacgaactc + 29941 ccagccgcgg cggatgtccg cgccgagttc gcccgcccag ccctccagga ccgcctcggt + 30001 gtcgccctgg gggatgcccc gggccccgaa gtgggcgtcc tcgaggacgg tgaagtcgaa + 30061 ctgggcgccg ccgaagtgcc ctacggggct ggtggccagg gtctctccct ggccgaaccg + 30121 gggcagcagc ccgcgttcgt cgaacgtctc catggcgcgg gcggtgaagc ccaggccgcg + 30181 ggactgcccg gtgggggcgg ccagcttctc gatgacgacg acacgggccc cgcccaggcg + 30241 cagttcgccc gcgagcatca gtccggtcgg gccggcaccg acgacgatca cgtcggtgtc + 30301 cgccgctgtc ccttccatgg gtggtccttc ctggcagtgg ggtcggttcg gggcccggcg + 30361 gtggggggcg gcgcgtcgtg cggtgccggt cgtccccgcc gggccggggc gcacggcagg + 30421 tcagcgggga ggtccgaacc agcgggtgag tgcctcggcg aggccgtcgg tgcccgggcc + 30481 ggcccaggcc acgtggccgt cggggcggac caggacacgg tcggtgccct gcagtgaact + 30541 gcccggcgag ggctgggcgt ccagtgcggt gacgcggtcc gcccagccgt cgaggactgc + 30601 cggcggccgg ccgggccgtc cggtcaggtc cagcaggacg ccgccgcccg agcgcaccag + 30661 ctgggtggtg gtgagcaggc gtcggcgtgc ccgcacctcg gtgcacggca gccgggcccc + 30721 gagcagcggg tgggcggggc cgccgacgtc gtagcgcacg tccaggccgc tgatcatgcc + 30781 ggccaggcga cggcgtacgt cctcctgccc gatcaactcc gtcagcaggt cgcgcagcgg + 30841 ctcgacctcc ggtccgccga gcagcagcag cgactgggcg cggatgttgg ccaggacctg + 30901 ccggccgacc tcgtgccgtt cgtcgtggta gctgtcgagg agggtctgcg gtgccttgcc + 30961 gcgtaccacc agggccagtt tccagcccag gttgaaggcg tcctgcatgc cgaggttgag + 31021 ggcctggccg ccgaccggca tctgccggtg ggcggcgtcg cccgcgaaga ggacgcggcc + 31081 gtgccggtag cgagtcagct ggcgggaggc gtcgccgaag gcgttggccc acaggggggt + 31141 gccgccgctg atgtcctcgc cggtgacccg cttccacacc gcggtgatct cctcgaagga + 31201 gacgtcgccg tgcgggcggg cccgcgcggc ggagccgaac tcgtggacca tcacccgggt + 
31261 caccccgtcg gggcggcggg cggcgatcgc caggccgtgc tccaggcgtt cgaagcgccg + 31321 gcccgggatg tcgatgccgg cgacgtcggc gcgcagcagt tcccgcgtcg cgtccctgcc + 31381 ggggaagtcg gcgccgatca ggcggcgtac ggtgctctcc tcgccgtcgc aggcgaccag + 31441 gtagcggcag cgcagccgca gcgtccgtcc gtccgggccg gcggcttcgg cctcgaccag + 31501 gtcgccgctg tcgtcgagcg cggtcagttc gtgcttgcac tgcagttcgg cgcccagtga + 31561 cagcgcccac tcccccagga tcacctcggt cctggtctgc ggcaccttcc actggccggg + 31621 gtgggaggag ggcagtgtca gatccagcgg gatgcccccg aagtggccgc gcggctcgtt + 31681 cggcgggtcg ccgaactcgg gcagcaggct ccggctgtcg aggatctcca tcgtgcgggc + 31741 gtgcagggtg gaggcccggg actcggtgct gggagcgcgt cgcttctcca cgaccaccac + 31801 gccgacgccg ccgtgggcca gttccccggc gagcatcatc ccgacggggc cggctccgac + 31861 gacgacgacg tcggtggtca gggcgtccgc tgccacggtt cagcccttct tctgctcggc + 31921 gtaggccttg gcgtgggcga gggtggcgcg gctgttggtg gacagggccg tgtggacgta + 31981 ggcgcgggcg tcggcgacgg tggcgtcctg gccgaggatg cgggcgatgt tggcggtgtt + 32041 gagggtgacg gtgtgctggg aggaggcggt ggtcgcctcg tcgccctcgg tgaaggtcca + 32101 ttcgccggtg tgcagggtca tcagcgcggg cagggtgacc tgcttgtagg cgatcttgtg + 32161 gtgggggaag acgacccggt aggacttggt ggtgtgcacc gagccgtcct tggcgcgggt + 32221 gtccatctcc agctcctgca ggccgggggt gtcctcgctc aggcgcacca cggcgacgtg + 32281 cgggagccgt tcggcccaca gctgggcctc gttgatgaag tcgaagacgt ccttggcggc + 32341 gccgtcgatg tgcacggtgt cggtgaagga gaacgtcagc tcctcggtgg cggcggcgtg + 32401 cgcggcctcg acgttgacct tcagggcggc cagctcggag gtgctgttct tgtccacggc + 32461 ctgctcgatc cacagcaggt cgtgcgggtc gtcgccgacg gcgctgtagt cgtgcaggag + 32521 ccgtacccgc gaccggtcgt cggcgagcgg ctcgatgatc caggtgccgc ccatgtgctt + 32581 gaccggggcg gcggggatct cctggcggaa ggtgatggtc aggttctcgc ggtcgagcgt + 32641 gcggcgcgag gtccactcct tggcctggcc gttggcggtc gcccagatgt ggatgcgttc + 32701 gtggtcgccg tcggcctcgg tgcggtcgac gtggatggtg ggcgggaaga tgcgcggcca + 32761 gttggtcacg tccgcgagca gctggtagac ggcgtcggcc ggtgcgccga tcgtgatctc + 32821 gtgctcgacc tcacgtgtgg tcatgaggct cactcctcgg gaaggggtcg ggtgccgggt + 
32881 gcgtcagaag ttgccgaggc cgccgcagac gttgagggcc tgcgaggtga tggacgcggc + 32941 ggtgtcggag gccaggtagc cgacgaggcc ggcgacctcc tcgggggtgg agtagcggcc + 33001 gagggggatc ttcgcctgga acttctcgag gatggcgtcc tcggaggtgt cgtaggcggc + 33061 ggcgtatccc tggcgcacgc gctgggccat cggggtctcg acgtagccgg ggcagaccgc + 33121 gttgacggtg atgccggtgg gggccagctc gttgcccagt gccttggtga agccgacgac + 33181 gccgtgcttg gacgccgagt acggggcgcc caggacgacg ccctgcttgc ccgcggtgga + 33241 ggcgacgttg atgatccggc cgcggtcctt ggcgcgcagg ccgccgatgg tcagggcggc + 33301 gcgggtgacg cggaagacgc tgttgaggtt ggtgtcgatc acgtcgtccc acagctcgtc + 33361 cgcgatgtcg gcggtggggc cgccgccgga gcggccggcg ttgttgacga cgacgtcgac + 33421 gctgccgaag cggtcgacgg cggcctggat ccaggcgttg acggactcgg tgtcgcggac + 33481 gtcgacgacc gtgccgtccg cgtcgatgcc ctcgccctgg agttccttga cggtggcggc + 33541 gacgttctcg gcgttgcggg cgccgatgaa gacttggtgg ccctgccggc cgaggagccg + 33601 ggcggaggcc aggccgatgc cgctggtggc gccggtgacg acggcgacgc gctgggtggt + 33661 ggtgtcggtc atggtggggc tccttcaggc ggccttggcg ggcgcgagct gcgcgttgac + 33721 gacctcgatg aagctgcgcg gcgtgttggc ctcgccgacg gcctcctcgt ccagggagat + 33781 gccgtactcg cgctcgatga ggctgccggc ctccagcagg gcgagggact cgtagccgat + 33841 cacctcgaac tcggtgtcga ggatgtcgcc gtccaggtcc acgccctcgg cgacgcccgc + 33901 ggcctcccgc agggtgcgct tgaggtcgtc gagggtgaag gacttgctgg ccatggtggg + 33961 tcctttcgtc agtacgtggt ggcggttgcg gtgcgtcggt cgggtgcggt gcgcgggggt + 34021 cctcaggcgg cgcgcacgac catggcggag ttgaagccgc cggctccccg ggccaggacc + 34081 agggcggtgc gcagctcggc cgggcggggt tcgcccagga ccaggtcgag ggggtagtcg + 34141 gcgcacgggt cgatgtgcac ggtgggcggg atgacgccgt cgcgcagggc gaggaacgcg + 34201 gctgccaggt ccaggggcgc gccgccggag tacaggcgcc cggtcatggt cttgggcacc + 34261 gtcaccggca cgccccggtc gccgaagacc gtgctgacgg cgcgggcctc ggcgaggtcg + 34321 ccggccgggt cgccggcgcc gtcggcgaag accacgtcga tgtcggcggc gttcacgtcg + 34381 gcgtcggcca gtgccgtctc gatggccttg gccaggttgg gttcgcgtcc gctgccgggc + 34441 cgggggtcga tggtggctcc gtagccggcg atctcgccgt aggggcggac gccgcgggcg + 
34501 cgtgcggcat cggcgtcctc ggcgatgagg atcgcgccgc cctctccggg gacgtagccg + 34561 ttcgcgtcgc ggtcgaaggg caggtaggcg tggtcgggtt cgtcgctggt ggtgagtcgg + 34621 ccgcaggcca gctgggccac ccagccccag gggcagatgg aggcgtcgac gccgccggtg + 34681 acgatcagcg gggtgccccg gcggatctgc cggcgggcct gcgcgacggc gtccaggccg + 34741 cccgcgcctt cgctgacgac gacgccggag gggcccttca tgccgttgcg gatggagatc + 34801 tggccgctgt tgacggcgta gaaccaggcg aaggactggt aggcggagac gtactggctg + 34861 ccctggctcc acagggcctg cagttcgccc tggccgaact cgaagccgcc cgcggcggag + 34921 gccgtgatga cgcccatgtc gaactcgggc aggtgcgcgg ggtcggcgcc ggcgtccgcg + 34981 agtgcccagt cggcggccac cagggccagc cgggtgacgc ggtcggtctg cggcagcagc + 35041 cggctgggca gcagttcctc ggcgtcgaag tcctcgatct gcccggccag acgggccggg + 35101 tagccggtgg ggtcgaagcg ggtgatgcgg ccgatgccgt gcttgccgcc cagggtggcc + 35161 gcccagtagt ccttcacccc catgccgttg ggtgagacga cgcccaggcc ggtcaccacc + 35221 acggaggcgg tcatacgagg ctcctttcgg gggtggcgag caccatggcg ctctggaagc + 35281 cgccgaatcc gctgccgacc gtgaggaccg cgtcgatcag ctggtcgcgg gcgaccaggg + 35341 gcacgtagtc gaggtcgcac tcggggtcgg gggtgtgcag gttggcggtg ggcgggacga + 35401 cgtcgtactc catggcgagt gccgaggcgg cgatctcgat ggagccgatc gcgccgagcg + 35461 agtgcccgac catcgacttg atggagctga ccggggtgcg gtaggcgtgg tcgccgaggc + 35521 tgcgcttgaa cgcggccgtc tcgtgccggt cgttctgctt ggtgcccgag ccgtgggcgt + 35581 tgatgtagtc gatggactgc gggttcagcc gggcctcgcc cagggccagg tcgatcgcct + 35641 cggccatctc cacgccgtcg gggcgcaggc ccgtcatgtg gtaggcgttg gagcgggtgg + 35701 cgtagccggc gatctcggcg tagatgtggg cgccgcgctt gcgggcgctg tcgagttcct + 35761 ccaggacgaa gaaggcggtt ccctcgccga ggacgaatcc gttgcgggtc ttgtcgaacg + 35821 gccgggaggc gcactcgggt tcgtcgtggc gcggggtggt cgccttgatc gcgtcgaagc + 35881 aggccatggt gatcggtgag atcggcgcgt cggaggagcc ggcgatcacg acgtcggccg + 35941 atccctcgcg gaccagttcg acggcgtagc cgacggagtc gatgccggag gtgcagccgg + 36001 tggagaccac ggtgctgggg ccttcggccc ccaccgccca ggcgacctcg gcggcgaagg + 36061 agctgggcac catgtagtcg tacaggtgcg ggaccgcgta ggtgtggtcg accgtgtcca + 
36121 gccgtccccc gtcgctgacc acccggtact cctggtccag gcccatcgtg gcgccgacgg + 36181 cgctgccgac ggtgacgccc acgcggtgcg ggtccaggga ggggatgtcg aggccgctgt + 36241 cggcgacggc gccgcgcgag gcgacgacgg cgaactgcgc ggcccggtcc aggcggcgga + 36301 cctcctgcgg ggtcaggccg tgctcgtagg ggtcgaagtc cgcttcggcg gccacccggg + 36361 agcggaaggg ggcggggtcg aagaaggtga tgccccgtgt cgcggtacgg ccgttgctca + 36421 gcaggttcca gaagttctcc ctgccgacac cgccgggggc gatcacctcg atcccggtga + 36481 tcacaacgcg tcgcccgctc aacgggaggc ctcccagctg tagaagcgcg tggccatcgc + 36541 gtcggccggc gagcgccagg tcgtggggtc gtaggcctcg atgaagggct tgaggtcctc + 36601 gctgatccgc acgaagcgcg ggtcggcctt ggcggcctcg atcagttcac cgccgttgtc + 36661 ctcgtcgaag tcctggaggt ggaagtacag gccccggtag gagaagagct ggcggcgccg + 36721 tgtgcccatg cggtgcggca tctcggtggc gtcgaagtcg gcgaacaact gggccacgtc + 36781 gttgctcgag gtggccgcca tccgggcgac gatcagcgtg ctgtgcatag ggattagctc + 36841 ctcggcggtt gcgcggaagg gttctcgaag cgggcggacc ggcccggccc ggcggcccgg + 36901 ggggctgcgg cgccaccgcc ttcgacggtg cggcctggcg gtagcgcccc gcacggggcc + 36961 tgcctgagtc ccgcctgagc cgaagcggcg ggtgcacacg agcacgcctt cgggcctgcg + 37021 cccccgggtg ccggggacga ggtccgaagg cgtgcgggtc ccgtgcgccg tccggcgcgc + 37081 cgggctcact cgccggcaga gcgcgtgtgc acgacccggt aggtgttcag gtagggctcg + 37141 ccggtgacga cggcgcggac gcgggccacg gcggccttgc gggcgtcggc ctgctcctcg + 37201 ggggcctggt cgcggtagac ctcgaaggcc tccttgctgt cccactggga gtaggagatg + 37261 acgaaggatc cctccaggcc gcgggcgcgc aggcccttga gcacgacgtg ggcgcggaag + 37321 ccgggcacgt cggcgaggaa ggcctggccg gggccgaggg cgtcgacggc ctcgtcctgc + 37381 ccctcggggg tgaccgggaa gagggtgaag acggtgtagt cgtcgcggtc cgggccgatc + 37441 tcgatcttgc cgccgagggc gtccgaggtc agcgtgtggg cgacctcgtt ctgcatcagc + 37501 cggatcgagg tggtgatctc gccgaagacc gggagcgtgc ggtgcttgaa ctcctcgccc + 37561 gcgtagcgct tctcgaggtc ctcgccgctg cgccactgga tgaagttgag ggtgccgtag + 37621 ccgtcgacgc ccgagtggac ggtggaggac atccagccct cgtacgcggc cgcgttgacg + 37681 atcttcgtca tctcctcgat cagcttggcc tgcttctcgg gagtgtccgt ggtgaacagg + 
37741 ttcaggacgg tgaggtgctt gtcctcggcg gagatgatgg gcatgggtcc ttcgctttcc + 37801 ttggtgggtg cggtgggtgt cgctgcgcgg cccgcgacgg tcaggcggtg gggccgaacc + 37861 agcggccgag ggcggcggtg agaccgtccg gcccggcgcc gaggccggcg acccaggcga + 37921 cgtagccgtc ggggcggacg aggatgccgt ccacgggggc ctcgcagccg tcgaactcgg + 37981 ccgcgacgag gtcgacccgg tcggcccagc cggcggccgc ggtgcgcagg ccgtggtcgc + 38041 ccccgagttc caggagcacg gggcgtgcgg tgcgcagcag cgcgtagaac ggggtcttct + 38101 caccgtcgac gaccagttcc cggtccggca ggcgccggcc gagcaggggg tggtcgcctt + 38161 cgccgacgtc gtgccggatg tccagtccgg tgaccatgcc ggccaggtgg cgctggacgg + 38221 attcgtgggc gcccatcagc tcggcgagca cctcgcgcat cggcgtgatc tcgtcgccgc + 38281 cgaggtagag gatgcgctgg gcgagggtgt tggtcaggat gcgggccccg acggggtggc + 38341 gctcggcgtg gtaggtgtcg agcagccctt cgggcgcctg gcccttgatg tcgagggcga + 38401 gcttccagcc gaggttcacg gcgtcctgca cgcccgcgct catgccctgc gcgccgatcg + 38461 gcaggtggat gtgcgcggcg tcgccggcca ggaagacgcg gccgtggcgg taccggtcgg + 38521 cctggcggct gacgtccgtg gtggagctga cccacagcgg ggtggcgccg ctgacgtcct + 38581 cgccggtcag gcgctgccag gtctgggcga cctcgtcgaa ggtgatcggg tccgggctgg + 38641 tgcgcagcgg ctcggagctg tcgaagtaga tgacgcggca gcggtccggg cccatcggga + 38701 tgaccatgac catgccgccg gcgacgcgct ccccgctgaa ccggggccgc agcgccactc + 38761 cggccaggtc ggcgaagcgc agctcgatgg ccggctcggt gccggggaag ccgatgcccg + 38821 cgagcttgcg cacgatgctg cgggcaccgt cgcagcccac cacgtggcgg gcgcgcaggg + 38881 agaaggggcc gtcggcgccc gcggcggtga cggtcaccga ggcgtcggtc tgctcgatgc + 38941 ccgtgacctc gcacccgcgg cggatgtcgg cgcccagctc gcgcgcccag ccgcccagga + 39001 cgccctcggt gcgggcctgc gggatgccgc gcgccccgta cgaaccgccc tcgatcaccc + 39061 ggtagtcgag cgggacgccg ccgaagtggc cgaccgggat gactccgacc tcgccgaacc + 39121 ggtccatcag cccgcgctgc gcgaattcct cgatggtccg cgccgagaaa cccagggcgc + 39181 gggattcctg aatcggctcg gaaagtttgt cgagaaccac caccgagact ccagcgagcc + 39241 tcaattcacc tgcgagcata agaccggtgg gaccggctcc cacgacaatg acatctgaat + 39301 cgtagaattc catctgccct cttctcactg gtgttccatc aatagtgcga gggcttacga + 
39361 gggctgtaaa taggcgttgt tacaggtctt gtgcagtcaa tgccagaaaa acgtctggta + 39421 cgtcagagct tcgacaagcg gtcttgcccc gggcgcgtgg ggtgacggca ttctctggca + 39481 tgacctccag tctgacgacc gatcaatccg catccgtttc cgccgccgag tcgagcgcac + 39541 aggtcgccgg tctgctgcac cggtatctgg tctcgctcga cgacgagcgg ctcgacgacg + 39601 cctggaccgc cggcctgttc accgaggacg cggtcgtcgc gttcccggtc agccggcacg + 39661 agggcgccga cggcatggcc gagtaccacc ggtcggcgct gtcggcgttc gcggccaccc + 39721 agcacctcgg ttctccggcc gtggtcgacg tggacgggga ccgggccgtg ttccgggcga + 39781 acctgatctc cacccatgtg caccacccgc gccacacgcc tcccgagggg gacctgcccc + 39841 cgctcttcgc gacgggcacg ttcgtgaacg gcgaggcgcg ccgcaccgcg cggggctggc + 39901 ggctgagcct gctggccttc cggctgctgt gggcggacgg ctcccctccc ccggcccggt + 39961 gaccccggcc gcggtgcggc ggcgcctgga cgtccggcgg cgccgcgccg cggtacacgc + 40021 gcgtgccgcc ccggacgcgg tccggggcgg cgggggcggt gggggggggt gatgggggcg + 40081 gtggtgggtg gtgggggtgg tggtgggggt ggtggtgcgg agccggcggg gcaggcgttc + 40141 agacgttcag gcgttcaggc gttcaggctg aggacgcggt cgaccgcgat ctcgatgacc + 40201 acccggtcgg acggggtcgg cggggcggac cagtaccgct tggcgtacag ccgtgccccg + 40261 agcgccaccc gttcggggtc ggtcacgacc gtgccggtcc cctccagcgt gacccagcgg + 40321 aagccgtcca cctggcagag cgccaccggg gcgccgggcg tggccagcag gttgcgggcc + 40381 ttgcgggagg agctcaccgt catcacccgc gcgagctggg cgtccgcgtc ccaggtgaag + 40441 cgcacggggg ccacgtgcgg tgtgccgtcc ggccgcatcg tcgtgaacgc ggcgacgagc + 40501 gccgtaccgg tcaggaacgc ctggacggag tcgggcaccg tcacggcgtc cgggcgcggc + 40561 atcgacggca tgggcgggtc ctcgcttcca gagggtgttg cgtgcgtggg cgcttcccgt + 40621 gctccgggcg gctgtcgcgc gggcgtcggg ggcggccgtg ggtccggggc cagcttgccg + 40681 ggggccgctc gaccctcgct ggacccggct cccccgcccg gcccgccgcc cgcctccgcc + 40741 gtacgccgta cggcatgtgt cgtgcgctgt gcgcccgtgg gtcgtgcctc gtgcgtcgtt + 40801 tcgggtgtcc gggctagtcg atgctgcgga cgatgacgcg tccgtcctcg tcctcgcgct + 40861 cctccgcgcc cgccagccgc aggggcggcg ggccgccgtg gaccgccctg gcgcatcggg + 40921 ccgtgtcacc ctcgtgccgt tcgtcgtcgc cttcgtgcat gggcacctcc tcggtgatcg + 
40981 gtcggcccag agtgtcaagg gtggctcgcg gcccggtcga cggccgcccc gaaggaagtg + 41041 gagcgcggcc ggagccagga cccggccggt cgcggcctcg agggccgcgg cgcgatgcgc + 41101 ggcagtgcct caccggcgag cacgtccagc acggccccgt tggtggtggc ctcgtcggtg + 41161 ccgggcagat gccgcagcag ccgggcgcag tgcccggcca gcaggcgggc gtcggcgtcg + 41221 gagatccggt tgcggtcgtg gtcgacgcag aaggtgaggc ggccgtcgcc gccgggacgg + 41281 accagcaggg cgacgggcag gtcggggcag gcgccgtgcg ccggttccgg ctccagtgcg + 41341 atgccggcgt cggcgagttc gttcctcagg ttgcccggcg ggcgcggaag gctgtcgacc + 41401 gagaccacgc tctgcagcag ttccccgtcg gggcagcggc ccgtccagcg gtggatccgg + 41461 cgggtggaga cccattcgta ggcggccatg tccagcgccc ggtcccgcag ggccgtcagc + 41521 agccggccga ccgtctcgcc agggtccacg cggaccacca tcggcaggca gttgcgcagc + 41581 ggcccgggca gccgctcggc gcagtccagg gtgatgccgc ggccggagac ggtgacgccg + 41641 aagcccaccg tcgcggcccc gccgggcccg gccgcgcggt acagcagcag cgcccagacc + 41701 gtctccaggg cgctggagtc gggtacggcg cgcagggcgg cccagcggtg gagccgttcg + 41761 gcctcggcgg ggctcagccg tacctcggtc ctgccccggc cccgctggcg ggtgcgcggg + 41821 ccgggccggg cgggcagcac ggcgaccggc ccgtcgggca cggcgccccg ccagaagtcc + 41881 cgggctccag cggggtcctg ccgctggagc cagcccgccc agtcgcgcag gtcggggcgg + 41941 cgctcgccgc cgggcagctc gccgccggcg aggtaggccc ggcacagctc ctgcatcagc + 42001 aggcacacgc tccacgcgtc cagcagcgcg tggtggaagg tgaggaccac ccgggtcacc + 42061 ggcccggcac cggccgggtc gtcggtgcgc tccacgaggg tgacgcgcag cgggcagggg + 42121 cggctggggt cgaggccgcg ccggcggtcc cgctccagca gccggtccca tccggcgccg + 42181 cccgcacggt ggcgcacgac gtcgccgtgg gcgtgctcgt gcaggaccag gtgcggccgg + 42241 ggccccgggg ccagggcggc ccgcagcacg ctctcccggt cgacgaccga ctgccaggcc + 42301 gcggcgaacc gctcggtgtc cagcgggccg tgccagcgcc agacgagctg ctcgacgtgg + 42361 cgcccggcgc cacggcgccc gccgaagtcg cccagcaggt cgaggtgggg ccacagggcc + 42421 ggtacgcccg gcggacgggc cgtgccgggg ccccgcaggg cacgcgggcg gctgtgccac + 42481 gccatgggac gccctcctcg tcgctgcctc ctcccgcacg ggccggccgt gcgcacggtt + 42541 ctcggggagc ggcgggcccc ttgagggggc gcggtactcc cccggcatcg tggcaccggt + 
42601 ggctgccatg ggcctgacgg cccgctgacg ctgctcgcga ccgggcggag aaacgcttct + 42661 gcagcggtgg ggccgtaccg gaacgcccgc tactgctgtc ccgtgtccgt catcgccgac + 42721 aggaacccct ggtccagcat ggtccccacg gaggtgtccc cggcggtgct cagtccggcg + 42781 ttgtggcagg ccacgctgag caggaagcgg tccatgacgg ggtaggtggc gaagccccac + 42841 tcgtcgcggg tgacccggct gccgtcgggt gcgctcagcc ggccctgccg gaagccgaac + 42901 tccttgaagc cgaaccgcag tccctgcccg agggccttgc tgtaggcctc cttcagggtc + 42961 cacaggcgca gtgcgtgggc ggtccgctcg ccttcgggca gctcggccag ttcccgggcc + 43021 tcggccggtg tgaagacctg ggtctcgagc aggtccagcc gtacgggccg ctcggccggt + 43081 tccacgtcca ccccgatgcg gccgatgcgg ctcaggccga cggccatgac gtccccggtg + 43141 tggctcaggc tcagttcgat ctggtcgaag ccgcgcaggt agggccggcc gcccagccgg + 43201 taggccaggt ccaggtactc gggcgggacg gccagggcgg cggccgccgt gtacttgatc + 43261 agcatgcggg aggcggcgaa ccggtagcgc accgcggcgt cgcgggtacg ccggtagcgc + 43321 tgccagtcgt cgccgagcag ttcccgcagc cgcggggtgg tcagcacgct gggcagccat + 43381 tcgctccacg tcgtgcagac cagtgcgttg ccgtgccgga agaggtcctc gcgcaccgcg + 43441 ggccaggggc cgtggggccg cggcacgtga aggggcgcgg cacatgtgac ccgctccatc + 43501 gtcgtctccc tgcgtgtggt tctcgccggc ccgctccccc gttggggggc gggccgaggt + 43561 ggggggcgtc ttgccgtgcc gtctcggtca gccggccagt ggggtgtcgt acaggtcgag + 43621 actgcggccg tgccggcagc gtcccagcgc ctcggccagg accgcctgtt ccgcgtccgc + 43681 cggtgtctcg ggtacggcga tgccgagtct gcggccgatg cggctgagga cgagcaccgc + 43741 ccaggccggg tcggcgagga agccgtcacc gtccgcctgt ccctcccaga ccccgaggca + 43801 ggcggcggcg cacagcagca gggcgtagcg gtcggccagg gcgcaggcca gcgggtcgaa + 43861 cacggtgctc ccggcggccg gcagggccgc gcagcgcgcg cgcagcaccc gcagctcctc + 43921 caccagggcg cgggccagcg cggcgagggc ggcgtgcagt ggttgtgtcc ccgtccgtgc + 43981 ggccagccgt tcggcggccc cgatcagggt ggccgtgagc gggtcgtcgg tcccggagtg + 44041 cgtcagcctg cggtggtcga gcggtggcag cggcgcgccc ggcaggaaca gtgcggcgct + 44101 cggttcggcg gtccggaacc acgccgtgcg tgccagggcc ggcagctggg gtacgagcac + 44161 cgcctggcag acggccgttc ccgagtggcc gagtccggcc acgggcaggt cgcgggcgag + 
44221 tttctggaag ccgccgtaca gcgggccgcg gtcgtagccg cgggcgccga gcacggcggc + 44281 gagttcttcc aggtcctcgc gcagcaggtc cggcatggtg tatttgaccg ccgccgcgag + 44341 cagatgggcg tgctggggta cgaggctgag cgcccgcagt cccgtgacgg ccatggcgtc + 44401 gcaggcgagc aggtccgcga agaccccgct gagtgccttg tgccagcggc gggcgggccg + 44461 tccgtcgggc cggttctcgg tggcggcgcg caccgcgagc cgcaggacgc tgtccacgcc + 44521 cgcgagcacc gtgcccggga tgaggcagtg gctgatctgg aagctgcgca gggccagggt + 44581 gacgccctcg ccgagcgagc cgaccagggc gctgtcgggc agtcgtacgt cggccaggcg + 44641 cagtccgtgg aagcgggccc cgcgcatgcc gggcatctcc acccgcgcca gccggcgcac + 44701 ttctccggag gcgggtggtc cgggcagcag gagcaccgag tggctggcgg agccggagcc + 44761 ggcggaggtg cgggcgtaga cgacgaaggt gtcggtgcgg tcggcgttca tgacggcgtc + 44821 cttgctgccg ttgagcagga agccgccgcc cgcagggcgt tgtgcgcgga cctcgcggcg + 44881 caggatggcg ttggcgtgtg ccacctcccg gtgcacgatc gcgacccggc ctccgccgag + 44941 caggacgtcc gcgagggccg cgcgctggtg ggtgtcgccc gcggtccaca ccgaggacgc + 45001 ggcgaacagc gaggtgatgc cgaagccgta gccgagggcc aggtcgcggc ggaagagcgg + 45061 gcgcagcacg cgggccagct cttcgaggtc cctcaggcgt ccgccgaggt cgtgggggac + 45121 gaactcggcg gacaggccgt gctcggtcag gagcgcctcg gtggcgtgtg gtgcctcgcg + 45181 ggtgtcgtcg gcccggacca gggccaggtg tccgtgcggg ttgaccgggt cgaaggggtc + 45241 gccgagcgcg gcctccagcc gggcggcgcg ctcgggttcg ggtgcgcggg tgatgtgttg + 45301 ggattcgggg gtggtgtgtt cgggtgcggg tgtgggggtg gtgctgcgcg ggtcgggggc + 45361 ctgccccgtc ggcccggcgg ccgtgtcgag ggcggcggtc acaggacccg caccgcgtcg + 45421 gaggcgtggc gcacggcgtg ctccagcagg cggcggccgg cccggccgac ctcgtcgcac + 45481 acccgccggg cggcgtcctg gtccagtgcg gcgtcgtcgt tgagcagcac gtcgtgccgc + 45541 acggtgacgt cgaggccggc tccgggctgg ggctcgatgg tccactcgcc ggtgtacgcg + 45601 gccagcggcc cggacgtgcg ggtgtgtttg tgcacgaggc ggccggcggc ggggaagctg + 45661 atgcgcaccg cctcgccgcc ggtggccgac cggccgtcca gggcgaggac ctggatgccg + 45721 ggggtgtcct cctgcaccgt cagggggcgg gtgccggcga ggtcgtcggg ccagtcgccg + 45781 gcccggtaga ggaagtcgaa gaccagctcg gcgggcacgt tgacccggac ggtgtcctcg + 
45841 aaggacatca cgaggtcgtc cagccgggtc cagcgctcgg cgagccaggc caggcgctgg + 45901 agctgggcgc ggctgttggc gcgggtgacc cgctcggtcc aggccgcgtc ggccggagcg + 45961 tcgccgacga cggtgaaggc gtgttccagg gtcacccggg agccgtcgcc caagggctcg + 46021 acggtccaca ggccggtcat cgtctcgacc ggggcggagg gccgttcctg gcggaactcc + 46081 acccgccgct gtccgacgtc caggcgacgg tgggagaccc aggagctgat ccggtcgccc + 46141 gccacggccc acatgcgcag ccgttcccgt gtcccgtcga agtccagttg ttccacgtgg + 46201 acgctgggag ggaagaacag cggccacacg gtggcgtccg cgatcaggcc gtagagcact + 46261 ccgctcgggg ccggggccgt catctcacag gcagtacggt gcactcgcgc atccggcatc + 46321 gtccacaccc tccgtcgtcc aaggcgtcgc cgccgggccg gtccccgctg ggccgcacgc + 46381 gtgccgggtc caccgggggc gggccggtgc ggccgggccc gtcgtactgc ggcttttctc + 46441 gaccctgtcc ggaaccgcta gggatgtgcc ggtagcgcgc tcgtgtcccg ctggagcggc + 46501 gccccggggg cacgcgctcc agcgggaacc gtcgggtcct cgagcccggt ggccgacggt + 46561 ggcctgcggc cccagaagcg atccgggagg tggcagggat gagacgcttc cgcccgcgcc + 46621 gatgcgtccg tggcctgtgg gagggtctgg tcgcctacgg gcggctctgc ctggccggcg + 46681 agacggaccg gtacgaccac cctccgcgcc cgcgcgtccg gtggcaccgg ccgccgccgg + 46741 gacacccgga acgggtgcgc gacgacatgc ctctgaccga cctggagcgg cgcctggccc + 46801 gcgaactgac cgacgaggac cacgacgtcc gctaggcggg gacgccacca cgcgtgccgc + 46861 gggcggggcg gcggacgccg ggcagccggg agacacggac ggccgggcag ccaggagacc + 46921 ggcaaggccg gaaggccgga aggccaggag ccggaaggcc gggcagccag gagacctggc + 46981 agaccgggga gccaggaggg ccaagagccc aggagcccgg gaggccagga ggccaggagg + 47041 ccgggagccc aggagcccga aggccggaag accggagggc cgggagtccg ggagggccgg + 47101 ggagtcggcg ccgggggtgt ttccctttgc gcggcccgcg gggcgcgggc cgttcctggc + 47161 cgccggtgtg ttccgctccg tctcgttagg ggcgggccgt cactgcgcct gaggggcccg + 47221 gagcactgcg gcggagttga agccgccccg tccgcgggcc agtaccagcg ccactcgcag + 47281 ccggggcagt tcccgtgggg ctccggtgac caggtccagc gggcagtcgt cggcgacgcg + 47341 tccggttccg gtggtcgggg ggacgacttt ctcgcgcagg gcgagcagcg cggctgccac + 47401 gtccagggcc gagccgcccg cgcccagccg cccggtcatc gtcttcggca cggtgaccgg + 
47461 tactccgtag ggtccgaaca gcgcgcacag cgcctggctc tcgacgaggt cggcgcgccg + 47521 ctcggcggcg ccgtcggcga agaccacgtc cacgtgttcg ggggccaggc cggcgtcggc + 47581 cagggcgagt tccgcggcct ggcgcagtgt ggggcggtcg gggccgtcga aggtggcggc + 47641 gcagccggcg atgacgccgt agccggtggc gccccggcgg gcggcggccc gggcgtcctc + 47701 caggacgagc agggcgccgc cctcgccgac cgcgtggccg tcggccgtgg ccgcgaaggg + 47761 ccggtaggcc cgggcgggtt cggtggccgg gctgagccgg ccgtccgcca ggtgcgcggc + 47821 ccagccccat gcgcacagtg tggagtcgat cccgccggtg accatgaggc atgccccgtc + 47881 gcggatccgc cgccgggcgc gggcgagtgc gtcgatgccg ccggcctgtt cgctgacgac + 47941 ggtcgagccg tggccgcgca gccggtgccg gatggagatc tgtgcggggg ctgccgcgtg + 48001 gaaggacgcg aaggactggt aggcgctgac gtgctgggcg cctttgctcc acagcgcggc + 48061 cagtccccgt tcgccgaatt cggcgccgcc cgcggagctg gcggtgatca cgccggcgcc + 48121 gtatgcgggc aggtcggccg ggctcacgtt agcgtcgcgc agtgcttctt cggctgcgac + 48181 cagggcgatg cgggtgccgc ggtcggtgga gggcagcagt ctgctgggga tgtggtcctc + 48241 gtcgacgaag ccggggatct cgccggcgat gcgtacgggg tagccggagg cgtcgaagcg + 48301 ggtgatgggg cccagtccgg tgcgcccgca cagcacggcg tcccaccagg ctctggtgcc + 48361 caggccgttg ggtgcggcga ctccgatgcc ggtgaccagg gtctggcggg ggccctgggc + 48421 gccggcgggg cgggccggtt cgggggcctg ggtcgccttg gtcatgcggc ctccttgagc + 48481 tgtggccggg tgaggacggc ggccgtgtgg aagccgccga agccgctggc gacggtgagg + 48541 acggtgctgg tgcgctgttc ccgggcgaac aggggggtgt agtcgaggtc gcaggtgggg + 48601 tcgggttcgt ggaggttggc ggtgggcggg acggtgtcgt gccggatggc cagggcgctg + 48661 gcggccaggt ccagggcgcc ggcggcgccc agggcgtgcc cgatcatcga cttgatggag + 48721 ctgacgggca cgcggtgggc gctgccgccc aggctttcct tgagggcgtg tgtctcgtgc + 48781 cggtcgttgt gccgggttcc cgcgccgtgg gcgctgatgt agtcgacgtc ggcggggttc + 48841 agccgtgcct ggtcgagggc ggcgcggatg gcgtcggcca tctccagtgc cccggggcgc + 48901 agtcccgtca tgtggtgggc gctgctgtgg gcggtgacgg cggacagttc cgcgtagggg + 48961 cgggcgccgc ggcggcgggc gtgttcgagt tcttccagga ccaggacggc ggcgccctcg + 49021 ccgagcacga atccgtcgcg ggtgcggtcg aaggggcggc tggcggtggc ggggtcgtcg + 
49081 ttgcgggagc tggtgaggcg caggcggtcg aagcaggcca tggcgatggg cacgatgggt + 49141 gcttccgttc cgccggcgac gacgatgtcg gcgctgcctt cccggatcag gtcggcgccg + 49201 tggccgacgg cgtccaggcc ggaggtgcag ccgctggaga cgagagcgac ggggccctgt + 49261 gcgccccggt cgcgggcgac ggtggcggcc agggagctgg ggacgaagta gtcgtagagg + 49321 gattcggcgg cctcggtgtg gtcgagggtc caggtggtgc cgcagtcgct gaggatggcg + 49381 tactgggtgg ccaggctcgt ggtgcagccg atggcgctgc ccaggctgac gccggtgcgc + 49441 agggggttgc ggccgatgcg gtccgcgacg ccgctgtcgg cgacggcttc gcgtgcggcg + 49501 accagcgcga actgtgccgc gcggtccagg cgttcggtgt cggcgaggtc gaatccgtgg + 49561 gcggcggggg tgaagtcgac ctcggcggcg acgcgggagc ggtagccgca ggcgtcgaag + 49621 agggtgacgc ggcgggtggc ggtgcggccg acggtgagca ggtcccagaa gccggcggtg + 49681 cccaccgcgc cgggggcgac gacgccgatc ccggtgatca cgacgcggtt caccggccgc + 49741 ctcccgtggg cagcgcggtc acgtggccgc ggcaggcccg gccgacgtgc tgggccaggc + 49801 tcgaggagct tgcgaagaag tgtcccccgg cgacggtgtg cagttcgatc aggttggtgg + 49861 tccactgctg ccagtggcgc agggcggcgg gtgcggcgag cgggtcgtcg cggcccgcga + 49921 agaccaggac gggcacgtcc agcggccctc cggtgaccgg gtccagggcg gcgttgcgca + 49981 gcgaccgggc caggcgcagg tcgtcgcgca ggacgggcag gaaggtgcgc cgccacagtc + 50041 cgccgggaga ggccgaggcg cccggcggca gggagccgat ctcgtcgagc agcggcagca + 50101 ggtcctcgtc gggcaggtcc gccgcgtccg ccaggacggt ggtggtgtgc gggggcgggc + 50161 aggcgccgac ggccaggaac agcgggggca ggccggagtc ggccagggcc cgggtgagcg + 50221 tgtagccgac gagggctccc atgctgtgtc cgtagagcgc gtaggggccg cggcgtgccg + 50281 tctgaagcag ggtcggcagg aagtcggcga gcaggccggc gcgttcggtc aggcgtggtt + 50341 cgcggcggcg gctgtcgcgg cccgggagcg gcagggcggc cacgtcgatg ccgggtccga + 50401 ccgccgcgga ccagccgcgg tagctcgcca cgcccgctcc ggcgtgggcg aggcaggtga + 50461 gtgtgatccg tgcggtgccc gcctcacggt ccctggagcg ggaagccatg cgtcgccctc + 50521 cttgtgaacg gtccggtccg gccccatccg ggcgggcgcc gccggcgtgg cgcgtgccac + 50581 gcggtgccgt cccggcgccg gtccgggggg tgggtgcccc tgcgcaccga gcgtcgcccg + 50641 cgcggctcgt gcggcgctca accccgcggc gaggcgggcg gcgaccccgg ccggcggccg + 
50701 cggcggccgc cgcccctgcg ggggccggcc tgccgggtcc ggccgggcgg cgagggcacc + 50761 ggcgtctcat gccgcgtaca ggtcgaacgt ggaggtgcgc cgggggcccg ccacgatgtc + 50821 caggcgcggg tcgacggcga gcatcgcctg gtgcagccgc tgcagttgcg gggagggttc + 50881 gacgccgagt tcgtcgatga gccgctggcg gagcctgcgg tacacgtcga gggcggcggc + 50941 ctgcctgccg gagcggtaga gcgccaccat ggcctgggag tgcagccctt cgtgctgggg + 51001 gtggcgggcg atcaggtcgg tgagttcggc gatgagttcg acgtgccggc ccagccgcag + 51061 gtcggcgtcg atgcggcgct cgcgggccac cagccggctc tgctccaggc gcatcgcctc + 51121 gatctccagg acgggcccga cccgcacgtc gaccagggcg gggccgtccc acaggtcgag + 51181 cgcccggcgc agcaccgtgg ccgcccgctc gtcctcgccg tcctcgtagg cctgtcgtcc + 51241 ttcggtcacg agccgctcgt aggtgaacgc gtcgaccgcc tcggcgggta tctgcagcag + 51301 gtacccgccg tagcgggtgg ccaggacgtc cttggccgag cccggcacgt cggggcccat + 51361 ggccgtgccc agcaggcggc gcagctggag gatgtacgtc tgcagcgtgg tcatcgaact + 51421 ctgcggcagg tcggtgcccc agatctcctc catgagggtg ggcaccggca ccacccggcc + 51481 ggggtacagg gcgagcagcg ccaggatctg ccggggcttg cccgcactgg ggacgaccga + 51541 gattccctcg aattcggcgt tcaacgcacc caggactttt atttccataa ttccctccgc + 51601 aatgtttcgg ggcgactggt tctgagccgt tgacggagct acttgatact gcctccttgc + 51661 gcctgtccgc gtcattcccg ccactccgcg gcaagaggaa ccggacggtt ctctgatcgg + 51721 cgcgcgaggg cggctctagt tattcttgac ccgtccctgg aagacaggag gctgcggctt + 51781 tgtccgggct gtcgccgggt taccgctcac gggtggtgat tttgcgcccg gtacggtcgg + 51841 gggcgtattc gtttcggttg tttttccggc cacggcgagg gccgcggtga gggccgcggt + 51901 gacggcgtcg ggcggcgcgt gcggggccgg ggagcggtgc cggccgtccg gggacggtcg + 51961 tggccggccg tccggtggcg gagggtttcc tgtcccgggc ggcggcgccg agcccctgtc + 52021 ccggccggtg gcggagggtt ccctgttccg gccggtggcg gagggtttcc tgtcctggcc + 52081 ggcggtaccg ggtttcctgt cctggcgggc ggcgggtggg tgtcaccggc tgtccgggcg + 52141 gggcgggctt ttcggtcgcg gtgtcctgtc cttttcgggc gggccggggc cgcgggggct + 52201 gaagaactct cgaggaatcg cccacgccgg tacggggccg gctggagaat agcgtgccgg + 52261 aaaccatggg cggatagagt ccgtgcggaa ggaagtgcac ctgctattcg tgagggaata + 
52321 ccggggccgt gatccgggcc ggcggatgcg gaatcgggtg cttcccgggc aagggcgaga + 52381 tggagttccg gattcttggt tccgtgcaga tccacgacga gcgttttggc gtccgggtcg + 52441 ttcccgcggg tgcgaagcag cgtgcgctgc tgggtgcgct gctggtgagg gccgggcagg + 52501 cggtgccggc cgagtgcctc gtggaggagc tgtggggcgg gcagcctccg gtcaatgccg + 52561 ccaacgcgct gcaggcccat gtggcccggc tgcggcggct gctgccggcc ccgggcccgg + 52621 gcgggccgcg ccatgtgtgg ctgcggacct ccccgttggg ctacaccctg agcctggggc + 52681 cggcggtgac ggacgcgcag cgcttccacc gtctggtggg ccaggggcgc gagctggccg + 52741 ccaccgcccc gggccgggcg gtggaggtgc tgcgcgaggg tctggcgctg tggcgcgggc + 52801 ccgctctgca gggcagcggc caggggccca tctgttcggc cgaggcggcg ctgctggagg + 52861 agagccggct gcgtgccctg gaggtgctct acgacgtgtg tctgcgggcg gaccgctgtg + 52921 cggagatcac cggtgagctg gaggagctgg tcgccgtgca cccgctgcgt gagcggttcc + 52981 acgagcagct gatgacggcg ctgcaccgct gcggccgccg ggcggaggcg ctgagcacct + 53041 acgacagggc gcgccggcgg ctggcccgtg atctgggtat cgggccgggc caggtgctca + 53101 gccgtcgcag agaagcgatt ctgcgttcct gtgagccggc ggcggactcc gccgaccggg + 53161 cgggggccgg gacggccggg cagggcgggg acgaactcgg ggtgctccgg gaggagctgg + 53221 tgcggctgcg cggccacgtg gagctgctgc gccggcagca gcgggagctg tccgagcagg + 53281 tcgcccggct cacggcacac catccgtgcg gcccgtgagg aacggcggcc gggtcagcgg + 53341 gtgacgaggc ggccgctgcc gccggcggcg gcgggcgtct cggggcgggc catgaggatg + 53401 gagcgctgca ggcggctgag tgcggcggag ggttccaggc ccagttcgtg cacgagtgtg + 53461 ctgcgcagcc gctggtagac gttgagggcc tcaccgcgcc ggcccgagcg gtgcagggcc + 53521 agcatgaact ggccgtgcag gctctcgtgc atgcggtact ggttgaccag gaccgtcagt + 53581 tccgacagca gttcccggtg gcgtccgagc cgcaggtcgg cctcgatgcg ctggtcgagc + 53641 gcgcacagcc gggcctcctc cagccgcttg acctccgtgt cgatgcgcag gccggcctgg + 53701 atgtcggtca gggcctgccc gttccacagc gcgagcgcgt cggccagccg gcgggccgcg + 53761 ccggcgtagt cctcggcgtc catggcccgg tagccgaggc cggcgcgctg gtcgaactcg + 53821 cggtagtcga cgtggccgcc gcgtgtctgc aggcggtagc cgccgggaac cgtggcgagg + 53881 atgtccttgg cggtgcagcg ttcgtcgggg ccgtgggcca gcgcctgggc catcagctcg + 
53941 cgcagctgca ggacgtaggt ctgcagggtg gtccgcgcgc tgcgcggcgg gttctccccc + 54001 cacagttcgt cgacgagcgc ggccaccggg accacctggt cggcgttgag cgcgagcagg + 54061 gccaggacct ggcgcggctt gggtgcggtc ggcacgaccg acaccccgtg ttcgcgcacc + 54121 gacagcgcac ccagcacttc gatgtccacg tttcccccat gttttcaagg ccgcaggccg + 54181 gtggccggcc tgcgcgtctc ccgctgaccg ggacccggcg cggctgcagt cccgataaaa + 54241 aaacagctca gtcggtttgt caatgtggac tcgacgcgtc gccccggcat cgcccagatc + 54301 cagtcaaacc ctgatcgaac atctgcccac aacccggctc cgagcaggcc gttcatcact + 54361 caacccgccc atgattcgcc agtgttgcgc gaaaccgcgc cctgtacagc accggagcga + 54421 ttgactggaa accatcggcg cggatcgcgc gggacgggga agccccgcac agggaaaagg + 54481 ggcgccattt cccgaatgcc cgattcgggc gtccggtcgg cgcccccaaa ggagaccgta + 54541 cggtctttaa ttatccggtg gcggtcccgg tccaggagcc ctcggcctgc cagagcccgg + 54601 cgtgcggcgc cggcgcgagc gcgggcagga gcagcagcca gaactgggcg accgtgctgc + 54661 gtgacagcca cgcctggttg cgcatgccga gcacctcgaa gccgctggtg gcggcgacca + 54721 cggcggccac ggcgctctcc ggcgcgacgc tctcgcgcag ctcgccgccg cgcccggccc + 54781 ggccgaccat gtcggtgacc cagttctgcc agcacagccg caggtcggtc cgcggctgcc + 54841 ggccggcctc ccggctcagc tcgaaacccg cccgcagcac cacgtcgttc tgcagggcgc + 54901 aggccagctc atgggtggcg ttcaccaggc actgcagaac cccgggcggt cccccgtccc + 54961 accggccgca gacggcccgc agcacgtctg cggccgcttc ctccaccgcg tccgccagcg + 55021 ccgccttgct ggcgaagtgg aagtgcagtg cgccgttgct cacccccgcc ctggagctga + 55081 tcgtggtgag cgcggcggcg tggaagccct cgtcgtggaa gatctcggcc gcagacctga + 55141 tcagggcttc ccgcgtacgc accgcacgtt cctgtctggc catcgatcac tccgtcactg + 55201 cggggggttg ccgtgcttgc gggagggcac gtcggcgtcc ttggtgcgca gcatcgccag + 55261 ggactcgatc agcacctcgc gggtctcggc ggggtcgatg acgtcgtcga ccaggccgcg + 55321 ttcggccgcg tagtaggggt gcatcagctc ggccctgtac tccttgacca tgcgggcgcg + 55381 caccgcgtcg gggtcctcgg cctcggcgat ctgccggcgg aagatgacgt tggcggcgcc + 55441 ctccgcgccc atcaccgcga tctcgttggt cggccaggcg taggtgaggt cggcgccgat + 55501 ggactgggag tccatcacga tgtaggcgcc gccgtaggcc ttgcgcagga tcagggagat + 
55561 acgcgggacg gtggcgttgc agtacgcgta cagcagcttg gcgccgtggc ggatgatccc + 55621 gccgtgctcc tggtcgacgc ccggcaggaa gccggggacg tccaggaagg tgacgagggg + 55681 gatgttgaag gcgtcgcaca tctggacgaa gcgggcggcc ttctcggaag cttcgatgtc + 55741 caggacgccg gccagggcct gcggctggtt ggcgacgatg cccacgacct ggccgttcag + 55801 ccgcgccagg gcgcagatga tgttgcgggc ccagccctcg tggacctcca ggtactcgcc + 55861 gtcgtcgacg atctcctcga tgaccctggc catgtcgtag gggcggttgc cgtccgccgg + 55921 caccaggtcc agcagcgcct cggaacgccg ggactgcggg tccgagcagg gcgtgcaggg + 55981 cgggaactcc cggttgttct gcgggagcat cgacagcagg tagcggacct cggcgaggca + 56041 ggtctcctcg tcgtcgtagg cgaagtgcgc gacaccggag gtctcggcgt ggacgtcggc + 56101 cccgcccaga ccgttctggg tgatctcctc gccggtgacc gccttgacca cgtcggggcc + 56161 ggtgatgaac atctgcgagg tgtcgcggac catgaacacg aagtcggtga gggcggggct + 56221 gtaggccgcg ccgcccgcgc acgggccgag catcacactg atctgcggga tgacccccga + 56281 cgcccgggtg ttgcgctgga agatgccgcc gtagccggcg agcgccgaga cgccctcctg + 56341 gatccgggcg cccgcaccgt cgttgaggga gaccagcggg gcgccggccg cgatggccat + 56401 gtccatgatc ttgtggatct tcgtggcgtg cgcctcgccc agcgcaccgc cgaagatccg + 56461 gaagtcgtgc gcgtagacga agaccgtccg gccctccacc gtgccccagc cggtgatcac + 56521 accgtccgtg tacggcttcc tggcctccag cccgaacccg gtcgcccggt gccgccgcaa + 56581 ctgctcgacc tcccggaacg accccgcatc cagcagcagc tcgatccgct cccgcgcggt + 56641 cagcttgccc ttggcgtgct gcgccgccgt cgccttctcg ctcggcccgg ccagtgcctg + 56701 cgcacgcaca ccgtgcagct cggccacccg cccgcgcgcg tccgccggct ccgcgggaag + 56761 cgccacccga ggaatgtcat tgagtatcgt cacgatctgt ccctccctca tggcgcggcc + 56821 cggtcgtcgc ttcaccgtaa caaaccatct atgcggtttt ggttcgggga gctcggcgcg + 56881 cacaggaatc agccatggaa gatgcggtgc cggcctaccg ccagcagtag ggggaccggt + 56941 aggccccggc ccggtgtccg ggccgccacg gggcagcccc ggaccgctcc cgcccgcccg + 57001 gcccctcgtc ccggcgggcc gtcagcgcgt acagcacggc ggtgagcgcg gccagttcct + 57061 cggcaccggc acgtccgcgc tcgatgcgca cagcgggcac ggcccgctcc ggttcggcca + 57121 tgtcccctcc tctcggcgtg cggccaccgt ccgcccgcgc actacaggag cgctgcactt + 
57181 ccgctcgaga ggacgggcgc cggccccgcc gccccgcagg cgcccgcagg ggcccgcctt + 57241 cggcaacaga gcagggtgcc gggcggagcg acggcttccg gaagggcggc ctccaagagc + 57301 ggctcgtcgg agggaccggt tcccctagaa atcaaaccgg acggtcccta tctttcatca + 57361 cgtccgtcac cgacggcgga cggagcgctt tcgatacgtc cattagcagg gggaaaaatg + 57421 gctaccagcg cgttccccgc aacacacccg gccctcggcc aggagcccgt actgcccgcc + 57481 ggcaccccgc ggttgcggcc cagcctcttc cgctacccga acctgacgac gaccgtcccc + 57541 aaggaactgg tccaccgcgc cgccgtcgcc gaggtcatgc tcaccgactg ggagcgcgtg + 57601 gacgacacac gcttcaaagt cgccgcccag tggccgcgcg gccacagctt cttcaccccg + 57661 atcgacggcc gctaccacga ccctctcatc gccgccgaaa cgatccgcca ggtcggatcc + 57721 ctcctcggcc acgccgaatt cggcgtcccc ttcggccacc actacctgct gcacgacctc + 57781 agcctgcgcg tcgacccgca ccacctgatg atccaccagg cccccgcctc cctcgacctc + 57841 gacgtgacct gcgaggacct caagatgcgc ggcggccgcc tcgccgccct gcgctacgag + 57901 gccgtcgtac gccgcgacgg ccacaccgcg gcgaccggcg tcttctcctt ctcctgcgtc + 57961 tcccccaccg tctaccggcg gctgcgcccg ccccacgtgt tcgccgacgg ccaccgcccc + 58021 ctgccgctga ccgcacccgc cgccccgcag agcgtgggac gcatgtcccc cgccgacgtg + 58081 gtcctctccc ccaccgagga cccccaccgc tggcagctgc ggctggacac ccagcacccc + 58141 gtcctcttcg accaccccgg cgaccacgtc cccggcatgg tcctcctcga agcggcccgg + 58201 caggcagcag caggagccct gggaagaacc tccctgctcc ccctcggcct gaccagcgaa + 58261 ctggtgcagt acgccgaact cgacatcccc tgcatcatcg aggccgcccc ccaccccacc + 58321 cacagccccg gcctcaccac cgtccacatc accggacacc aacgcggcca gaccgtcttc + 58381 acctgcaccg tcacagcagc agacgcctga cccccgccac cccgccgccc ggtcagcggc + 58441 cggaaaaacc cgccacatgg tcggccgccc actgaccaaa cgaccgcgca ggcctgccca + 58501 ccaggcgggc gaacgtcccg tccaccccgg ccttggcccc ctcccgctgc cgcacagcac + 58561 tccgcagcag cgcctccacc accgccggcg gataccgccg gccccaccgg gcccgggcct + 58621 cctcccaccc cagctcctcg aaacgcagcg gacggcccag cacacacgac agccgggccg + 58681 tccgctgaac cgccgagacc gcctccggac ccgtcagcac atacgcacgc cccgcatgcc + 58741 ccggccccgt cagcgcccgc accgccacct ccgccacatc ccccggatcc acacacgcgt + 
58801 tcaacgacgc cccgaacagc tcacgcacca caccctcggc ccggacctcc gccgcccacc + 58861 ccagactgtt ggacatgaac gaccgcggcc gcaacaacgt ccaggccagg cccgaggaac + 58921 gcagcagttc ctcgctctcc cgctgccagc gggtgatcag gtcgtcggcc cccgcatcct + 58981 cgacagcggc cgccgacagc ttcaccacat gctccacacc cgcatccgcc gccgcccgca + 59041 caaaacacgc atcctgatcc cccccgacca ccgtcgtcac caaaaacgcc cgcctcaccc + 59101 cccgcagagc cgcccgcaac gacgccgcgt caccgtaatc cccacggacc accctcaccc + 59161 gccccccggc cgccacccgg gcaggatcac gcgccagaac ccgcacctcc acaccggccg + 59221 gcaaccgccg caccacctcc ccgcccaccg tccccgaccc acccgtcacc aaaaccacca + 59281 caacgccccc caccccgaac ggccgatccc cacctgtcgc caccgaagtt acccacccgc + 59341 acgtcttggc cacacgccca ccgacgttaa aatacgaact agacggtttg taagcgaagc + 59401 cttccacagg gctcatcgca caacgggagg gcaacgtgcc ggcacaagaa cgagcgatcc + 59461 gcacacgcca gaacatcatg ctggccgccg ccacagtctt caacgaacgc ggctacaaag + 59521 ccgccaccat cgccgacatc ctcaccacag caggcgtcac caaaggcgcc ctctacttcc + 59581 acttcccctc caaagacgac ctcgcccaag aagtcctcgc cacacagaac cgcaacctca + 59641 ccatccccga acgcccctcc aaaacccaag aactcatcga cgtcgtcatg ctccacaccc + 59701 accgactcca gaccgacccc atggtccgcg cagccgtccg cctcaccatg gaccaactct + 59761 ccacagaatt cgaccgcacc ggccccttcc gccaatgggc cgacctcacc cgccaacgcc + 59821 tcgaacaagc ccgcgaccaa ggcgaactcc tcccccacgt caaccccaca gaaaccgccg + 59881 acgtcctcgt cggcgcctac gccggcatcc aatccatgtc ccacgccctc accgactaca + 59941 ccgacctcac cacccgcgcc aacgccctcc tccgccacct cctccccacc atcaccctcc + 60001 cctccatcct cacctccctc gacctcaacg aaaaccgcgg cgcccacgtc tacaccgaaa + 60061 tccacaccac cacctgaacc acacccaaaa acaatgaagt ggatcgcgcc tgattgcctc + 60121 atccaagagg cgagttgagc gatcaatccg aactgagaac gtcttccgtg aaccgtgcgg + 60181 gatgaaccgc gggacggccc caagccattg ccgccgcagc atgaacgcaa gtcccggtgc + 60241 cccggccgca ggccgctgcc ggaccgggaa gccccgtgca ggaacaacac cctgccccca + 60301 acacagcaca agccggccgc acactcggta ggccgtagcc gccagccagt tccagcagga + 60361 ccgggcgttc gacggaacac ccccgtgtcg gcgggaagga ccgctgccta cccctccacg + 
60421 cctgcccgca cctgaccttc ccggcacacc gccccgtgag tgccggaacg cggaggtcgc + 60481 cgaccgacgc gcagcagcct cactgaggcc cacttggtcg gccccgctgc agacctcgat + 60541 cgcaagaacg ttgaggaacg cgccgtggag gccatcacac gcttcctctc cctccctgac + 60601 ctggaattgc tgccctcggc agaccgcggg agatccaaga ccgttggttc aagcgagtcg + 60661 cagtcggcct aggttgcggt ggccacgtcc gaacacatct caaggagaag ttcatgtctg + 60721 acgcgaagga ggccggagac agagccatgt cacatgaggc agcggacgac agcgaccgag + 60781 acggcggaag aggatcctct aggctaggct ggcggctttc ctgcctggcc gttgtggtgg + 60841 ccgttctcgc cgtcgggacg ggaggccggt atcggcacac ctccggctga gatcgaccgc + 60901 tccggtcctt cctcgacaac aagagatcgg ccaccagggc tactggatca ccaacgcggt + 60961 ccaggtcacc ggcgactaca ggctcgtcgc cgagcgaccg gacgtggcac gcggccagca + 61021 gtcataggcc gtaagcgccg ggtcgcgggc agcggccctg tgcgatcact gacccaacac + 61081 cagagctccc gtaacgagac cgcgatccgc agtcctcagt ccccagacag cgggcgcgcc + 61141 acccggcttg ggttagtcag ctgtgctgct ggctgccctg gagagactgg tcggtcatgt + 61201 cggcaacctg gcctgctggc ggggcctcgg cgttgacctc agtgccgaag tccgagaact + 61261 ccatcaccgt gctcatctgc agctgctgag gcgaagcgct gccttccggc ttcgcggagg + 61321 cggaggctgg ggccttgagg gtcatctcta tctgctgacg gcgcagtcgc cctttgtcgt + 61381 cgagccagac gtgcatcggc agcgtcgggc cgacctgctt gctcagctgc tcgccgcccg + 61441 gcagcttgga gacgtccacg gacaccttgt actgcgtggt gttggccccg tcgatctcct + 61501 cggttccggc cttggtgacg tccttgttgg tgatcgccct ggcgtaggcg gcggtctggg + 61561 ccgggtcgcc gatctgctgg ttgctcaggc cctgctgcgc ggcgaccttt tccaagtcga + 61621 tcttgatcca gggtttgccc cccagagcct tctcaccggg aatcttctgg tagagaacct + 61681 ggtcgaccac gcgttgttcg atggtcttgt cctgcacggt aagggtcatg acactgtcgc + 61741 cctccgccag gtcgaggacg cccttaccgt cggatgtgat cgtcttgccc tccgcggcga + 61801 gcttcatctt gatcgtcatc cgcgcggact cggcttcggc cgtcttgtcg taggcagccc + 61861 gaacctccac cgtgccctgc tcctgggtgc cggcgctgct actcgcgctc ggcgacaccc + 61921 cgtccctctt ggcctgcgaa ccgtcaccgt caccgcaacc cgacaggaca acgctccccg + 61981 tcaccgcggc cactacgatc gcgccggcct tcatccccct gtagcgcatg cgaatctcct + 
62041 caacgagtac caacccccgt cacgtcggtc tgctgggctc cgaatgccct gaccaagggc + 62101 caacacgcct gtgtgcaaag tgaattgttg atacgtcccg cacggagaca gatattcacg + 62161 cttcctgcca ggtccaacgc tgctgctgcg atgtacgccc acacgcttcc accagccgca + 62221 atcaccatcc tgctgcccat cgaccgcatc gccgccgacc gcccccttct gctccggcga + 62281 gcacaagaga cacgggatga acgtgcaggt cccggccgat ccgtccggcc ggctgctgtg + 62341 ggcctctccg gctctgcccg gtgccgtcca cgacgtccga gccgcccgtg aacacgacat + 62401 cgtccgcaag ctcacggacg ccggcatcac gtgttggacc gacaagggat accgaggcgc + 62461 cgggggcacg gtccgcgttc cgttggggcc gtcgggagac acttcccgag gccagaagga + 62521 cgtcaaccgg tctcacgcca agaaatgggt cctggtcgag caagccgccg ccaccctcaa + 62581 tgcctggcga ctcctccgca acctacggtg ctcgaccagt ggcgtcacaa gcctcgtccg + 62641 ttccgtcgtg accgtgcatt tggccagcac agacggaaaa ggctcaatga cgaccttttg + 62701 agcgtcccat acagatgccg actgctaccg cgaggacggc aacgacgaaa ggaccgttcc + 62761 catggttccg ccagggaacc aaagtgcagc cagagcagtc atctttttcc accctattat + 62821 gtgctgcgtt actgctccag atcctgcagg cctagcaaca caacgggccg accgccgggc + 62881 cctcgcctgg actgacacac ccctcatccg ctggacttac gaccactctt catggcgtag + 62941 gtaagcatcc cgatgccggc gactccgaga actcctagcg tgaggagtat gaccctccca + 63001 gatccctcga tgagagatcc ttgaacgaga gcagcaactg acaccacacc actgacagcg + 63061 gtgaatatct tcaactttcg cttttcatcc acttccaata ctccgctctt gagacatgaa + 63121 cacgaccagc ggtggagagc cctacatgcc ctccaccgca gatgacgaat agggtcagcc + 63181 cttcctgaac ccctcagccg taggtgatta tctcagcgtt gttgtagccg aggacccctc + 63241 cgacggcgca gctcgtcact acagcgcccg ccgttcccca cgggccgaag gtgctggccg + 63301 ccgcgatgat tcccgtttct gccgcagctc cgactccagc gacgcaaccc gtgacagctc + 63361 cccaaatgtc gttggtgtcc tcgaggaagt tggacacact gtcgaggaac ccgagtccgg + 63421 acggatccat gttgttgatg gggtcgccgg cagcgtagag gtaggggttg gtttcctggc + 63481 cggaggggtc gggctgggtg aagcggccga gggtggggtc gtagtagcgg tggcccatct + 63541 tgtacaggcc ggtcgggtcg gcgtaggcgc ccgcgtagcg gtacggctga gggacggcct + 63601 cggtcggcgt cgtgcgcggc agtccggtgg ggccgtaggt gtaggtgtgg gtgcgcttgc + 
63661 cggtgtcgtc ggcgaggccg aggacgttgc cggtggcgtc ggtgaggtag tagtaggact + 63721 tccccccagt cgtcatggag ttcagcgtgc ccgccggttc gcggatgaat ccggtgtcga + 63781 cgccgttcgt cgtggtggag gcgaggccga gggcggtgtg gtggaaccat gtggagccga + 63841 gtttggtgcg ttcggcgttg gtggtgccgg catggaccag gtcgtaggtc ttgccgcctg + 63901 cggtgatgcc ggacagttgg ctgtagtccg tccaggactc gtccgtgcgg ggggtgttgt + 63961 cggctgcggc ggtttcgttg ccgagtttgt cgtaggacca gccggtggtg gagccgttct + 64021 tgccggtcag ctcgctggcg tcgttgtagg tgtaggtggt gccgccgggg caggtgttct + 64081 tgctgccgtc tcggctggtg aggttgccgg ccttgtccca gcagtacagc cacgacgcct + 64141 tccgcgtgcc tgccgcgtcg gcctcgagcg cgtaggagag gcggtcttgg gagtcgtagg + 64201 tgtaggtggt cttgagcttg gtgaggttgt cggtgcgggt gcggatcttg gtggtgtcct + 64261 tgcccgcgtt ggcgtagctg taagtcaggt cgacgaaggt ttgcgtgccc gaggtggtct + 64321 tgatcgcctg cgggcggccg ttcttgtcga tggtgacggt ctgggtggtg ccgccggggt + 64381 agacggtctt ggtgcgcttg tcgttgttgt tgtagtcgaa gtcggtcttc ttgccgtccg + 64441 gtgcggtgag gtagtcgagg cggccggcct tgtcccaggt gtagtccgtc gtcccggtcg + 64501 gatcggtgta gaagtcgacg tcgccgccgg gggtgtaggc gagtgcggtc tgggcgccgt + 64561 tctgcagggt gcggacgctc tcgcggttga gcttgtcgta gtcccacttg gtggtgccgg + 64621 aggcgtcggt gcgggacttg acgttgccgt cgccgtcgta cgagtaggtg acggtgaagt + 64681 tggtggagga gacctcgtgg acgcggtcgc gggagtcgta ggcgtagacg gtggtgatgc + 64741 cgcggccgtc cttgaccgtc tcgacccggc ccagcgcgtc gtaggtgtag gtcgtctccc + 64801 cgagcggcgc cggcggtgtc accttgatca ggttgccctg gtcgtcgtag gtgaaagagg + 64861 tgaccttgcc gttgccgtcc ttggcggtgc agcgctggcc ctcgaaaccg ccgcaggtcg + 64921 gggtgtcttt gttgtaggtg tactcgcggg tcgtgccggc ggtgccggat gtggtgaccg + 64981 acagggtgtt gccgttggtg tcgtacttga aggagtcctt gcggccgttg gcgccagtca + 65041 tgtcgctagg caagtcggtg ccggcgatcg tctggtaggc gctcaccgac gctgtcgcac + 65101 ccatcggcag cttctgggag acggggttgt tgcggtcgtc ccagccgtag gtggtggtgt + 65161 tgccgccggt gccgtccgtg ccggtgccca tcgcgtcgat cgcggtctgg gtgaggtggt + 65221 tcttgtaggt ggcgtggcgg gagtggccga gggggtcggt gaccttggtg acctcgccgt + 
65281 cagcgttgtg cgtgtagatc gtttcgtcac cgtcggggtc ggtgaccgtc gtcgtacccg + 65341 cgtccgaggg ggtggccgcg gtgtagtcgt agcgccaggt cggcccggtg tggccgctgc + 65401 ccgaggtgcc ggtggcgcgt tgcatggagg tgacgcggtt gtggctgtcg taggtgaaga + 65461 gggtgacggt gccttcgggg gtggtcacct tcgtcaggcg gcgtgaggag tcgtactcgt + 65521 aggcggtggc cttgccggtg gtgtcggtga ccttggcgag gtttccggcc gcgtcgaggt + 65581 cgaggacggc ggtgcggccg gtgtggtcct tggcctgcca ctggctcgcg tccgtcttga + 65641 ccaggtcgat ccagcggccg gagcgggtct cggtgagctt gaagcccttg tgctcggcgc + 65701 cttcgtcgtg ctggtcgacg gtgatcgtgc ccttgttctt gtccgtgacc ttggtgagcg + 65761 tgccgtgctc gttgtaggtg tccttggtgc cggacttgcg gtcggtgagg gtgtaggtgc + 65821 cgtccgcgtt cttcttcaga tccttcgagt agcccgtcgg cgtcgtgtac gtgccgtccg + 65881 cgttagcggt gaagcgcagc aggctgccgg tggtatcgaa gacgtccacc tcgccgtcgt + 65941 tgatctgcag gtagcgttcg taggcctgcc accagcgctg cgacaccttc ccccacggtg + 66001 cctcgaggga gttgtaggtg cgggtcagct gaagtttctg gccgacgccg gcgatgtcga + 66061 agtcggtcgc ggcgagcatc aggttgccgt tggagacgtt cacccgcgcg accagtgcgt + 66121 cattcaggcg ggtgtcgagg atctggtgcc agggcacctc tccctggccc tcgggcacgt + 66181 agccggccac cgcagcatcc acggcagccg agcgagatgc ggacgtcttg gcgcgctctg + 66241 caccggcagc gcgggccttc tgcgccgccc gccaggccgc gacctcggcc gacggcttgg + 66301 cctccgcctc cgaggtgggc gccttgaccg tgccggccgg tgtcgccggc gcctccacct + 66361 tggtcggctt cgtccacgga ctctccggct ccggcaactc cggtttcggc gtcgccgcca + 66421 gaccgggagc cgccgcgatc accacggcag ccgcggtgat cgccgagacg agagcggttc + 66481 tgtgtgttct ccggtcacgc cacatgggcg tgcgcgcagc acgcgagtgc atcagcttcc + 66541 ccccacagga agtcagaccc ggcaacccca gcggtcgcca gcggcacaca agctgtcaca + 66601 agacgcacac aaatcggcgc ggcatccccc cgacgtacag atgcatgcgg gccggaacca + 66661 gccctaccgc ttcaccccga caaaccagga cgctacccct gtaaacccgc atacagcggg + 66721 cggagttgtc ggttccgtta tcgttttcgg agggcagctt gactggaatt gtttgatcca + 66781 gggcgtcttc cggtccgcta cggtttccga ccgccgtctt tcggccagtt tcagaccttt + 66841 ccgggggcct gtcgcgcagg ctgagcaggg tgttctcgct ggccatgacg gcgaacaggt + 
66901 gatcggagaa gttgtctcag aggacggggg gcacggcagg tgccgctgcg cacccggttt + 66961 cgccgaatgc acacttggcc cgtcctgcat gcgtggtccc ccagcccgcg gcaaccaccc + 67021 ctgtcgtgaa ggacgcccct gcgatgagca caccgggcag acacacgccc tgctcccgtt + 67081 ccagccgcca ccacgttccc gcccagcggc tcacgcgctt cgtgcaacag gccggccgcc + 67141 tgctgtgctg gagcctcacc gccggcatga ccaccgccgc cctcgacctc ctcatcacac + 67201 ccgaagcagc ctggtggcac atgatgtggc ccctgccctg gtacctcacc tgcctctccg + 67261 cccctctctg ggccaccctc cgcgcccacg aaaaggccgc gcaccaacaa gcgcctgagg + 67321 aagacaacga catcccctgc gagtgggaac aagccgcctg actcgacgac accggcggat + 67381 ccggctggcg gggtaaccga gcatggcggc ggcctgtgac gccgtagccg cgtgctgctc + 67441 catgacgccg gccgtccgct gcgcgcgcag ggccttcagt gccgcctggg cggtgttgcg + 67501 atgtacgccg aagcggtcgg tgagggcggg ggcggcgtcc aggagctgcg cgacgcgcgc + 67561 gggcagctgg tcgcggggga cttggtcccc ggcgccagtg ggccggccgt ccccgccgtt + 67621 ggtgcggcgg cgtccggggt atagtcccag acgatgtggc ggggccagtg ctcgaccccg + 67681 cccacgcgca ccaggtgctc gctgacgacc gcttccttgc tgcgccggtc aaccggccat + 67741 agctgccatg atcagcacac cagttgcacc gcacagcagc accacaagcg gccatgccag + 67801 acagccgcgt ccggtacgcc tgcgccacag caccagccac agcgcacacg ccgccacgaa + 67861 caccaccgtc acaccgctca tctcgcccgc ccgccacgcc acctgcatgg cgccagggtc + 67921 agcgccccat acgaggagcg caacgagcac gcatcgtcag cgcacacacc gcttccagca + 67981 gcctgctcat catcgttcta ctcccgagtt ccttccgtcc ctgcgcgggc ggaacggacg + 68041 gcacggcctc gatgatctcc gtctcgcggc cttccgcgtc cgtgctcacg gaccgtttct + 68101 cccctgcccg aggaccaaac atgggtgcct cggactccga gaactcgacc cgcgtcttga + 68161 ccatcagggt cttgccgttt gcctctttga cgaccttgcc gtccggcccc atcagcggcg + 68221 tctcttcagg catcttggac tcgtccaccg tgccatcagg atttacccac tccggggtgg + 68281 gacgtccccc atcagagcgg gcccagcgtc agaaacagct gctcgccttc aacgacgtca + 68341 ccgtcgagat ccgatcctcg aactctcaag aaccgtccca gagccccaga cgtgtgagcc + 68401 gacgctgccg cagccgctct ccagccgctg tcagagcgaa gaggagccac acactcagcc + 68461 cggccagcgc tgctaccaca gggccatcag attcctcctc agacgacaca atcaggaaga + 
68521 agaatgcaaa ggacacagcc atgcagaggc cggcgccgac cgggtgccgg gccacccact + 68581 tctgaatccg agtcgggcgc ctctgcccac caagcgcccg gtccaccgcc caaaacgcat + 68641 tacccagaga ccgccaccag ctcgtcactg ctgaaggata cgacagccag tcgggcacgc + 68701 cgatagaagg ctcgggcccg agctggttga gagacaactc agccttccca aggtgcgact + 68761 gggccagctg tccgggcgct tgaatccttg cgtgccgata gcaggaaaag gaccgcagcg + 68821 gcggcggcga acccgaagcc gacgctgctg caggccatga ccgtctcgaa tggagcgtcg + 68881 gcgatccggg ggatgccgtt gacgagcatg agggcgtaga tgcacaaaat ggcgtaggcg + 68941 cgaagccgca tcccggcttg tcgcttgcgc atccacggcg gcgtccaccc cgccagtatc + 69001 gccaccggca tcggcagcat gagcgttgtg gacactgcca gcgctatcca gtggtacagc + 69061 ggatttccgt tcatcccgac cccttcgtag gcgatcacca gcctacggag ggttggcgag + 69121 gcccgcccca cgccgaacac tacgagcttc cggcgggtgg cggcaccgga gcaggtgtct + 69181 caggagttcg ccgcgaccgt agtggactgg atcggatgca tctgacctcc ggcgtcccag + 69241 cctccgttct ctcagaggta agcccaggcg acaggcccgg gacgggacac aaacccaccc + 69301 gctcaaatgc ccgctggacg acacctgcgg ggcttctcgt cgaacgccgc tgtcacggac + 69361 gccctaatag ctcgggggtg cggggaagcg gtcagtctga ccaggtcgaa gacctcgcag + 69421 gtggcgttcc gcttcaggcc atatcgttcg tgaggctggg tggggcccca gacaggtcgt + 69481 cggctcgtgg ttcggggatc cacccgacag agcccgccca attgcctggc gggccacgtt + 69541 gcccctcatg gctgcgattg caaacccaac gtccccgaga gaacagcgcc gaagacaacc + 69601 cgcatgacga gtcgaacgcg tcgcgcgtgc gcgcacagtc atcttcacag cgatgcttca + 69661 ccagagcatc ccggtgaagc atcgtctcat ggctccgggc agaggcccgc caagggtgct + 69721 cctcggcggg gcctcgatct atcaccggcg ctgtcacgcg tctgtcacca actacgccga + 69781 cgccaccgga ccgcaaggcc ctcacctgct aaacgcacac accatggact ggcgtggacg + 69841 cccatagacg gtctctacaa cctgtgccat gtagtgcgcg ccaccgagca gccaggcgtc + 69901 gttcacgagg atcgtccact tgctggagtc caggacctgc cctaccccac gctcggtggc + 69961 ctcgctcatg gttctgaagt tcttgatcac ttcggcgtcg atgccgggga tcctctccgg + 70021 ggcgatcact tcgtcctggt ccagccggtt cccggcgatc agtcccttgc ccttgtggct + 70081 ttccatggcc cactgggcgg ccttgtagac gttgaaagcc acgcgtacgc gctcttcgga + 
70141 gaaggaggtt tccaggccct ttttatcctc ttctctggcc gagttgatgt acagagggcg + 70201 ggcttcggcc gccgcccgct tgaattcatc tcagttctgc tacatttccg gtttcctctc + 70261 gtgagcgcat tactgggttc cgttgccttc ccggcggaca accgtcggca tgccgacatc + 70321 gcccgcacgt acgtggcgag cgtccgtccc cggccgggcg gcggcgagat cgtcctcaag + 70381 ctcggtgact cgttgctgaa gccgggagtt cttgatgctt gggctccgtc cgggcagtag + 70441 aaacagctaa cacgaggcgg ctcgtcatgt cccatcgcct gcggtacaac ggggcgtgct + 70501 cgcggcagaa ggccatggga cgggcagaga tgggacgggc agagatacgg gggtggttta + 70561 tgaacagaca ggaccgagcg aatgcggtgg accgggagat gtctgcgcga ctgatgccag + 70621 atgcggctct cgaggctctg gggggttggt ggggccagaa cgccgtacgg ctcacggacg + 70681 ggacgcccgg cgcccacacg gtccgctaca cacccagccg gtgggcgcac atcactacgt + 70741 ggccctcgat gatggcatcg accttccagg cgggtgacgc cgacgtcagc cggacacagg + 70801 tggcctccat cgtcgcggac gcgctggagc gcggagcctg tgaggaggcg ctggttgcta + 70861 cctatgtgtg gggaaagggc aaaggcggct ccccggccgg aagcggacct gccacgttgc + 70921 acaagattct gctgggcaca gagggcctga acgcgatact cgccagcgtc gtcaatacgc + 70981 tgagggagca ggacgccgaa gcagcctacg cggaactgcg gggtcgcatc gccgggttcg + 71041 gcccgtcgtt ttactccaag ttcctgtact tcgccggtaa atcggtccgg gcggcgtccg + 71101 gcacccagcc gctcatcctt gatcaggtcc tggcccggcg catgcggtcg ctggcccagg + 71161 cggtgggtcg ggagaccggc tacgaccctg acggctcgat cgccaggtgg gtctggcggg + 71221 acacaaactg gtcaccgcac cgctacgcga tctacctctc cttcatgcag gcggcttccc + 71281 gtcaggtagc agcaactcat tcctggccct ccaatgcgac gcccgacctg ctcgagtacg + 71341 cgctgttcac gacctcgtgg gtcgagagcg ccgaggccac atgaaaccga gggacgaccc + 71401 cggcagtccc ggccgccagg gataggacct gggacaggtg gtcgatccaa ggtggttcgc + 71461 gagcgtctgc gccgcaggcc cccacgacgt ctgcgcaccg gcctgggccg accgctgacc + 71521 agacaacgca tgaacagaca cggcccagga ggacacgcgc ctcacacggg aagagtgctt + 71581 gggacaactg actagctcca ctcagatcgg ggctggctgt cgcgctcagc atgggaaggg + 71641 gcttctggac ctcggtctga cggtcctgtt gctggggctc gagacggcgt ccctggctgc + 71701 gttcctgttc gtctaaggtt ctacaagcgt gggctgcaca aggaggaccg gttccggtgg + 
71761 gaagcctcgc ctcccctccg ccctgaacgg cgcagcggcg tcgtcggcct cgatcgtgtc + 71821 ccggatcagc cgcagcggaa cctcggagac cagcgcgcct tcggctcgtc gccgccgtcg + 71881 accctccgga tccgctggtt caccgactcc gcgaggtcgg cgaggcgggc ccgacactgg + 71941 tcgggcggca tggaactact cccacaaacg cggtacggct cataggcccg gaccgcgacc + 72001 tgccccgacc tggagctgcc cttggcgagc gcagggacga cggttctgcc cgttgcgcgg + 72061 cctcgcctcc caggacgacg ggccgaccca gccgatgttc ccgccgggga cacggcaccg + 72121 tcccgtgcag tgccaggtcg gacgacgacc gcgagcggta agacacgctt gacgtgatgc + 72181 ggtgcccggg agccggactg ctcccccggg tctccgtgat ccggatcaag gagttcacgt + 72241 gagcggcccc ttgatcgcaa ccgaatgggc tctctaggag gagatggtct cttcgccggc + 72301 tgccatggcg gtcgcgaccg ggtctggacc gtggcgcccg tcgaactcct cgtaggcacg + 72361 ctcgatctct cggtgcacat gtgccgcgaa gggtccccac tcgcggtggg tgacgaccat + 72421 gaattgtccc tgctgcatgg cctcgaccac ctgctcgccg acccggccgg ggtcagctcc + 72481 ctggaggagc agcgcgctgt tcttctcgac gacggcggcg tccatctcgc ggccgagcag + 72541 cttcgcctcg gcggcgccgg cgttgaagtt gatcggggtg gcgaccgcgc cggggacgag + 72601 cagtgaaacg ccgacgtgcg tgcccgcgag ctcctcgcgg agcgccatcg acagccccac + 72661 gcttgcgaat ttcgaggagg tgtaagcggc cactcccgcc atgggtatca ggccggagat + 72721 cgaagaggtg ttcacgatgt ggctacggcc gccgcgactc ttgaaccgcg gcaggaacgc + 72781 tgccacagag gcgaactgcg cgtcgacgtt gacgccgtgg acccagcgcc acacctgaag + 72841 cggcgtgcgg tcgaccgttg tgccgccgtt cacgccggcg acattgcaca ggatcgagat + 72901 cggtccgagc gcttcctcgg cgcggtcggc catgctctcc caccggtcgg tctcactgat + 72961 gtcgaagggc agggccaaga ccgtgccgcc ggcgtcccgc agggactgct cggctcctgc + 73021 cagccgtgct tcgtcgatgt cgaccagcgc gaccttcgca ccggcggcga cgagcgcgtg + 73081 ggcgaccccg aagccgattc cggatgccgc gccggtgaca agtgctgctt cgcctgtcgg + 73141 ccagttcatt atcgtctccg cttcgtcgag ggacggttga atgggacgac gccccggttg + 73201 cccgaagtca cgcgtgggca ggccgaatcg tcagtcggga aacgcgtggt gaataccagt + 73261 gccacgctag tgaccgccga tcgcatgatc gcccgccgac tgtggcgcgc tcgagcccag + 73321 tcccccgccg actggcgggg gacgctggtg ccggttcggc cctctgtccc gtgtggccgg + 
73381 accgactacg tgttccaggg gctcccgggg cgtgtcgggg ggacggggtc ggtgaggcgc + 73441 agcagcaggg cggcggcgat gtagcgcatc ctgccgacgt tgctgcgcgg gtcgtagccc + 73501 agggtgtggg tcagtgcttc atggcgggcc tgcacggtgg agtggtgcat gcccagttcg + 73561 gccgccgcgg agcggacgct gtcggcctcc accagcgtgc ggagcacgtc cgcggagcgc + 73621 cggtcgaggc gggcgagggc gcggacgtcc tcgtgcgggt gctccgggtc gtaggtctgg + 73681 gccagcagga gcatcgctcc caggtccgcc gcgtcgacgg ccggtgtgga ggcgtccgtc + 73741 agtcggagcg ccacgatcgc cgcctcccag gattcggggg cccggtcggc tcgtaccggg + 73801 ttccgaaccc gactggttcc ggcgggcggc ggatggtgcc cgagagatcg agggtggctc + 73861 tcagaagtcc gtaccgggtc ggcacgatcg cggagggggc ttcgctgatc tcgggggcgt + 73921 ccgcggcggt ggccaggaca cgcaccggtg tcgccgggtc gatccggcgc ttggcgagga + 73981 gcgcggtgcg ttcggcgacg gagcgggcct gatcgacgat ggcgtcgagg ccgcgctcgg + 74041 gactgcggcg cgcgtcaagg agttccactc ccagcgcgag ccgctccacg atcatctcgt + 74101 cggcgggctc cggctccccg tcccgctcga gccacaccgt ccagtcggcg tgggacctgc + 74161 gggagctgtg gcgccggcgg tcggcgtcgt cggtgaccgg gtgtccgtcc gggtcacgcc + 74221 gggtcacgcg ccctcggatc ttcgcgccgg cgacggtgcc ggagaggacc gcggcaccgc + 74281 gcaggagtcc gtcgagtccg gcgccccgcg tgatgaggac atcgaagtac gacacgatcc + 74341 gaagcgtttc gcccgcctgc gggtcgagtg agttcagtcg tccgaccagc tggtgcatct + 74401 gtactccttc gcaccattcc ctcagcttac cgaggaccgg ggacgtcgcc tcaggacccg + 74461 aggaggcggg cgacccaggc gttacgggcg gcggtcatgg cgtgcgccag agcggtgtgg + 74521 ggtgcggtca ggccgaaccc gtggaagcca ccgggccaga tgtggagttc ggcctgtacg + 74581 cccgcgtgcc acagggccgt cgcgtaagcg acgtcctcgt cccggaacac ctcggccgag + 74641 ccgcagtcga tgaacgcggg tggcagtccc gtgagatcgg tggcgcgtgc gggagcgcgt + 74701 aggccgatac gtcgtcggtt ccgcgcctct ctcccagcag cgcggtccag cccatgacgt + 74761 tgctcccgcg gtcccatacg ccgacagcgt cgaactgggc cgaggagacc gtccggtccc + 74821 ggtcgtcgag catcgggtac atgaggacct ggccgatcaa ggccgggcct tgccggtcgc + 74881 gggccatcag tgcgacgccg gcggcgagac cgcccccggc gctctgtccg gcgatgatca + 74941 gcctgtcggg gtccattccg agctctcggg cgtgctcggc cgtccacagc agacccgcat + 
75001 agcagtcctc gaccggatag ggatcggggt gctcgggtgc gagccggtag tcgacggtga + 75061 ccaaaacggc gtcgtgctcg atcacccacg ggagggcctg gaccaggccg gagaactgat + 75121 caccggagac catgccgccg ccgtgcgtgt ggtagatccc cggcccgagc ccctgatgat + 75181 cctcccgggc gatcacagag acggtgattt cgtcgcccag gtaccccggg atcgtgacgt + 75241 cgcgtcgggt cagaccggag atcgcgagca tctcgtcggt gacctctgcc ggtgccgccc + 75301 ggcgcatgtc ggggatcatg tccgcggtca gggtcggcgg gatctggtcc gcgagggccg + 75361 cgagtacggc ctcgagctcc gggtcgaacg gggggcgcgg aacgctgctg gacatgggaa + 75421 ctcctggttc ttccgcaccg catggttgcg gtgtacatca atcgtgctgg gtgggccgcc + 75481 tcgtgccgaa ccgccgaacg ccgcagtctc ggaccgtgtc ctccgccgct cgcgcgtctt + 75541 gtccgtaccg ggcgggcaca gcccggtacg gacaagacgc gcgagccgtc cgtaccggag + 75601 tgttcaggag cctcagccca ggcacagaag ggtcttcccg ccgatgccgt ggcgcagcga + 75661 gtggagggcg tcgacaaggc tctccagcgg cagttcccgc acccagccgg tggtgtgtag + 75721 aacccgtcgg ccatggccgc gatgacctcg tcgaactcct cgggccggta gccgaccgcg + 75781 cccacgatct cggtctcgcc catcatgagc cgggtgggct ggaagtccat ggtgtgttcg + 75841 tgcagtgcgg cgaccaccag gcggccgccg gggaccaggc ccgccatggc ggaggtgacc + 75901 gcagcgcccg cgccggcggc gtccaccgcg gcgtccactc cgtcaccgtc ggtgagcgag + 75961 gcgacggcgt ccgcgagatc ctcgttcacg gggtcgatga cacgggcgcc cagcgcggcc + 76021 atgatcgcgc ggcggtcctc actcggctcg gacaccagca ccttctccac cccgcgggcc + 76081 ttgaaggcga accaggtacc gattccgatc ggtccggccc ctgccacaag tgcgctgccg + 76141 cccggtcgca caccgctgcg cgcgacagcg tgccagccca ccgccatggg ctcgacgagc + 76201 gcgcccatcc tcaggtcgac cccgtccggc agtacgtgca ccttcgacgc ctcgcacacg + 76261 gtgaactccg acagaccgcc gccctccacg ttcgacccga gcgagcccat cagcggacat + 76321 gagaagggca gcccccgacg gcaggccgcg cacttaccgc aggagaccgc cagagggaag + 76381 acggcacagc ggtcgccgac ccgcacgtcc gtcacgccct cgccggtctc gacgacagtg + 76441 ccggagaact cgtgaccgag gatctgcggc agggtggccc cggtgagggg gtgcggctcg + 76501 tccagggaga acggcagcga ctcggggtag aagaagaagt ggaggtcgga gccacagatg + 76561 ccggcgaacg cgttgcgcag cttcacctgc cccgggccgg gactgggctc cgccgcctct + 
76621 tcgatgcgga tgtcttccct gccgtagaac cgtgctgcct tcatgtttct ccttcgtttc + 76681 cctgttccgt ggccaccggt gaccggtggc cgttcctgtc ggcgcggacc gtctcgtcgt + 76741 gcgccgccag gtgtgccgac cccacgctca gtccggtcca ggactgctga ggcgacggcc + 76801 ctgcttaccg cccgctcgtg cccggagacg gtgcgtcgag agtgcgggcg actcatccgt + 76861 tccgggccgc gatcgctgcc cgtgcgatgg cggagtccgg cgcgagcatg tcgaatccgt + 76921 ggtagccgcc gggccataca tgcagctcgg cctgcacgcc ggagttccat aagagcgttc + 76981 gcgtaggcgg cgtcctcgtc ccggaacacc tcggccgagc cgcagtcgat gaacgcgggc + 77041 ggcagtccct caaggtcgct cgcgcgagcg ggcgcggcgt agaccgacac ctcgtcggtg + 77101 ccacaccggt cgcccagcaa cgccgcccat cccgtccggt tgctctcccg gacccatctg + 77161 ccggcgtcct cgtactgggg gctggagacg gtgcggtccc ggtcgccgag catcgggcag + 77221 atcaggacct gcccgatgag cgcgggtccc ttgcggtcgc gggccaggag tgccgtgccc + 77281 gcggcgagcc cgcctccggc gctggcgccg gcgatgatca ggcggccggg gtcgatgccg + 77341 agttcggcgg cgtgttctgc ggtccacaca aggcccgcat agcagtcctc gaccggacag + 77401 gggtccggga actcgggcgc gagccggtat tccacggtca cggccacggc gtcgtgctcg + 77461 acgatccagg ggaggatctg gctcaccccg atcacgcgct cgccggcgat catccctccc + 77521 ccgtggatgt ggtagatgcc cggacccgtg ccggtgtgac cggagcgggc gatcacgctg + 77581 gccacgagct cggcgccgtg gtggccagga acggtcacat cccggcgcgt gaccccggcg + 77641 gcgagcaggg tcttgtcgga gacgacgggc agagcagctt gccgtagaac cgggatcgcc + 77701 ccgggtgtga cggccggcat cggttcggcc agggcggtca gggctgcctc ggcttcgggg + 77761 tggaagggcg ggcgcgggtg cgtgggcatc aggctccctc ggtatctgtc aggtgcccat + 77821 ccgggtgggc tcctgtcatg gtccggcggg agaacaggcc gacggcaccg ccgcacaggg + 77881 cagatgtcgg gcagttgccc cgccatccgc gcgccgtatg cccgtgggga gccgcgggca + 77941 gaggcagcgg cctccgcgcg aagcgcgtga acggcgggtc gagcggtggg catccgccgc + 78001 gaacggggtg ccgtcaggca acgccccggt ccaccgtggg tgtagtccgc tgcgaacccg + 78061 agcggcggta cacaagcgag cggagaagca gaatcgggtc ggcgggggaa gcggccttcg + 78121 tcaccggcgc ggcatcggga atcggcctgg ccgtcagccg ggcactcgtc accacggggg + 78181 cggaggtggc gctcgccgac atcgatgagg agcggctcga cgacgacgcg aagaagccgg + 
78241 ccggtgccgg cggcaccgca atggccgtac cgctcgacgt gagcgacgct gacagctcgg + 78301 cagccgcggc cgaccgcgcc gaggaggcac tgggaccgat ctcgatcctg cgcagcaacc + 78361 cagcagctcc cacaagcagg tcagagcccg catcgagcac cttcgcccgt atgaagggga + 78421 tcctccgcga cttccgtctc aagggcaaca gcgcgcacta cgcaatgctc agcatcgccc + 78481 gcctgcacaa cctcgccctc acaggtgaac gaacactccg caccgcaggc cacctcaccc + 78541 gcgtccattg ggagatcatt tccgggacag ccctttagtc gcggctggcg accatcaggt + 78601 acccatcgct ctcggggtcg aaagtggtcg actccaccct gagcccgacg ctccgcaact + 78661 gcaccacgag gtcctcgtac cggtagggcc agatggacaa ccgctccgag caggctcgca + 78721 ctgccccatc gggctcgatc tgggcgacga cgatctcgag gaagtgttcc tgctcccagc + 78781 gctgctcgat ctgccagtag tagctgacga ccgcatcgcg gtcgttgcgg cggacgagtc + 78841 ggtcgcggac gtctacccgt gagccggcgg agcgcacgag ctcccagttg cgtgagtgga + 78901 gcaccaggcg tccgcccggt ttcagcagcc gtgacatcgc tgccagcgcg gccaggcgcc + 78961 cggctgcgcc ctcggcgtgc ccgagtgaat tgccgacgca gaacaccaga tcgaacgtgg + 79021 agtcctccag gtggtcgggc agctcgtccc atctcgcgtg gagggctcga agcgagacac + 79081 cctgctcgtc ggcggccttc tcggtccggc gaaccatccc atcactggcg tctgcggcga + 79141 ccacgtcgag gccgagactc gcgagaccga cggcgagctg gccggttcca cacgcgcagt + 79201 cgaggacgcg tgcgctgggc ggcacagagc ccacgacatc gctgtagtag accgcggctg + 79261 ccttggcggg ggtcaacctg tcgtccccga tcagccactc gtacacctcg gaaagcgccc + 79321 catacccagc caccgcgaca acctccacca ctcgacgacg cgcgggctgg accacccggc + 79381 gattcggacc ttgcgcctcg cactgtcccg ggccgtgtca gcgaagcatc ggccaggacc + 79441 caaccacgtt tagccgctga gactccaccg gatttcgtgg gaaaccgcga cacgacgcac + 79501 cgatgcgatt gccctctcac cggtacccat cagtcaccgc ggggaccacg gtcggcaacg + 79561 atgttggaaa agccgaacaa tgcacggatc gcagccctcg catcagcctg gggcaagtcc + 79621 gcctccgtga cggtggcgtc aggcgcgatc ttcagcgctc cagtcttctc ggagcgggac + 79681 cagtccggga aaaccactct agctgccctg acctgcgccc tgtccggtgg cagtctgcgg + 79741 cgcactcgcc ggagcggtgt gcggcgcggc gtgatcggct gacttcgtga ccgagagccg + 79801 acaccgtttg tcaccgagtt tgggcagcgc ttgtcgatcg cagagccgga aaacgttggt + 
79861 gagaactgac accggcgcga gatgagtgaa cctgtctcgc ggcgctgcgc ggctcttact + 79921 aaaggggccc gtcacatagg gagggagaac agccgtactg gccctgaggg ccaccgggca + 79981 tcgtcgagca ggggcgtcac catggtccgc agcggcatgg tcacgaggcg gccttcgggt + 80041 tgttcgacga gtacgtcctt gtcgagcggg tgccatccga ggcgctggta gagcgacacg + 80101 agaggaggcc ggcagaagag gagtgcgtgt tgaggaccca tcgttcgggc gtgctccagg + 80161 gcagctgtga cgacgaggcg agcgaagccc tgaccttgca tggcgggtga gacggccacc + 80221 ccgccgacgc ccaccacctc tgtctcggcg tcgctgatcg caacaggcag tcgcagcagg + 80281 ccggcgtgtg ccacgaggcg gccgtggtgc cggatgccga agtgctcttc tttcggcagc + 80341 caggtcagac cggtccaggc gacaccgaag ggatcatcgc tgttgccaag gatctcctcc + 80401 tggtccgcct tcgtgtactg ggcgagccgc accacagtcg gtgccacagt ggactggttc + 80461 tcagacatac ccacatgatg atctctccgc cgaccactgg ccagagtgcc gtgcccgcga + 80521 tggctcaccg ggttcgctgg ccgctgtgac cgctggactg gttggattac ggctgatcca + 80581 ggcgcacgca gggcggctgt tcaccgacca cggctacgac gcggtgacgg tggccgacgt + 80641 ggccaaggct gccggcgtct cctcaatgac cgtgtaccga aacttcccca ccaaagggga + 80701 cctcgtcctc attgaccagc ccgcccagct catcgccgag cacgttgccg cgtcgtccgc + 80761 aacgcaaccc ctggtgcgcc gcatcggcag cgccctcatc gacgcggcca ccgcctcgac + 80821 cagcggcaac ggggacgaac aggcagcgga cgaacggttc ctgctggact gcctccggct + 80881 tatggtctca acgcctgcgc tgcggccccg gcatctcgac agccagtacg cgctccaaca + 80941 agccatcgtc gaagcgctcg gaaaggacgc ggccgatccc gacgccgcgt tccgtgccga + 81001 ggcccgcgaa cggcatcggt aggtctctct cgccacggag acgcccctgg gtcgtaggct + 81061 gcgggcatga ggcgggggga gacggaaaat cacagcgggc gtcgacggct cacatggtcg + 81121 aacgtcgagt ggaatcgggc ggctgcgctg tgcacggggc aactgccgct ggtgtggttg + 81181 gcatggtggt tcgtcatgga ggcgggccac gacgactacg accaaggcgg cggcgccttc + 81241 ctcggcatct tctgcgtgat gctgatcctg ccgctcctcg gcctcctgca cgcgaccgca + 81301 cagatcatgc ccgccgcgac cctggcccgc atgcggcctc gtgccgtccg aggcccggag + 81361 tgggcctggc atctgggcgg atccgtgctg atcggcaccg ggtggtcggc gcttgggtat + 81421 gccttgtggg gttggccagt agccgacgcc ctcccgtggt tcgccggcgt cggcgccctg + 
81481 ccggtgctgc tcctcgcccg cctgcgcgga cgcccgtggg gtccgagggg cagctcgccg + 81541 ggaactggcg cggtgcggac gggagtgtgc tgcagctggc cccgggcggc caggccgagc + 81601 ttacccgcgt gccggcccac aacgacgtgg atgaagacgg tgacttctcc ctgtgcgacg + 81661 ggaccggcac gtggacccgc gaagagggga atgactttca gaacaccgac cgcgacggtg + 81721 tcctcgtaca cctcgacgac gagtgcggcc aggagacgta ctggacgatc ggcggcaccg + 81781 aactgaaacc ggaactgttc gtactgttcg gcgacccgga caccggggaa ctgcgcattc + 81841 tgacccagcc ttgaacacct cccggccgtc ccttccaacg ccgcgacgct cattcccaca + 81901 accaccgagg gaacgccacg gcagaaggac gacgccatcg aagcggccca gcgagccctc + 81961 accgttacca cccgctacca cgacgaacac gtggttaccc acgccgctcg cggacacctg + 82021 cacagactgg ccgccgacct tcgctccttg gacacggcag ggcgcgctct tcgcgaaggc + 82081 atctgggaca tctacggtgc acgccgcgct cagcacgccc ctgcgaagtg ccctggaacg + 82141 gctacggcga gcagcgggcc atggccgacc ttaccccccg tcatcaccga gggcgaagcg + 82201 cgcatcgaca gtcggcacag gtagtcgtct gcccgggcgc cgcgccggcg gtgggcgtcg + 82261 aggatcgcgc ggtgcagggc gaggcggtcg ccggggtggg cgggctcggg gttgtggagc + 82321 aggaccaggt ccagccggtc acgcccgagc tgctcgtggt tgtgcgggtg ggggggtcag + 82381 gaccagggcg atgaggggct gcgcctggcc ggtggcgcag ttgggggcag tgtcgctcca + 82441 ctgcgcgccg gaggcggcag catgagcagc cgcctccggg atcgcccggc accggttttg + 82501 gcccggcgcg ggctccgctg ttacggccgc ttcccaccgt cgcagctgcc cggtaaccgt + 82561 ggggacggtc aggctgtcgg cgcgaatgcg gtgatggcgt cgacgaggtt ggcgggggct + 82621 tccagcggga tcaggtgacc ggtgtggggg atcaccacga agtcggcgtg ggagaggtag + 82681 ggcaccaggt tgtcgcggag cacgccgacg ggctccacct ggtcgtgttc tccggcgacg + 82741 acgagaacgg gcacactgac cgtgcgcgtg tgttcggtga tgtcctgcgt gatgccgtgc + 82801 agtggccact ccgttcgggc ggcgtcggtg acggtccgcg agtcggtcac gatctgcgcc + 82861 ttgaccggct cgggcagctc ggtcgcggtg aggacgtgat cccgtgcccc ggccacggat + 82921 tcggcacagt cgtaggcgtg cgacagggct tgctggtact cgggagtgac ctgtgcggca + 82981 ggccttgccg gggcggagcc gacgaggacc atgccccgga ggccggcggg ccgggcggcc + 83041 gcgaccagct gtgcgacctt gccgcccatc gaatgcccca ccaggatgta gtcggtgatc + 
83101 cccgcgtccg cgagcacggc gagtgtgtcg tcggcgaact gtccgagcgt gtaaggaccg + 83161 ggcagggcgc tcgaccggct ccacccgcgg aagtcgaccg tgagcacgtc acggcccgac + 83221 aggcggtcga cgacgaggtc ccaggtgcgg gcggaaccgc cccagtagtg caggaacacc + 83281 agagtgggtc cggtccccgg ccggtggtcg taagtgggca gtagcgtctg ctgcgtcgtt + 83341 tccatgatga ctcttccggt cgatgctccg ggcggtagcc ccgtgcattc attgaaactt + 83401 ctgcacccgg ccgggtcatt ggagtgactg gtcgcccgat agtgaaaact ggacacgtga + 83461 gcgtgatccg gcagatgacc taccagcccg cgggacgccc cgccacctcg gtcgaggtga + 83521 tgacgttcgg ccgccttcgc gagctgaacg acggcggcac gcagcgcgcc gacttccacg + 83581 tccttgccgt cgtcgacgcc ggcccaggat cggtcaccgt cgacttccgc cactacccgc + 83641 tccaagaccg gtccgcggtg tggattccgc ccggcgcggt gcaccggtgg gacgacatcg + 83701 ccgacgtggc agggcacctc gttctgttcg tgccgaccgc gcctgtcacc cacgccactc + 83761 gagaactggc cgcctcccct gacccggccg cgcactgggg catccccgac gccgactggc + 83821 ccttcgtcga caccgcgcgc agccatctcc tcttcgaagc atccgcccca cccagtgagt + 83881 cccggacaga gctgcccgag atcctgcttt ccgcgctcat cacccggctg cacccgccgc + 83941 acgccgaagc actcacccct caggtgttcc ggttgttccg ctccagcgtc gaagcgcact + 84001 tccggcggca ccacgacgcc gactactacg cccgtgcgct gggatacgcg ccccgcaccc + 84061 tctcacgagc ggtgcagcag gccaccggcc gcaccgcgaa ggcgtacatc gtcgaacgga + 84121 tcgtcctgga ggccaaacga ctcctggcac acgaccgcct caccgccgcc cgctgcgccg + 84181 acgtactcgg attccctgac gcatccaact tctcggcgtt cttccggagg gcgacaggca + 84241 tgcgcccggg cgcgtggcag gcgatgatgg ccgccgagtg a +// From 3ac3e91c4fd721e93444ca2dcf20ed5b4b0aa8ea Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Tue, 16 Jul 2024 12:42:16 +0200 Subject: [PATCH 33/55] add real data tests --- tests/unit/genomics/test_runbigscape.py | 20 ++++++++++++++++++++ 1 file changed, 20 insertions(+) diff --git a/tests/unit/genomics/test_runbigscape.py b/tests/unit/genomics/test_runbigscape.py index 8fefa1c78..3882928b5 100644 --- a/tests/unit/genomics/test_runbigscape.py +++ b/tests/unit/genomics/test_runbigscape.py @@ -24,6 +24,26 @@ def 
test_run_bigscape_v2(self, tmp_path): assert result is True + def test_run_bigscape_small_dataset_v1(self, tmp_path): + result = bigscape.run_bigscape( + antismash_path=DATA_DIR / "bigscape/minimal_dataset", + output_path=tmp_path, + extra_params="", + version=1, + ) + + assert result is True + + def test_run_bigscape_small_dataset_v2(self, tmp_path): + result = bigscape.run_bigscape( + antismash_path=DATA_DIR / "bigscape/minimal_dataset", + output_path=tmp_path, + extra_params="", + version=2, + ) + + assert result is True + def test_run_bigscape_wrong_version(self, tmp_path): with pytest.raises(ValueError) as e: bigscape.run_bigscape( From 0db25d8b60939a240744cb56fdaa530c272a57d4 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Tue, 16 Jul 2024 12:54:54 +0200 Subject: [PATCH 34/55] remove class --- tests/unit/genomics/test_runbigscape.py | 113 +++++++++++++----------- 1 file changed, 59 insertions(+), 54 deletions(-) diff --git a/tests/unit/genomics/test_runbigscape.py b/tests/unit/genomics/test_runbigscape.py index 3882928b5..30833dc97 100644 --- a/tests/unit/genomics/test_runbigscape.py +++ b/tests/unit/genomics/test_runbigscape.py @@ -3,76 +3,81 @@ from .. 
import DATA_DIR -class TestRunBigscape: - def test_run_bigscape_v1(self, tmp_path): - result = bigscape.run_bigscape( - antismash_path=DATA_DIR, - output_path=tmp_path, - extra_params="--help", - version=1, - ) +def test_run_bigscape_v1(tmp_path): + result = bigscape.run_bigscape( + antismash_path=DATA_DIR, + output_path=tmp_path, + extra_params="--help", + version=1, + ) + + assert result is True + + +def test_run_bigscape_v2(tmp_path): + result = bigscape.run_bigscape( + antismash_path=DATA_DIR, + output_path=tmp_path, + extra_params="--help", + version=2, + ) + + assert result is True - assert result is True - def test_run_bigscape_v2(self, tmp_path): - result = bigscape.run_bigscape( +def test_run_bigscape_small_dataset_v1(tmp_path): + result = bigscape.run_bigscape( + antismash_path=DATA_DIR / "bigscape/minimal_dataset", + output_path=tmp_path, + extra_params="", + version=1, + ) + + assert result is True + + +def test_run_bigscape_small_dataset_v2(tmp_path): + result = bigscape.run_bigscape( + antismash_path=DATA_DIR / "bigscape/minimal_dataset", + output_path=tmp_path, + extra_params="", + version=2, + ) + + assert result is True + + +def test_run_bigscape_wrong_version(tmp_path): + with pytest.raises(ValueError) as e: + bigscape.run_bigscape( antismash_path=DATA_DIR, output_path=tmp_path, extra_params="--help", - version=2, + version=3, ) - assert result is True + assert "version" in e.value.args[0] - def test_run_bigscape_small_dataset_v1(self, tmp_path): - result = bigscape.run_bigscape( - antismash_path=DATA_DIR / "bigscape/minimal_dataset", + +def test_input_path_not_exist_v1(tmp_path): + with pytest.raises(FileNotFoundError) as e: + bigscape.run_bigscape( + antismash_path=tmp_path / "not_exist", output_path=tmp_path, extra_params="", version=1, ) - assert result is True + assert "antismash_path" in e.value.args[0] + - def test_run_bigscape_small_dataset_v2(self, tmp_path): - result = bigscape.run_bigscape( - antismash_path=DATA_DIR / 
"bigscape/minimal_dataset", +def test_input_path_not_exist_v2(tmp_path): + with pytest.raises(FileNotFoundError) as e: + bigscape.run_bigscape( + antismash_path=tmp_path / "not_exist", output_path=tmp_path, extra_params="", version=2, ) - assert result is True - - def test_run_bigscape_wrong_version(self, tmp_path): - with pytest.raises(ValueError) as e: - bigscape.run_bigscape( - antismash_path=DATA_DIR, - output_path=tmp_path, - extra_params="--help", - version=3, - ) - - assert "version" in e.value.args[0] - - def test_input_path_not_exist_v1(self, tmp_path): - with pytest.raises(FileNotFoundError) as e: - bigscape.run_bigscape( - antismash_path=tmp_path / "not_exist", - output_path=tmp_path, - extra_params="", - version=1, - ) - - assert "antismash_path" in e.value.args[0] - - def test_input_path_not_exist_v2(self, tmp_path): - with pytest.raises(FileNotFoundError) as e: - bigscape.run_bigscape( - antismash_path=tmp_path / "not_exist", - output_path=tmp_path, - extra_params="", - version=2, - ) - - assert "antismash_path" in e.value.args[0] + assert "antismash_path" in e.value.args[0] From 65fa549e21e33f19b00830db89da8e68cb2f5cc1 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Tue, 16 Jul 2024 12:57:23 +0200 Subject: [PATCH 35/55] force string for mypy --- src/nplinker/genomics/bigscape/runbigscape.py | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index 3c2a764a2..0d43bd581 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -57,7 +57,6 @@ def run_bigscape( if not os.path.exists(antismash_path): raise FileNotFoundError(f'antismash_path "{antismash_path}" does not exist!') - logger.info(f"Running BiG-SCAPE version {version}") logger.info( f'run_bigscape: input="{antismash_path}", output="{output_path}", extra_params={extra_params}"' @@ -90,6 +89,6 @@ def run_bigscape( # otherwise log 
details and raise a runtime error logger.error(f"BiG-SCAPE failed with return code {result.returncode}") - logger.error(f"output: {result.stdout}") + logger.error(f"output: {str(result.stdout)}") raise RuntimeError(f"Failed to run BiG-SCAPE with error code {result.returncode}") From 3096bcc5a988ce615d27d99c9202ae653a9e322c Mon Sep 17 00:00:00 2001 From: "Arjan Draisma (wur)" <74908173+adraismawur@users.noreply.github.com> Date: Wed, 17 Jul 2024 11:26:08 +0200 Subject: [PATCH 36/55] Apply suggestions from code review Co-authored-by: Cunliang Geng --- src/nplinker/genomics/bigscape/runbigscape.py | 8 ++++---- tests/unit/genomics/test_runbigscape.py | 4 ++-- 2 files changed, 6 insertions(+), 6 deletions(-) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index 0d43bd581..bf8173b12 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -15,7 +15,7 @@ def run_bigscape( antismash_path: str | PathLike, output_path: str | PathLike, extra_params: str, - version: int = 1, + version: Literal[1, 2] = 1, ) -> bool: """Runs BiG-SCAPE to cluster BGCs. @@ -34,7 +34,7 @@ def run_bigscape( antismash_path: Path to the antismash output directory. output_path: Path to the output directory where BiG-SCAPE will write its results. extra_params: Additional parameters to pass to BiG-SCAPE. - version: The version of BiG-SCAPE to run. Can be 1 or 2. + version: The version of BiG-SCAPE to run. Must be 1 or 2. Returns: True if BiG-SCAPE ran successfully, False otherwise. @@ -45,13 +45,13 @@ def run_bigscape( elif version == 2: bigscape_py_path = "bigscape-v2.py" else: - raise ValueError("Unexpected BiG-SCAPE version number specified") + raise ValueError("Invalid BiG-SCAPE version number. 
Expected: 1 or 2.") try: subprocess.run([bigscape_py_path, "-h"], capture_output=True, check=True) except Exception as e: raise FileNotFoundError( - f"Failed to find/run bigscape.py (path={bigscape_py_path}, err={e})" + f"Failed to find/run BiG-SCAPE executable program (path={bigscape_py_path}, err={e})" ) from e if not os.path.exists(antismash_path): diff --git a/tests/unit/genomics/test_runbigscape.py b/tests/unit/genomics/test_runbigscape.py index 30833dc97..e8c6e0abd 100644 --- a/tests/unit/genomics/test_runbigscape.py +++ b/tests/unit/genomics/test_runbigscape.py @@ -27,7 +27,7 @@ def test_run_bigscape_v2(tmp_path): def test_run_bigscape_small_dataset_v1(tmp_path): result = bigscape.run_bigscape( - antismash_path=DATA_DIR / "bigscape/minimal_dataset", + antismash_path=DATA_DIR / "bigscape" / "minimal_dataset", output_path=tmp_path, extra_params="", version=1, @@ -38,7 +38,7 @@ def test_run_bigscape_small_dataset_v1(tmp_path): def test_run_bigscape_small_dataset_v2(tmp_path): result = bigscape.run_bigscape( - antismash_path=DATA_DIR / "bigscape/minimal_dataset", + antismash_path=DATA_DIR / "bigscape" / "minimal_dataset", output_path=tmp_path, extra_params="", version=2, From d4cf769dbb5abe2ab1d70300d6ba87af18c62489 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 17 Jul 2024 11:29:05 +0200 Subject: [PATCH 37/55] add exceptions to docstring --- src/nplinker/genomics/bigscape/runbigscape.py | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index bf8173b12..7de932939 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -38,6 +38,12 @@ def run_bigscape( Returns: True if BiG-SCAPE ran successfully, False otherwise. + + Raises: + ValueError: If an unexpected BiG-SCAPE version number is specified. 
+ FileNotFoundError: If the antismash_path does not exist or if the BiG-SCAPE python + script could not be found. + RuntimeError: If BiG-SCAPE fails to run. """ # switch to correct version of BiG-SCAPE if version == 1: From c00d59c6b621e01c0c668f8b72286b7b10034fee Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 17 Jul 2024 11:34:46 +0200 Subject: [PATCH 38/55] add docstring to tests --- tests/unit/genomics/test_runbigscape.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/tests/unit/genomics/test_runbigscape.py b/tests/unit/genomics/test_runbigscape.py index e8c6e0abd..cd7e124ad 100644 --- a/tests/unit/genomics/test_runbigscape.py +++ b/tests/unit/genomics/test_runbigscape.py @@ -4,6 +4,7 @@ def test_run_bigscape_v1(tmp_path): + """Test whether BiG-SCAPE v1 runs at all using the --help command""" result = bigscape.run_bigscape( antismash_path=DATA_DIR, output_path=tmp_path, @@ -15,6 +16,7 @@ def test_run_bigscape_v1(tmp_path): def test_run_bigscape_v2(tmp_path): + """Test whether BiG-SCAPE v2 runs at all using the --help command""" result = bigscape.run_bigscape( antismash_path=DATA_DIR, output_path=tmp_path, From 18b231786aacc6210ac2cd144a82e6e8481d0229 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 17 Jul 2024 11:34:55 +0200 Subject: [PATCH 39/55] use tmp path instead of data path --- tests/unit/genomics/test_runbigscape.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/tests/unit/genomics/test_runbigscape.py b/tests/unit/genomics/test_runbigscape.py index cd7e124ad..656b689f4 100644 --- a/tests/unit/genomics/test_runbigscape.py +++ b/tests/unit/genomics/test_runbigscape.py @@ -6,7 +6,7 @@ def test_run_bigscape_v1(tmp_path): """Test whether BiG-SCAPE v1 runs at all using the --help command""" result = bigscape.run_bigscape( - antismash_path=DATA_DIR, + antismash_path=tmp_path, output_path=tmp_path, extra_params="--help", version=1, @@ -18,7 +18,7 @@ def test_run_bigscape_v1(tmp_path): def 
test_run_bigscape_v2(tmp_path): """Test whether BiG-SCAPE v2 runs at all using the --help command""" result = bigscape.run_bigscape( - antismash_path=DATA_DIR, + antismash_path=tmp_path, output_path=tmp_path, extra_params="--help", version=2, From 8a356a500d45b9fddfdb8a9a45fcdffcd6194a17 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 17 Jul 2024 11:42:59 +0200 Subject: [PATCH 40/55] add missing typing --- src/nplinker/genomics/bigscape/runbigscape.py | 1 + 1 file changed, 1 insertion(+) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index 7de932939..e2f983121 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -4,6 +4,7 @@ import subprocess import sys from os import PathLike +from typing import Literal logger = logging.getLogger(__name__) From 5726f22f6cd988c9df4e0a2a19cd7f7162bcbf52 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 17 Jul 2024 11:43:40 +0200 Subject: [PATCH 41/55] add explanation of cluster mode --- src/nplinker/data/nplinker.toml | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/src/nplinker/data/nplinker.toml b/src/nplinker/data/nplinker.toml index 15b002498..5449f35f0 100644 --- a/src/nplinker/data/nplinker.toml +++ b/src/nplinker/data/nplinker.toml @@ -22,7 +22,7 @@ podp_id = "" # The default value is "INFO". level = "INFO" # The log file to append log messages. -# The value is optional. +# The value is optional. # If not set or use empty string, log messages will not be written to a file. # The file will be created if it does not exist. Log messages will be appended to the file if it exists. 
file = "path/to/logfile" @@ -56,6 +56,8 @@ version = 1 parameters = "--mibig --clans-off --mix --include_singletons --cutoffs 0.30" # for version 2, use the following parameters string: # parameters = "--mibig_version 3.1 --include_singletons --gcf_cutoffs 0.30" +# Note that for BiG-SCAPE version 2, you cannot set any other mode other than "cluster" +# using these parameters # Which bigscape cutoff to use for NPLinker analysis. # There might be multiple cutoffs in bigscape output. # Note that this value must be a string. From aab5e6925c338df5edcab5a0eac2f72c30f699b3 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 17 Jul 2024 11:43:52 +0200 Subject: [PATCH 42/55] parameterize tests --- tests/unit/genomics/test_runbigscape.py | 52 +++++-------------------- 1 file changed, 10 insertions(+), 42 deletions(-) diff --git a/tests/unit/genomics/test_runbigscape.py b/tests/unit/genomics/test_runbigscape.py index 656b689f4..45c696496 100644 --- a/tests/unit/genomics/test_runbigscape.py +++ b/tests/unit/genomics/test_runbigscape.py @@ -3,47 +3,26 @@ from .. 
import DATA_DIR -def test_run_bigscape_v1(tmp_path): - """Test whether BiG-SCAPE v1 runs at all using the --help command""" +@pytest.mark.parametrize("version", [1, 2]) +def test_run_bigscape(tmp_path, version): + """Test whether BiG-SCAPE runs at all using the --help command""" result = bigscape.run_bigscape( antismash_path=tmp_path, output_path=tmp_path, extra_params="--help", - version=1, + version=version, ) assert result is True -def test_run_bigscape_v2(tmp_path): - """Test whether BiG-SCAPE v2 runs at all using the --help command""" - result = bigscape.run_bigscape( - antismash_path=tmp_path, - output_path=tmp_path, - extra_params="--help", - version=2, - ) - - assert result is True - - -def test_run_bigscape_small_dataset_v1(tmp_path): - result = bigscape.run_bigscape( - antismash_path=DATA_DIR / "bigscape" / "minimal_dataset", - output_path=tmp_path, - extra_params="", - version=1, - ) - - assert result is True - - -def test_run_bigscape_small_dataset_v2(tmp_path): +@pytest.mark.parametrize("version", [1, 2]) +def test_run_bigscape_small_dataset(tmp_path, version): result = bigscape.run_bigscape( antismash_path=DATA_DIR / "bigscape" / "minimal_dataset", output_path=tmp_path, extra_params="", - version=2, + version=version, ) assert result is True @@ -61,25 +40,14 @@ def test_run_bigscape_wrong_version(tmp_path): assert "version" in e.value.args[0] -def test_input_path_not_exist_v1(tmp_path): - with pytest.raises(FileNotFoundError) as e: - bigscape.run_bigscape( - antismash_path=tmp_path / "not_exist", - output_path=tmp_path, - extra_params="", - version=1, - ) - - assert "antismash_path" in e.value.args[0] - - -def test_input_path_not_exist_v2(tmp_path): +@pytest.mark.parametrize("version", [1, 2]) +def test_input_path_not_exist(tmp_path, version): with pytest.raises(FileNotFoundError) as e: bigscape.run_bigscape( antismash_path=tmp_path / "not_exist", output_path=tmp_path, extra_params="", - version=2, + version=version, ) assert "antismash_path" in 
e.value.args[0] From 1d6da6099bf1d5a143a11c4cca8cb699b00914f3 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 17 Jul 2024 13:16:54 +0200 Subject: [PATCH 43/55] remove two gbks --- .../JK1_GCF_00/BGC0001596.region001.gbk | 2043 --------- .../JK1_GCF_01/JK1.region01.gbk | 3887 ----------------- 2 files changed, 5930 deletions(-) delete mode 100755 tests/unit/data/bigscape/minimal_dataset/JK1_GCF_00/BGC0001596.region001.gbk delete mode 100755 tests/unit/data/bigscape/minimal_dataset/JK1_GCF_01/JK1.region01.gbk diff --git a/tests/unit/data/bigscape/minimal_dataset/JK1_GCF_00/BGC0001596.region001.gbk b/tests/unit/data/bigscape/minimal_dataset/JK1_GCF_00/BGC0001596.region001.gbk deleted file mode 100755 index ce0e4e4e6..000000000 --- a/tests/unit/data/bigscape/minimal_dataset/JK1_GCF_00/BGC0001596.region001.gbk +++ /dev/null @@ -1,2043 +0,0 @@ -LOCUS BGC0001596 46688 bp DNA linear CON 11-APR-2022 -DEFINITION Streptomyces albus strain DSM 41398 chromosome, complete genome. -ACCESSION BGC0001596 -VERSION BGC0001596 -KEYWORDS . -SOURCE Streptomyces albus - ORGANISM Streptomyces albus - Bacteria; Actinobacteria; Streptomycetales; Streptomycetaceae; - Streptomyces. -COMMENT REFSEQ INFORMATION: The reference sequence is identical to - CP010519.1. - The annotation was added by the NCBI Prokaryotic Genome Annotation - Pipeline (PGAP). Information about PGAP can be found here: - https://www.ncbi.nlm.nih.gov/genome/annotation_prok/ - COMPLETENESS: full length. - ##antiSMASH-Data-START## - Version :: 6.2.0-924c3663(changed) - Run date :: 2022-11-08 02:46:11 - NOTE: This is a single region extracted from a larger record! - Orig. start :: 0 - Orig. end :: 46688 - ##antiSMASH-Data-END## -FEATURES Location/Qualifiers - CDS 1..468 - /codon_start=1 - /inference="COORDINATES: protein motif:HMM:NF024970.2" - /locus_tag="SLNWT_RS23545" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5111" - /product="ATP-binding protein" - /protein_id="WP_052482552.1" - /transl_table=11 - /translation="MSTVRDPGPLAAPVRLAPRATALRETEALCSMPVSAEAVPLLRRF - ARDTSRQWDLPGSAQEAACVIVTELVTNVLLHSGSRDVTLRIVLSDFALTVHVDDEGRW - KHRPAARLATEDAGARCGRGLQLVDAYAVACDVDRTERGTRVRAEIAVAAA" - subregion 1..46688 - /aStool="externally annotated by: MIBiG" - /contig_edge="True" - /label="BGC0001596" - /subregion_number="1" - /tool="antismash" - region 1..46688 - /candidate_cluster_numbers="1" - /contig_edge="True" - /product="T2PKS" - /region_number="1" - /rules="(t2ks and t2clf)" - /subregion_numbers="1" - /tool="antismash" - protocluster 1..44880 - /aStool="rule-based-clusters" - /category="PKS" - /contig_edge="True" - /core_location="[7427:9880]" - /cutoff="20000" - /detection_rule="(t2ks and t2clf)" - /neighbourhood="35000" - /product="T2PKS" - /protocluster_number="1" - /t2pks_malonyl_elongations="8|9 (Score: 709.5; E-value: - 2.4e-216)" - /t2pks_molecular_weights="acetyl-CoA_8 (Da): 396.388" - /t2pks_molecular_weights="acetyl-CoA_9 (Da): 438.425" - /t2pks_product_classes="angucycline" - /t2pks_starter_units="acetyl-CoA (Score: 0.0; E-value: 0)" - /tool="antismash" - proto_core 7428..9880 - /aStool="rule-based-clusters" - /tool="antismash" - /cutoff="20000" - /detection_rule="(t2ks and t2clf)" - /neighbourhood="35000" - /product="T2PKS" - /protocluster_number="1" - /t2pks_malonyl_elongations="8|9 (Score: 709.5; E-value: - 2.4e-216)" - /t2pks_molecular_weights="acetyl-CoA_8 (Da): 396.388" - /t2pks_molecular_weights="acetyl-CoA_9 (Da): 438.425" - /t2pks_product_classes="angucycline" - /t2pks_starter_units="acetyl-CoA (Score: 0.0; E-value: 0)" - cand_cluster 1..44880 - /SMILES="" - /candidate_cluster_number="1" - /contig_edge="True" - /detection_rules="(t2ks and t2clf)" - /kind="single" - /product="T2PKS" - /protoclusters="1" - /tool="antismash" - gene 1..468 - /locus_tag="SLNWT_RS23545" - /old_locus_tag="SLNWT_5111" - gene complement(509..1117) - 
/locus_tag="SLNWT_RS23550" - /old_locus_tag="SLNWT_5112" - CDS complement(509..1117) - /codon_start=1 - /gene_functions="regulatory (smcogs) SMCOG1057:TetR family - transcriptional regulator (Score: 90.1; E-value: 4.1e-27)" - /gene_kind="regulatory" - /inference="COORDINATES: protein motif:HMM:NF012655.2" - /locus_tag="SLNWT_RS23550" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5112" - /product="TetR/AcrR family transcriptional regulator" - /protein_id="WP_052482553.1" - /transl_table=11 - /translation="MAAGSEKTTGAEKAQSTRPRLRADAERNRARVLNAARELFAERGA - EVSMDEVARRAEVGIGTLYRHFPTKEAMVIAAGQQRFGEILTYYRTVCRDSAEPLQALH - LLLTRIAEVESRDRGFATAVTEGSLGSEGPRSPLREDLEAELMALIGKGQEGGSIRQDM - ASVDILSLTCGLTSIVHRRSGDWRRYIDIMLDGLKSQAA" - gene 1422..1832 - /locus_tag="SLNWT_RS23555" - /old_locus_tag="SLNWT_5113" - CDS 1422..1832 - /GO_function="GO:0070967 - coenzyme F420 binding [Evidence - IEA]; GO:0016491 - oxidoreductase activity [Evidence IEA]" - /GO_process="GO:0008150 - biological_process [Evidence - IEA]" - /codon_start=1 - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_018104096.1" - /locus_tag="SLNWT_RS23555" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5113" - /product="TIGR03618 family F420-dependent PPOX class - oxidoreductase" - /protein_id="WP_040258142.1" - /transl_table=11 - /translation="MSRERASAPRVTPSVEAFLAEPHLATLTTLRPDGTPHVVAVRFTW - DARSGLARVMTVRDSRKVRNVLAAPGGRAALCQVAGFKWVTLEGAATVSEDPVRVTEGA - RRYAARYLSPPPNPPGRVVVEIAVDRVMSLNS" - gene complement(2013..2462) - /locus_tag="SLNWT_RS23560" - /old_locus_tag="SLNWT_5114" - CDS complement(2013..2462) - /codon_start=1 - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_018383123.1" - /locus_tag="SLNWT_RS23560" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5114" - /product="nuclear transport factor 2 family protein" - /protein_id="WP_040253434.1" - /transl_table=11 - /translation="MTPSESTAEIAGLLDRYLITLDDEKLDDDWTRSLFTEDASVTFPV - GGHQGAAGMGAFHQRTLDAFTCTQHMGTHAFVEIEGGGDTARLRANCTSTHVHRPENAA - ELGPLFRTGTFVDGRARRTPEGWRLSALSFRLMWKHGTPPGGGGR" - gene 2627..4096 - /locus_tag="SLNWT_RS23565" - /old_locus_tag="SLNWT_5115" - CDS 2627..4096 - /GO_function="GO:0071949 - FAD binding [Evidence IEA]" - /codon_start=1 - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1050:monooxygenase FAD-binding (Score: 515.3; E-value: - 3.1e-156)" - /gene_functions="biosynthetic-additional (t2pks) OXY - (Score: 501.7; E-value: 5.3e-153)" - /gene_kind="biosynthetic-additional" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_007385270.1" - /locus_tag="SLNWT_RS23565" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5115" - /product="FAD-dependent monooxygenase" - /protein_id="WP_040253436.1" - /transl_table=11 - /translation="MENFDADVIIVGAGPTGLMLAGELGLHGISALAVDRLEEPIQQSR - ALGFSARTIEEFGQRGLLARFGQVDVIPFGHFGGVPLDFQIVEGGSYGARGIPQSRTEG - VLAGWAREKGAEIRRGVEVTGLDDDGEGVTLQVRTGEGESRLRGRYVVGCDGARSVVRK - AAGIGFPGSEAEIELRFADISGIQLRPRFIGEKVPGGMVMVLPLGPDRSRIIYFDRTQP - LRESAEPITFEEASEAFQRLCGEDISGATPHWVSSTTDVSRQAEAYRSGRVFVAGDAAH - IHLPIGAQGMSAGIQDAVNLGWKLALDLKGRAPEGLLDTYHEERHPVGRRILVNTLAQR - SLYLGGEEMKPLVDVMGELAGYEVVRKHLVGMVTGLDIRHSTVPGEHPLLGRRLPDREL - AVGGEKTTVFALLTEGRGVLLDLSGSAEARKAAEGHAGRVEVVTAESHGIGAELDALLV - RPDGYVAWVAPAGSGAEGLLEALDHWFGAAD" - gene 4166..4855 - /locus_tag="SLNWT_RS23570" - /old_locus_tag="SLNWT_5116" - CDS 4166..4855 - /codon_start=1 - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_018383121.1" - /locus_tag="SLNWT_RS23570" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5116" - /product="antibiotic biosynthesis monooxygenase" - /protein_id="WP_040253438.1" - /transl_table=11 - /translation="MPKISTEDGYLTVLNLFTADAPEKQEKLLGEMRKIVDAATYEGWI - SSTVHAGVDQPGTANFIQWRSGEDLEKRYAGEEFKHRTLPVFGEMTTSIRLLQNDIVYT - QRAPELNGVTEISPDRDDYTVITVFGVEKENQDALVEALSQDHFLKVDGYRSHSVLKGR - AARGLEGSFVVAYSQWASKEAYDAFNSQPEGERSAERKEAEATVRSLITSVDSNTYRVV - HTRAAGE" - gene 5176..6491 - /locus_tag="SLNWT_RS23575" - /pseudo="" - CDS 5176..6491 - /codon_start=1 - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_015036312.1" - /locus_tag="SLNWT_RS23575" - /note="frameshifted; Derived by automated computational - analysis using gene prediction method: Protein Homology." - /product="multicopper oxidase family protein" - /pseudo="" - /transl_table=11 - /translation="VKFTRPLPALPVLSPRRRTARAETYELRQRETECEIVPGLKTRVR - TFDGCFAPPVIKAVRGRRTVIRQVNELTVPTSIHLHGGHVPESSDGGPMDLVQPGASRT - YTYPNEQAHANLWFHDHAHHQESETVFRGLTGLICSPTRPSSGCRCPRAPTTCRSRSAT - SASTRPGRSSTP" - gene 7073..7396 - /locus_tag="SLNWT_RS23580" - /old_locus_tag="SLNWT_5120" - CDS 7073..7396 - /codon_start=1 - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1225:Polyketide synthesis cyclase (Score: 159.3; - E-value: 4.3e-49)" - /gene_functions="biosynthetic-additional (t2pks) CYC - C4-C17/C2-C19 (Score: 196.7; E-value: 8.3e-61)" - /gene_kind="biosynthetic-additional" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_018383120.1" - /locus_tag="SLNWT_RS23580" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5120" - /product="TcmI family type II polyketide cyclase" - /protein_id="WP_040253440.1" - /transl_table=11 - /translation="MHSTLIVARMDLGSSKDVAGLFGEFDATEMPHRMGTRRRQLFAYK - GLYFHLQDFDEDNGGERIEEAKTDPRFIGISQDLKPFIEAYDPATWRSPADAMAQRFYT - WEA" - gene 7428..8669 - /locus_tag="SLNWT_RS23585" - /old_locus_tag="SLNWT_5121" - CDS 7428..8669 - /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (44-387). 
E-value: - 6.2e-54. Score: 175.3. Matches aSDomain: - nrpspksdomains_SLNWT_RS23585_PKS_KS.1" - /codon_start=1 - /gene_functions="biosynthetic (rule-based-clusters) T2PKS: - t2ks" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1022:Beta-ketoacyl synthase (Score: 467.5; E-value: - 6.9e-142)" - /gene_functions="biosynthetic-additional (t2pks) KS (Score: - 765.6; E-value: 2.8e-233)" - /gene_kind="biosynthetic" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_018383119.1" - /locus_tag="SLNWT_RS23585" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5121" - /product="beta-ketoacyl-[acyl-carrier-protein] synthase - family protein" - /protein_id="WP_052483223.1" - /sec_met_domain="t2ks (E-value: 4.2e-244, bitscore: 801.4, - seeds: 25, tool: rule-based-clusters)" - /transl_table=11 - /translation="MEVLAPGGVGTKNFWSLLSEGRTATRGITFFDPAPFRSRVAAEID - FDPYAHGLSPHEVRRMDRAAQLAVVAARGALADSGLETAALEPHRTGVTVGSAVGATMG - LDEEYRVVSDGGRLDLVDHAYAVPHLYNHLVPSSFAAEVAWAVGAEGPSTVVSTGCTSG - IDALGYALELVREGSVDVMVAGASDAPISPITMACFDAIKATTPRHDDPEHASRPFDGT - RNGFVLGEGSAFFVLEEWESARRRGAHVYAELAGYATRSNAYHMTGLRTDGAEMAEAIR - LALDEARLAPEAIDYVNAHGSGTKQNDRHETAAFKKSLGAHAYATPVSSIKSMVGHSLG - AIGSIEIAASALAMEHHTVPPTANLTTPDPECDLDYVPLHAREQRTDAVLSVGSGFGGF - QSAMVLARPERSPA" - aSDomain 7560..8588 - /aSDomain="PKS_KS" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_SLNWT_RS23585_PKS_KS.1" - /domain_subtype="Iterative-KS" - /evalue="6.20E-54" - /label="SLNWT_RS23585_PKS_KS.1" - /locus_tag="SLNWT_RS23585" - /protein_end="387" - /protein_start="44" - /score="175.3" - /tool="antismash" - /translation="DFDPYAHGLSPHEVRRMDRAAQLAVVAARGALADSGLETAALEPH - RTGVTVGSAVGATMGLDEEYRVVSDGGRLDLVDHAYAVPHLYNHLVPSSFAAEVAWAVG - AEGPSTVVSTGCTSGIDALGYALELVREGSVDVMVAGASDAPISPITMACFDAIKATTP - RHDDPEHASRPFDGTRNGFVLGEGSAFFVLEEWESARRRGAHVYAELAGYATRSNAYHM - 
TGLRTDGAEMAEAIRLALDEARLAPEAIDYVNAHGSGTKQNDRHETAAFKKSLGAHAYA - TPVSSIKSMVGHSLGAIGSIEIAASALAMEHHTVPPTANLTTPDPECDLDYVPLHAREQ - RTD" - gene 8666..9880 - /locus_tag="SLNWT_RS23590" - /old_locus_tag="SLNWT_5122" - CDS 8666..9880 - /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (68-400). E-value: - 1.4e-31. Score: 101.6. Matches aSDomain: - nrpspksdomains_SLNWT_RS23590_PKS_KS.1" - /codon_start=1 - /gene_functions="biosynthetic (rule-based-clusters) T2PKS: - t2clf" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1093:Beta-ketoacyl synthase (Score: 681.1; E-value: - 6.9e-207)" - /gene_functions="biosynthetic-additional (t2pks) CLF 8|9 - (Score: 709.5; E-value: 2.4e-216)" - /gene_kind="biosynthetic" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_010359931.1" - /locus_tag="SLNWT_RS23590" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5122" - /product="ketosynthase chain-length factor" - /protein_id="WP_040253445.1" - /sec_met_domain="t2clf (E-value: 1.6e-212, bitscore: 696.9, - seeds: 26, tool: rule-based-clusters)" - /transl_table=11 - /translation="MSAPAVITGIGVAAPNGLGLRDYWAATLGGKSGIARLTHFDPSGY - PAQLAGEVPGFVAEDHLPSRLIPQTDRMTRMALAAADWALADAGITPAELPSFDMGVVT - ASSSGGFEFGQGELRKLWSQGSQFVSAYQSFAWFYAVNSGQISIRNGMKGPSGVVVSDQ - AGGLDALAQARRQIRRGTPLIVTGAVDASLCPWGWVAQLSGGRMSTSAEAARAYLPFDR - EARGYVPGEGGAILIMEDAEAARARGARVHGRILGYGATFDPRPGSGRPPALRRAAQTA - LADAGVDAADIDVVFADAAGEPAADRAEAEVLTALFGIRGVPVTAPKTMTGRLYSGAAP - LDVTAALLALRDQVIPPTVHVEPCPEYGLDLVLAQPRPAKLRTALVLARGHGGFNSALV - VRGPE" - aSDomain 8870..9865 - /aSDomain="PKS_KS" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_SLNWT_RS23590_PKS_KS.1" - /domain_subtype="Iterative-KS" - /evalue="1.40E-31" - /label="SLNWT_RS23590_PKS_KS.1" - /locus_tag="SLNWT_RS23590" - /protein_end="400" - /protein_start="68" - /score="101.6" - /tool="antismash" - 
/translation="QTDRMTRMALAAADWALADAGITPAELPSFDMGVVTASSSGGFEF - GQGELRKLWSQGSQFVSAYQSFAWFYAVNSGQISIRNGMKGPSGVVVSDQAGGLDALAQ - ARRQIRRGTPLIVTGAVDASLCPWGWVAQLSGGRMSTSAEAARAYLPFDREARGYVPGE - GGAILIMEDAEAARARGARVHGRILGYGATFDPRPGSGRPPALRRAAQTALADAGVDAA - DIDVVFADAAGEPAADRAEAEVLTALFGIRGVPVTAPKTMTGRLYSGAAPLDVTAALLA - LRDQVIPPTVHVEPCPEYGLDLVLAQPRPAKLRTALVLARGHGGFNSALVV" - CDS_motif 9323..9361 - /aSTool="nrps_pks_domains" - /database="abmotifs" - /detection="hmmscan" - /domain_id="nrpspksmotif_SLNWT_RS23590_0001" - /evalue="2.00E-03" - /label="PKSI-KS_m4" - /locus_tag="SLNWT_RS23590" - /protein_end="232" - /protein_start="219" - /score="11.4" - /tool="antismash" - /translation="FDREARGYVPGEG" - gene 9975..10244 - /locus_tag="SLNWT_RS23595" - /old_locus_tag="SLNWT_5123" - CDS 9975..10244 - /NRPS_PKS="Domain: ACP (12-82). E-value: 1.7e-16. Score: - 52.2. Matches aSDomain: nrpspksdomains_SLNWT_RS23595_ACP.1" - /codon_start=1 - /gene_functions="biosynthetic-additional - (rule-based-clusters) PP-binding" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1129:acyl carrier protein (Score: 118.5; E-value: - 1.6e-36)" - /gene_functions="biosynthetic-additional (t2pks) ACP - (Score: 133.6; E-value: 4.3e-42)" - /gene_kind="biosynthetic-additional" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_018383117.1" - /locus_tag="SLNWT_RS23595" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5123" - /product="acyl carrier protein" - /protein_id="WP_040253447.1" - /sec_met_domain="PP-binding (E-value: 7.6e-10, bitscore: - 30.7, seeds: 164, tool: rule-based-clusters)" - /transl_table=11 - /translation="MATAAFTLDDLKRILLQSAGAAEGVDLDGEILDTEFEVLGYESLA - LLETGGAIEREYGISLDDEVITDAETPRALIDAVNAHLSTAGAA" - aSDomain 10011..10220 - /aSDomain="ACP" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_SLNWT_RS23595_ACP.1" - /evalue="1.70E-16" - /label="SLNWT_RS23595_ACP.1" - /locus_tag="SLNWT_RS23595" - /protein_end="82" - /protein_start="12" - /score="52.2" - /tool="antismash" - /translation="RILLQSAGAAEGVDLDGEILDTEFEVLGYESLALLETGGAIEREY - GISLDDEVITDAETPRALIDAVNAH" - gene 10263..11057 - /locus_tag="SLNWT_RS23600" - /old_locus_tag="SLNWT_5124" - CDS 10263..11057 - /NRPS_PKS="Domain: PKS_KR (11-121). E-value: 3.7e-10. - Score: 31.8. Matches aSDomain: - nrpspksdomains_SLNWT_RS23600_PKS_KR.1" - /codon_start=1 - /gene_functions="biosynthetic-additional - (rule-based-clusters) adh_short" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1001:short-chain dehydrogenase/reductase SDR (Score: - 259.9; E-value: 3.7e-79)" - /gene_functions="biosynthetic-additional (t2pks) KR C9 - (Score: 473.5; E-value: 3.7e-145)" - /gene_kind="biosynthetic-additional" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_018839768.1" - /locus_tag="SLNWT_RS23600" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5124" - /product="SDR family NAD(P)-dependent oxidoreductase" - /protein_id="WP_040253449.1" - /sec_met_domain="adh_short (E-value: 8.9e-36, bitscore: - 115.0, seeds: 230, tool: rule-based-clusters)" - /transl_table=11 - /translation="MTENTQEHGRLALVSGGTSGIGLASARLLAEQGHRVFLGARDADR - VAATVKELAGEGLPVDGTVLDVREDASVRAFVQAAVDRFGTVDVLVNNAGRSGGGVTAD - IPFELWADVIETNLTSVFRMTKEVLNAGGMRAKSRGRIINIASTAGKQGVVLGAPYSAS - KHGVVGFTKALGNELAPTGITVNAVCPGYVETPMAQRVRQGYADAYDTSEEAILEKFQA - KIPLGRYSTPEEVAGLVGYLASDTAASLTSQALNVCGGLGNF" - aSDomain 10296..10625 - /aSDomain="PKS_KR" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_SLNWT_RS23600_PKS_KR.1" - /evalue="3.70E-10" - /label="SLNWT_RS23600_PKS_KR.1" - /locus_tag="SLNWT_RS23600" - /protein_end="121" - /protein_start="11" - /score="31.8" - /specificity="KR activity: inactive" - /specificity="KR stereochemistry: C1" - /tool="antismash" - /translation="ALVSGGTSGIGLASARLLAEQGHRVFLGARDADRVAATVKELAGE - GLPVDGTVLDVREDASVRAFVQAAVDRFGTVDVLVNNAGRSGGGVTADIPFELWADVIE - TNLTSV" - CDS_motif 10299..10370 - /aSTool="nrps_pks_domains" - /database="abmotifs" - /detection="hmmscan" - /domain_id="nrpspksmotif_SLNWT_RS23600_0001" - /evalue="8.70E-07" - /label="PKSI-KR_m1" - /locus_tag="SLNWT_RS23600" - /protein_end="36" - /protein_start="12" - /score="21.6" - /tool="antismash" - /translation="LVSGGTSGIGLASARLLAEQGHRV" - gene 11107..12048 - /locus_tag="SLNWT_RS23605" - /old_locus_tag="SLNWT_5125" - CDS 11107..12048 - /NRPS_PKS="Domain: Polyketide_cyc2 (4-146). E-value: - 1.4e-18. Score: 59.5. Matches aSDomain: - nrpspksdomains_SLNWT_RS23605_Polyketide_cyc2.1" - /NRPS_PKS="Domain: Polyketide_cyc2 (155-292). E-value: - 2.3e-10. Score: 32.9. 
Matches aSDomain: - nrpspksdomains_SLNWT_RS23605_Polyketide_cyc2.2" - /codon_start=1 - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1128:cyclase/dehydrase (Score: 444.3; E-value: - 3.9e-135)" - /gene_functions="biosynthetic-additional (t2pks) CYC C7-C12 - (Score: 476.4; E-value: 6.9e-146)" - /gene_kind="biosynthetic-additional" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_019330940.1" - /locus_tag="SLNWT_RS23605" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5125" - /product="aromatase/cyclase" - /protein_id="WP_040253451.1" - /transl_table=11 - /translation="MTTREVEHEITIAAPAAAVYRLLAEVANWPRIFPPTLYVDREELG - PGQERIHIWATANGEAKNWTSHRTLDEDALRITFRQEVSPEPVAEMNGTWIIEPQGASS - SRVRLLHAFKAIGDDPHDLLWIETAVDKNSTKELAGLKENVELAHAAEELTFSFTDTVR - IDGAAKDAYDFIDQADKWDERLPHVARVRLTEDTPGLQELEMDTRAKDGSTHTTKSYRV - TFPHHRIAYKQVTLPALMTLHTGIWTFEEDPTGTHTTASSQHTVTLRPENIEKILGPDA - TVADARAYVQSALSTNSTATLGHAKNHAERQG" - aSDomain 11119..11544 - /aSDomain="Polyketide_cyc" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_SLNWT_RS23605_Polyketide_cyc2.1" - /domain_subtype="Polyketide_cyc2" - /evalue="1.40E-18" - /label="SLNWT_RS23605_Polyketide_cyc2.1" - /locus_tag="SLNWT_RS23605" - /protein_end="146" - /protein_start="4" - /score="59.5" - /tool="antismash" - /translation="EVEHEITIAAPAAAVYRLLAEVANWPRIFPPTLYVDREELGPGQE - RIHIWATANGEAKNWTSHRTLDEDALRITFRQEVSPEPVAEMNGTWIIEPQGASSSRVR - LLHAFKAIGDDPHDLLWIETAVDKNSTKELAGLKENVE" - aSModule 11119..11982 - /domains="nrpspksdomains_SLNWT_RS23605_Polyketide_cyc2.1" - /domains="nrpspksdomains_SLNWT_RS23605_Polyketide_cyc2.2" - /incomplete - /locus_tags="SLNWT_RS23605" - /tool="antismash" - /type="unknown" - aSDomain 11572..11982 - /aSDomain="Polyketide_cyc" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - 
/domain_id="nrpspksdomains_SLNWT_RS23605_Polyketide_cyc2.2" - /domain_subtype="Polyketide_cyc2" - /evalue="2.30E-10" - /label="SLNWT_RS23605_Polyketide_cyc2.2" - /locus_tag="SLNWT_RS23605" - /protein_end="292" - /protein_start="155" - /score="32.9" - /tool="antismash" - /translation="FSFTDTVRIDGAAKDAYDFIDQADKWDERLPHVARVRLTEDTPGL - QELEMDTRAKDGSTHTTKSYRVTFPHHRIAYKQVTLPALMTLHTGIWTFEEDPTGTHTT - ASSQHTVTLRPENIEKILGPDATVADARAYVQS" - gene 12048..13505 - /locus_tag="SLNWT_RS23610" - /old_locus_tag="SLNWT_5126" - CDS 12048..13505 - /GO_function="GO:0071949 - FAD binding [Evidence IEA]" - /codon_start=1 - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1050:monooxygenase FAD-binding (Score: 499.9; E-value: - 1.5e-151)" - /gene_functions="biosynthetic-additional (t2pks) OXY - (Score: 551.4; E-value: 4.3e-168)" - /gene_kind="biosynthetic-additional" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_019330939.1" - /locus_tag="SLNWT_RS23610" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5126" - /product="FAD-dependent monooxygenase" - /protein_id="WP_040253452.1" - /transl_table=11 - /translation="MDTADRLETQVIIVGAGPVGLLLAGELRLGGAEVVVLEQREAPTT - ESRASTLHARTMEILDSRGLLAGLGTPPQEPRGHFGGIPLDLTLPSRYPGQWKVPQFRT - EELLQEWALGLGADIRRGHQVHALNPGDQAEYVEAEATGPGGRRVLVRGRHLVACDGEE - GTVRRLTGVVFPGQSATRELLRADVDGIDVPDRRFERLPRGLAIAARRGDGVTRVMAHV - FGSTAQPRTGEAEFGEVVAAWKQVTGEDISGGTPLWVNTFGDASRQLVHYRRGRILFAG - DAAHVQMPIGGQALNLGLQDAFNLGWKLARQLREPGGEALLDSYHTERHAVGRRVLGNI - KAQAMLLLGGPEVEPLRTLLAELIRHEKVRAHLAGMISGLDIRYQLPGPAHPLLGARLP - HTVLTSPQGRVSVSELLRTGRGVWINPGVDVPDGARLSTLTGRPEEGPLTDKDSVLVRP - DGHVAWAGSTGTPPPAEALGPGWEATA" - gene 13588..15108 - /locus_tag="SLNWT_RS23615" - /old_locus_tag="SLNWT_5127" - CDS 13588..15108 - /GO_function="GO:0071949 - FAD binding [Evidence IEA]" - /codon_start=1 - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1050:monooxygenase FAD-binding (Score: 533.9; E-value: - 7.4e-162)" - /gene_functions="biosynthetic-additional (t2pks) OXY - (Score: 546.1; E-value: 1.8e-166)" - /gene_kind="biosynthetic-additional" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_019330938.1" - /locus_tag="SLNWT_RS23615" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5127" - /product="FAD-dependent monooxygenase" - /protein_id="WP_040253455.1" - /transl_table=11 - /translation="MAGTAQGTAVDADVIIVGAGPTGLMLAGELRLGGARVIVAERLAE - PTGQSRGLGFTARAMEIFDQRGLLPRFGQGETLETSPMGHFGGLQFDFTTLPGAHFGAR - GIPQYQTEAVLEEWAAGLGADIRRGWEFLELAEGFLTGEGVEVTFGTPEGVRTLRAAYL - VGCDGGGSQVRKAAGFAFPGLPATRAMFLADVTGLNLKPRFLGERLPHGMVMAAPLAEG - VDRIIVCPHGTPARDRDESVTFEEVAAAWQHITGEDISHGGADWVSSFSDAARQVDSYR - RGRVLLAGDAAHIHLPAGGQGLSTGVQDAANLGWKLAATVAGRAPAGLLDSYHTERHAV - GSRLLMNTRAQGFVFLGGEPADPLRTVFAELLGHEEVKQHLAGIVSHLDVHYAAPEGAH - PLTGHRLGEHILVGKEGESAVFAELHGGRGLLLDLADDAGVRAAGAGLTDRLTTVTATL - KSAPGDADRLDGVRALLVRPDGYVAWAGETTEGLAEAVRRWFGEASPA" - gene 15254..16195 - /locus_tag="SLNWT_RS23620" - /old_locus_tag="SLNWT_5128" - CDS 15254..16195 - /codon_start=1 - /gene_functions="biosynthetic-additional - (rule-based-clusters) Abhydrolase_6" - /gene_functions="biosynthetic-additional - (rule-based-clusters) PF00561" - /gene_kind="biosynthetic-additional" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_018103054.1" - /locus_tag="SLNWT_RS23620" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5128" - /product="alpha/beta fold hydrolase" - /protein_id="WP_052482554.1" - /sec_met_domain="Abhydrolase_6 (E-value: 5.3e-13, bitscore: - 41.5, seeds: 455, tool: rule-based-clusters)" - /sec_met_domain="PF00561 (E-value: 5e-08, bitscore: 24.3, - seeds: 48, tool: rule-based-clusters)" - /transl_table=11 - /translation="MTALGSTPTGDTDPPAPEPPAPDPPVPGAFSTGVRRITLDAGGLD - LSALLSEPEQGPPRATVVAVHGGGMSAGYFDGQAHPEQSLMTLGAQLGYTVLSVDRPGY - GSSAAWLPEGLTLGEQAVVLHAALDDFRRHYAHGAGLFLLAHSLGGALVMATAAGAEAD - RALLGLDVSGCGHRYAVVPDQGRTTRRNTLRHWGPLRLYPPNTFATSTGLVAPVPAREA - GELARWPELFAALAPRISVPVRLTFAEHEAWWRHGEQDLADLAAQLTASPRVLVERQPD - AGHNISLGWAARAYHLRSLAFLEDCLTHTGRE" - gene 16321..16995 - /locus_tag="SLNWT_RS23625" - /old_locus_tag="SLNWT_5130" - CDS 16321..16995 - /GO_function="GO:0008897 - holo-[acyl-carrier-protein] - synthase activity [Evidence IEA]" - /NRPS_PKS="Domain: ACPS (140-185). E-value: 1.2e-11. Score: - 36.4. Matches aSDomain: - nrpspksdomains_SLNWT_RS23625_ACPS.1" - /codon_start=1 - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1012:4'-phosphopantetheinyl transferase (Score: 143.8; - E-value: 7.6e-44)" - /gene_kind="biosynthetic-additional" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_015037171.1" - /locus_tag="SLNWT_RS23625" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5130" - /product="4'-phosphopantetheinyl transferase superfamily - protein" - /protein_id="WP_052482555.1" - /transl_table=11 - /translation="MTSTRAPLPAPGTYQLWVFDSLTEEGIPATRAEAGPEALGPEERR - RARLFRRPADRRQYESAHLVLRRLLADHTGLAPERLEFGREGGRRGKPRLLGSPVPVHF - SLSHSHGLVAIALAADPVGVDVQRVPGARTVERCLPSLHPAERAELTALPESERPDAFA - LLWTRKEAYLKGLGTGLARPLAADYLGSGGLAARPPDWTVHNTAARPGHAAAAALRTPA - TG" - aSDomain 16741..16875 - /aSDomain="ACPS" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_SLNWT_RS23625_ACPS.1" - /evalue="1.20E-11" - /label="SLNWT_RS23625_ACPS.1" - /locus_tag="SLNWT_RS23625" - /protein_end="185" - /protein_start="140" - /score="36.4" - /tool="antismash" - /translation="SLHPAERAELTALPESERPDAFALLWTRKEAYLKGLGTGLARPLA - " - gene 17035..18609 - /locus_tag="SLNWT_RS23630" - /old_locus_tag="SLNWT_5131" - CDS 17035..18609 - /codon_start=1 - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1059:acetyl-CoA carboxylase, carboxyl transferase, - (Score: 729.5; E-value: 4e-221)" - /gene_kind="biosynthetic-additional" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_019520922.1" - /locus_tag="SLNWT_RS23630" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5131" - /product="acyl-CoA carboxylase subunit beta" - /protein_id="WP_052482556.1" - /transl_table=11 - /translation="MATATEDTHHPRALAAELGARKEEARQGPDPRATERQHAKGKLTA - RERIDLLLDKNSFTEVEQLRRHRATGFGLEARKPYTDGVVTGWGTVEGRTVFVYAHDFR - IFGGALGEAHAAKIHKIMDMALAAGAPLVSLNDGAGARIQEGVSALAGYGGIFQRNTRA - SGVIPQISVMLGPCAGGAAYSPALTDFVFMVRDTSQMFITGPDVVQAVTGEEISQNGLG - GAEVHAGTSGVAHFAYDDEETCLAEVRYLLSFLPSNNRSMPPHLPSADPADRPGERLTE - VVPADGNRAYDVREVIEEVVDDGEYLEVHASWAPNLVCALARLDGHVVGVVANQPNAFA - GVLDIRASEKGARFVQFCDSFSIPLVTLVDVPGFLPGVDQEHEGIIRRGAKLLYAYCNA - TVPRVSVVLRKAYGGAYIVMDSRSIGADIALAWPTNEIAVMGAEGAANVVFRREIAAAA - DPGEMRAQKIKEYREELVHPYYAAERGLVDDVIDPRETRAVLCRAVTMLAAKDADLPRR - KHGNPPQ" - gene 18829..19044 - /locus_tag="SLNWT_RS23635" - /old_locus_tag="SLNWT_5132" - CDS 18829..19044 - /codon_start=1 - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_018850635.1" - /locus_tag="SLNWT_RS23635" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5132" - /product="hypothetical protein" - /protein_id="WP_040258146.1" - /transl_table=11 - /translation="MLRVVRGNPAPEELAVLSALLFARLSAPEAQAAGPLGRAVAGWRR - PERGSMFDGPRTWRGTGSAAHPTGGR" - gene complement(19200..19985) - /locus_tag="SLNWT_RS23640" - /old_locus_tag="SLNWT_5133" - CDS complement(19200..19985) - /codon_start=1 - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_017237263.1" - /locus_tag="SLNWT_RS23640" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5133" - /product="DUF3050 domain-containing protein" - /protein_id="WP_040253457.1" - /transl_table=11 - /translation="MSRYDWGKENASIEKLRKVIDDARLEVVKHPIYHRLATLEDVNTF - NENHVFAVWDFMSLLKSLQRSLTCVDVPWVPQGSSESRRLINDIVLVEESDELGDGFIS - HFELYVNGMAEAGADVTVINNFLDRIRGGEGVRTALVGASVPAAAATFVNATFDFIEGA - PLHCRAAAFAFGREDLIPEMFDQVIKVDDQGGKLATFREYLARHIEVDGEEHTPMAMAM - VADLCGEDEAKWQEAAETVTAALRARVALWDGIVAALDA" - gene 20578..20913 - /locus_tag="SLNWT_RS23645" - /old_locus_tag="SLNWT_5135" - CDS 20578..20913 - /codon_start=1 - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_018383104.1" - /locus_tag="SLNWT_RS23645" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5135" - /product="4Fe-4S ferredoxin" - /protein_id="WP_040253458.1" - /transl_table=11 - /translation="MPWEKNEAAGGETSGRDARIAARAREENWKKPPRRIESAECITCD - SCLRGCPAEFGAIFDRGLDVVIIPELCSGCPACVLECPVDCIYVDEDWAPTDESLWKHI - ELTADGA" - gene 20913..22832 - /locus_tag="SLNWT_RS23650" - /old_locus_tag="SLNWT_5136" - CDS 20913..22832 - /codon_start=1 - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_017237261.1" - /locus_tag="SLNWT_RS23650" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5136" - /product="hypothetical protein" - /protein_id="WP_040253460.1" - /transl_table=11 - /translation="MPSPAERGLSRREINARKRQSRRPSRHGSAAGAAPGPDYPREDGV - GFPGLLDRAWRAALAAGELPAAVDALLTLDGHVPGDIQLRALRTADEAALKVLCGASWR - GVRDGGQASGASAERAQVPPQDAVFDGEIALSTTGRILVRVPSQGPLAESGNLVAPALQ - VPWSAADLAAYRTESARAAARYSSAVVDCRQWLAAHSTQAREELLDLLKDAALRTAPFV - LYQEDRQYTNFRDPNTLTGKTLWPGHPDCALSSLAGLPLDQWSDSEAVLVVCLTLLVRS - ASYARIEEANGTQLTPDHVGHLLEGVRRNYNAHSRGEAVPPAASARVADLDALAGALRA - RRTEVLGEVQLYREIHGPLMHKIERTAAPRGAAARHREAEVTARLTEALPLAGEDLGAL - AAHLAESPAWLTKPHGEFRTGLEALVHASVAASTEAFEADFAMSRGMRSLAGLREALRA - QAWAEITDWGITDFFCCVVPDPAARRHFGDSVDRLADTAWAMSSRMQYNSWHFIAGNLP - KVPAVVARDHFVPPTLPDIAFYSDQHHHGHVAAKVRFSIRSPQAVEIDGRRFNGFMDLR - LLRCEGTPFGEQDLLAAHRVSAFVAGATGLAAELVAAGEEIEVTSFDSAWHGESVRAAV - KARG" - gene 22838..24277 - /locus_tag="SLNWT_RS23655" - /old_locus_tag="SLNWT_5137" - CDS 22838..24277 - /codon_start=1 - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1105:amidase (Score: 418.1; E-value: 8.2e-127)" - /gene_kind="biosynthetic-additional" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_018383106.1" - /locus_tag="SLNWT_RS23655" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5137" - /product="amidase family protein" - /protein_id="WP_078845181.1" - /transl_table=11 - /translation="MSPSEAGSVRPVTSEETQLTAYGIAATRALLGRGERTATEHLAAH - LAAIEERDPGLGAFVAVAGEGALRAAAAADARLRALGPAAFQDQPLLGVPVSVKDLIQT - GELPTRRGSLLPNRRPAADAPAVARLKAAGAIVVGKTTTSEYGWSASTVSRVSPPTRNP - WDPAYSAGGSSGGAAASVAAGLCTAALGTDGAGSIRIPAAFCGVVGYKPSFGRVPYVPA - GADRLSHLGPLARSVEDVMEIAAVLPGPHRQDPDSGLGALESRPERRGLRVGWIEFPGT - APEVRRVSERALEALAALGHHPERIEVPFRDPYPALLDILAAAEAAGAAPGDEADGDPG - RLAVVRHGRGLDGAAVMRAEEVRMELRTRLAAVMERHDLLAMATVPVEPFAPEAIGPDW - ASDPESLLWLAWSPATYPFNMTGQPAVSLPAGLSRAGLPVGVQLVGPVGADALVLDTAR - DLEAGLGPLPEVPQRVSERML" - gene 24280..25791 - /locus_tag="SLNWT_RS23660" - /old_locus_tag="SLNWT_5138" - CDS 24280..25791 - /codon_start=1 - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_018383107.1" - /locus_tag="SLNWT_RS23660" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5138" - /product="glutamine synthetase family protein" - /protein_id="WP_040253462.1" - /transl_table=11 - /translation="MYTRKWSRPAAEDGVGRSDFVAEHGLWDERQRAAAAEIEAHLGEV - DLIRLVFGDPHGLARSKTLTVEAFRAALRGGMDYSPGPFLFDTGHAVAVDFLSDPGVDV - PELLGAGNFVVVPDPVTFQLLPGGEARTAWVIGEEYLPDGRPHPLSSRHVLRKVIAAYA - AQEYTPVLGLEVEWYLTRRLEGPVGNAGNGFGLQGEAPRVAAMNPGYQFNSDNAFASVA - AFAHPLSALLRQLGLPLRSMEHESGPGQIETTFAPMHALDTADAMLLFRTLVKQRAAQG - GYHATFMSLPRIDGFDPSGWHVHQSVVDTRTGRNLFAPDDPAAPLSAAGLAYAEGLLRR - ARELCLLSVPTVNGHRRLGSGFSLSPTRIGWSPEDRTAMVRVVGAGGSRHLENRTGEPC - ANPYLALAAQLFAGLEGMNSDSLVPRPALGPDAAGAETLPGSLEESLAAFRQGSPADLL - GTPLARCLAKLKQSELDRFRTWAEKEQPPEGEVTEWEQREYFEAF" - gene 25861..27147 - /gene="purB" - /locus_tag="SLNWT_RS23665" - /old_locus_tag="SLNWT_5139" - CDS 25861..27147 - /EC_number="4.3.2.2" - /GO_function="GO:0004018 - N6-(1,2-dicarboxyethyl)AMP - AMP-lyase (fumarate-forming) activity [Evidence IEA]" - /GO_process="GO:0009152 - purine ribonucleotide - biosynthetic process [Evidence IEA]" - /codon_start=1 - 
/gene="purB" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1063:argininosuccinate lyase/adenylosuccinate lyase - (Score: 148.3; E-value: 5.8e-45)" - /gene_kind="biosynthetic-additional" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_007389998.1" - /locus_tag="SLNWT_RS23665" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5139" - /product="adenylosuccinate lyase" - /protein_id="WP_040253465.1" - /transl_table=11 - /translation="MIPRYTRPEMAELFSDQARYETWVRVEILATEAQVRLGAVPGSAL - ADMRRAPVPLASRVAEIEKERDHEVLSFLAAYCEEIPEESARWVHLGMTSYDLVDTALG - HTLARGTDLLLDAARALRRILAERAVEHWDTVCVGRTHGVHAEPTTFGHKLAGYAFAVD - RSLTRLRAAREAVAVGTVSGSVGTYALIDPAVERHVLTALGLAAEPAPSQVVARDRHAQ - LVQAVAALGAVVEQVALEMRLLQRTEVREVEERRTGAYQGSSAMPHKRNPTTSERLVGL - ARLLRGHAGTALENVALWHERDLAHQSVERVILPDSLSVGHFQVTMATELLTHLAVFPE - RMRAHLEQTGGLVYSSAVLAELLATGTEREKAYRGVQAAANRTLAGGADFAAALAEEGI - DLGPLGPERFLGHHDVIRERLEQLRDLED" - gene 27131..27535 - /locus_tag="SLNWT_RS23670" - /old_locus_tag="SLNWT_5140" - CDS 27131..27535 - /EC_number="2.3.1.-" - /codon_start=1 - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_018383109.1" - /locus_tag="SLNWT_RS23670" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5140" - /product="GNAT family N-acetyltransferase" - /protein_id="WP_040253467.1" - /transl_table=11 - /translation="MTWKIERVPGDGLDLDEVLTVYRESGLGERRPIEDRERFAAMLRG - ANLVVVCRTEEGRLIGIARSVSDFSYVTYLSDIAVSADFQRAGIGRALIAGTQAETPGV - KIVLLSAPAAVDYYPHLGFTRHESAWVLQP" - gene complement(27621..28349) - /locus_tag="SLNWT_RS23675" - /old_locus_tag="SLNWT_5141" - CDS complement(27621..28349) - /codon_start=1 - /gene_functions="regulatory (smcogs) SMCOG1008:response - regulator (Score: 185.3; E-value: 1.9e-56)" - /gene_kind="regulatory" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_015037154.1" - /locus_tag="SLNWT_RS23675" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5141" - /product="response regulator transcription factor" - /protein_id="WP_237282926.1" - /transl_table=11 - /translation="MPSPRFAEDEGFGPTTRKVAGLPTGQRILVVDNDSDYAEALVCRL - RRHGHETTRVQQGGTALQSLEDIDLVLLDLELPDLDGLEVCGAIRSVSCLPVIIVTARG - TELDRVLGLQAGADDFLVKPYGFRELLARIDAVMRRVHQQPQRVREIQHGPLKIDASSR - EVSLDGREVGLTRKEFDLLHLLASNPDTVIPRKRLLQQVWGDSWSRRTVDTHVSSLRSK - LGDSGWIITVRGVGFKLGSA" - misc_feature complement(27756..27758) - /note="tta leucine codon, possible target for bldA - regulation" - /tool="antismash" - gene complement(28640..29536) - /locus_tag="SLNWT_RS23680" - /old_locus_tag="SLNWT_5142" - CDS complement(28640..29536) - /GO_function="GO:0003677 - DNA binding [Evidence IEA]; - GO:0003700 - DNA-binding transcription factor activity - [Evidence IEA]; GO:0016987 - sigma factor activity - [Evidence IEA]" - /GO_process="GO:0006352 - DNA-templated transcription, - initiation [Evidence IEA]; GO:0006355 - regulation of - transcription, DNA-templated [Evidence IEA]" - /codon_start=1 - /gene_functions="regulatory (smcogs) SMCOG1032:RNA - polymerase, sigma-24 subunit, ECF subfamily (Score: 117.4; - E-value: 8.6e-36)" - /gene_kind="regulatory" - /inference="COORDINATES: similar to AA - 
sequence:RefSeq:WP_018088855.1" - /locus_tag="SLNWT_RS23680" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5142" - /product="sigma-70 family RNA polymerase sigma factor" - /protein_id="WP_040253470.1" - /transl_table=11 - /translation="MDKGEWPALAEKFESQRPHLRAVAYRMLGSVAEADDAVQETWLRL - SRSEAGEIGNLGGWLTTVAGRICLDMLRSRSSRREDPLGDHLPEHGPRDQAAAPTDPAH - EAQLVDSVGLALLVVLDTLDPAERIAFVLHDMFSVPFGEIAPIVGRTPVAARQLASRAR - RRVQAVDTSPDSDLPRQRAVVDAFLAAARGGEFEALLALLDPDVVLRVDAAATPAGAPM - EIVGAQPVAAQAGLYSGRAHLARTALVDGRLGLATAAPRQLSVVMDFTVSEGRITAMNI - IADPTRLAGLDVAILSA" - gene 29994..31013 - /locus_tag="SLNWT_RS23685" - /old_locus_tag="SLNWT_5143" - CDS 29994..31013 - /codon_start=1 - /inference="COORDINATES: ab initio prediction:GeneMarkS-2+" - /locus_tag="SLNWT_RS23685" - /note="Derived by automated computational analysis using - gene prediction method: GeneMarkS-2+." - /old_locus_tag="SLNWT_5143" - /product="ParB N-terminal domain-containing protein" - /protein_id="WP_159393028.1" - /transl_table=11 - /translation="MSLAEQLTYPAVDLDEIESSAIWIESHPITRVRIDSLVFEGSPRL - GGEDHDHVRVLAEAGDSLPAITVHRPTLRVIDGTHRVRAALLNGRTEIAARMLDCDEAA - AFVLSVKANVTHGLPLSRQERAAAAARIIMTHPQWSDRAVAAATGISDKTVSRIRSQSG - ADSAQSATRLGRDGRLRPLDSGQRRRRAAAMFLDRPDAGLREVARATGLSPATVRDVRQ - RIDRGEDPVPGRYRTAESPGGATAARQRPAAGRLDRRTVVVDRQRLLAKLSEDPSLRLN - EAGRRALRWLHHYSVDGNGIETLGQGLPCHWAPDVADLARSCAAAWAELAEQLQQRAE" - gene 31680..32846 - /locus_tag="SLNWT_RS23690" - /old_locus_tag="SLNWT_5145" - CDS 31680..32846 - /codon_start=1 - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_018563740.1" - /locus_tag="SLNWT_RS23690" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5145" - /product="inositol-3-phosphate synthase" - /protein_id="WP_052482559.1" - /transl_table=11 - /translation="MSQHPEKAGPPGAPASGPGTGVWFIGARGSVATTAVTGAAALAAG - LQPPTGLVTEAPEFAGSGLPALSSLVFGGHDTADWPLPKRAEALAEGGVLPRGLAAAVQ - RELAAADEEIRPGGPLPGDRRGDEELIADFAADIADFTRRTGVARTVVVNLASTEPLPE - PNSARLPASSLYAAAALRAGAAYVNFTPSAGLHHPALAEAAASARVPYAGRDGKTGQTL - LRSVLAPMFRQRALDVRAWSGTNLLGGGDGAALADPAAAEAKNAGKNRVLEDTLGALPE - GEVHIDEVPALGEWKTAWDHVAFEGFLGSRMILQTIWQGCDSALAAPLVLDLARLAARA - QEAGLTGQLPALGFYFKDPDGGSSALAEQYAALLAFAARLGARPAEAS" - gene 32843..33769 - /locus_tag="SLNWT_RS23695" - /old_locus_tag="SLNWT_5146" - CDS 32843..33769 - /codon_start=1 - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_014049484.1" - /locus_tag="SLNWT_RS23695" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5146" - /product="UbiA family prenyltransferase" - /protein_id="WP_040253473.1" - /transl_table=11 - /translation="MSTPRDWAELLRVSALLSVPGDALAGAAASRRRPNSRTALALCSS - LCLYEAGMALNDWADRAEDAEERPHRPLPSGRIAPGAALAAAAGLTAAGLGLAARAGRP - AALCATALAGAVWAYDLRLKHTAAGPAAMAAARGLDLVLGALATAGPRSGEAAGSVLGR - ALPPAAVLGAHTWAVTAVSRAETQGGSAGRPLAALGTTAALGTLLAPAGARPLRLERAR - RLPETPRELAQAALAGAYAATAGRSYLHAALNPSPPLTQRAVGGGIRAMIPLQAALAAR - SGALATAASLGALVPLARSLARKVSPT" - gene 33766..34713 - /locus_tag="SLNWT_RS23700" - /old_locus_tag="SLNWT_5147" - CDS 33766..34713 - /codon_start=1 - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_016823815.1" - /locus_tag="SLNWT_RS23700" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5147" - /product="sugar phosphate isomerase/epimerase" - /protein_id="WP_078845184.1" - /transl_table=11 - /translation="MSIRLGYGTNGLTDLRLREALTLLAELGYQGVGLTLDHMHLDPLA - RGLSGRAKALARTLGALGLDVTVETGARYVLDPRRKHGPSLLDPDPEARVAREALLVTA - VEVAAELGAHAVHCFSGVRPEGTDEGTAWQRLADSLGPVLDAAQRDGIPLALEPEPGHL - VESLADFHRLRALLGDPELLGLTLDIGHCQCLEPASPAECVTAAAPWLRHVQIEDMRRG - VHEHLPFGEGEIDFPPVLAALEASGYRGLTVVELPRHSHAGPELARRSMEFLRPLVAAA - AREDRAAGAPSPVRARPVPLLTGPPLRQEAPSRT" - gene 34723..35409 - /locus_tag="SLNWT_RS23705" - /old_locus_tag="SLNWT_5148" - CDS 34723..35409 - /codon_start=1 - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_018851358.1" - /locus_tag="SLNWT_RS23705" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5148" - /product="EboA domain-containing protein" - /protein_id="WP_186095464.1" - /transl_table=11 - /translation="MPITPITPEEPRPAPEPADGTEAELRREAAELRERLSAEGADWLD - GALAEAARAAAEPAPAESRAVPGWELRFAAAGRACGTEAAESARVLLLRAARPGPAALT - RLYRHGTGEERRAVLRALPRLPLAPGEGLPLVEDALRTNDTRLVAAAVGPYAAAHLDDH - AWRHAVLKCLFTQVPVRALARLPERARGDAELARMLRDFAAERTAAGRAVPADLDHVLA - LTAKDA" - gene 35409..36257 - /locus_tag="SLNWT_RS23710" - /old_locus_tag="SLNWT_5149" - CDS 35409..36257 - /GO_function="GO:0016788 - hydrolase activity, acting on - ester bonds [Evidence IEA]" - /codon_start=1 - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_016327783.1" - /locus_tag="SLNWT_RS23710" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5149" - /product="TatD family hydrolase" - /protein_id="WP_040253475.1" - /transl_table=11 - /translation="MRIFDPHIHMTSRTTDDYEAMYAAGVRALVEPAFWLGQPRTSPES - FFDYFDALLGWEPFRAAQYGIAHHCTLALNPKEANDPRCLPVLDALPRYLVKDHVVAVG - EIGYDAMTPAEDTALAAQLELAAEHGLPALVHTPHRDKLTGLRRTLDVVAESKLPTERV - LIDHLNETTVKEARESGSWLGFSVYPDTKMDEHRMVALLKEYGPERVLVNSAADWGKSD - PLKTRKVGEAMLAAGFGEDEVHRVLWENPVAFYGLSGRLDLEVPGTEALHEGNSLLRGG - E" - gene 36261..37430 - /gene="eboE" - /locus_tag="SLNWT_RS23715" - /old_locus_tag="SLNWT_5150" - CDS 36261..37430 - /codon_start=1 - /gene="eboE" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_003972400.1" - /locus_tag="SLNWT_RS23715" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5150" - /product="metabolite traffic protein EboE" - /protein_id="WP_040253477.1" - /transl_table=11 - /translation="MRFRHPDGSLVHLAYCTNVHPAEDLDGVLAQLGAYCEPVRRRLGT - ERLGIGLWLARDAARALTTEASALRRLRTELDRRGLEVVTLNGFPYRGFGAEKVKYRVY - QPDWRDAERLEYTAELAGLLAELLPPDVTEGTLSTLPLAWRSDFDAAGAAAAERQLTEL - ARRLDDLEERTGRSIRVALEPEPGCAVERTADALAPLAALPAHRFGLCLDTCHLATCFE - EPAAALAALERAGATVPKVQLSAALHAEDPADPAVRAALAAFDEPRFLHQTRALAEGVL - HGTDDLGPALAGGTLPETVPWRAHFHVPLHAPPAPPLTSTMDVLRGSLDVLLGQDAPRS - RHFEVETYTWQALPPEARPADAAQLADGIAAELALARGLFRDLGLKELP" - gene 37427..38827 - /locus_tag="SLNWT_RS23720" - /old_locus_tag="SLNWT_5151" - CDS 37427..38827 - /codon_start=1 - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_020125660.1" - /locus_tag="SLNWT_RS23720" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5151" - /product="alkaline phosphatase family protein" - /protein_id="WP_040253479.1" - /transl_table=11 - /translation="MTATPTPLLVLDVVGLTPALLEQMPRLKSLARKGSSAGLGTVLPA - VTCAAQSTFLTGAPPAEHGIVGNGWYFRELGEVLLWRQHNGLVAGDKLWDAARRAHPGY - TVANVCWWYAMGADTDWTVTPRPVYYADGRKEPDCYTRPVELHDELTDALGTFPLFHFW - GPGADLVSSRWIIDATRHLNRTRHPDLTLCYLPHLDYDLQRFGPRDPRSLRAAAELDAA - LGPLLDEAEAEGRTVVVLSEYGITEVSRPVDINRALRRAGLLEVHTQDGMEYLDPMASR - AFAVADHQLAHVYVRRPEDLARVREVLEGLDGVAELLGDEGKKAHGLDHPRAGELVALA - APEAWFTYYYWLDDERAPDFAQLVEIHRKPGYDPAELFLDPLDPYVKLRAAGALARKKL - GMRYRMAVVPLDPAPVRGSHGRLPARPEDGPVLLCSRPGALPGEVAATEVKSLLLGLAG - LAEVPATG" - gene complement(38832..39386) - /locus_tag="SLNWT_RS23725" - /old_locus_tag="SLNWT_5153" - CDS complement(38832..39386) - /codon_start=1 - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1111:GCN5-related N-acetyltransferase (Score: 146.6; - E-value: 1.2e-44)" - /gene_kind="biosynthetic-additional" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_018549427.1" - /locus_tag="SLNWT_RS23725" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5153" - /product="GNAT family N-acetyltransferase" - /protein_id="WP_040253481.1" - /transl_table=11 - /translation="MYAVPLAEDAALRPLEPWQAEEFLAHMDRARPHTDPWIPWASRST - DLDSARATLQDYADKQAADTGRLYGIWRAGTLVGGVMFVHFDTRLGNCEIGVWTEPAGE - GHGLITAAVRHLIDYAFAERGMHRVEWFSSTRNARSRAVAQRVGMQLDGTLREYFPNRG - FRHDKEVWSLLAPEWPGAAAV" - gene 39465..40115 - /locus_tag="SLNWT_RS23730" - /old_locus_tag="SLNWT_5152" - CDS 39465..40115 - /codon_start=1 - /gene_functions="regulatory (smcogs) SMCOG1057:TetR family - transcriptional regulator (Score: 120.6; E-value: 1.8e-36)" - /gene_kind="regulatory" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_016328168.1" - /locus_tag="SLNWT_RS23730" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5152" - /product="TetR family transcriptional regulator C-terminal - domain-containing protein" - /protein_id="WP_163011131.1" - /transl_table=11 - /translation="MPPARGDHEARRREVSEAVWQVLAARGFGGLTLRAVAAQMGATTG - LLTHYFPGKRALLAHALDVLDRRSAERPRPAAEEAGEAAGLVMLRAMLLDILPLDAASA - ASNRIWVGSWDAALTDPELAEEHAARYRRARARMTGYVADAQRLGELPAGPAAEEIAAA - AQSFVLGLVVQALFAPGEFPPERQVALLDAHLAKAAAGADRAPGTPPVPAGES" - gene complement(40161..41249) - /locus_tag="SLNWT_RS23735" - /old_locus_tag="SLNWT_5154" - CDS complement(40161..41249) - /codon_start=1 - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1042:O-methyltransferase (Score: 297.1; E-value: - 2.7e-90)" - /gene_functions="biosynthetic-additional (t2pks) MET - (Score: 268.6; E-value: 1.8e-82)" - /gene_kind="biosynthetic-additional" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_018383099.1" - /locus_tag="SLNWT_RS23735" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5154" - /product="hydroxyneurosporene methyltransferase" - /protein_id="WP_078845185.1" - /transl_table=11 - /translation="MPKLPPAKVVRAVEGVRAGLVKLTRLLAPPPFALLELSQGSMVTQ - ALYVAAELKVADELKDGPLTAAQLAQRVGADPESLHRLLRLLATYSVFEERADGSFKLK - PMGQALRSDTPQSMRATVLLMGHPTHWEEWAHLVDAVRTGEASLPKLRGMGAFEFIDAN - PEYGEIFTAGMGAMSETETLPLLAAYDFRRFRTIVDYGAGRGGLLAAALQQAKDARGVL - FDARIDTNGAADYLREQGVADRCTLEKGGLFDPAPAGGDAYLLKHIVHDWPEEQVIEIL - RNVRKVIDPDGRILLMEFVTPDDKPNKPHPAKLVDLWLMLLVGGKERSEKQYAEVLAAG - GFRLEKITETAAPISVIEARPV" - gene 41716..42792 - /locus_tag="SLNWT_RS23740" - /old_locus_tag="SLNWT_5156" - CDS 41716..42792 - /codon_start=1 - /inference="COORDINATES: protein motif:HMM:NF033206.1" - /locus_tag="SLNWT_RS23740" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5156" - /product="ScyD/ScyE family protein" - /protein_id="WP_159393029.1" - /transl_table=11 - /translation="MSRAHKPWAGALLAAAVVAGLTATAAPSQAAHRAGPEVLATNLNN - PRDITLQADGSILVAESGSGPATACAPGTSCLGFTGSIYRVNGSQKGRVVTGLPSKLEV - RADGGASVAGPNQVEARTGGYTVSSSFGGDAADRKALGAGGETLGTLHIAKGKVLGDLV - DHETRLDPDGPLGNNDVHSNAWMFAHHGKDYLVTDAGGNDLIRVLPDGTTKTEFVFPNN - GENETVPTGIVAAPDGSFYISDLSGQAAGKSRIWRYVPGSAPKVFATGLTNVTDLALDG - KGGLIALTLTKGYTETGPLPGALNRVDLKSGKATEIPTADRLVNSLGLAVGKGGEIYVT - NKTVGTTGELLKFPAARR" - gene 43304..43888 - /locus_tag="SLNWT_RS37105" - /old_locus_tag="SLNWT_5157" - CDS 43304..43888 - /codon_start=1 - /inference="COORDINATES: protein motif:HMM:NF019498.2" - /locus_tag="SLNWT_RS37105" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." - /old_locus_tag="SLNWT_5157" - /product="cupin domain-containing protein" - /protein_id="WP_040253485.1" - /transl_table=11 - /translation="MTKIILPEDRPAGRRGFEIVLPSSLTDGAASLVEAHVSEAMSGPP - LHTHAESDETYFVLGGALIMIIDGKLTELRAGGLAHISKDTSHTWATRPDEGAHFLTLH - LPGGYELYHPTALHAEHEKGGPLEQKDLFELAARFDWRLAGPPEPHRLTPTGVLVPAGK - ADAEAEATKALATAEYERALAASIEAADSGS" - gene 43945..45807 - /locus_tag="SLNWT_RS23750" - /old_locus_tag="SLNWT_5158" - CDS 43945..45807 - /codon_start=1 - /gene_functions="transport (smcogs) SMCOG1005:Drug - resistance transporter, EmrB/QacA (Score: 389.3; E-value: - 3.1e-118)" - /gene_kind="transport" - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_018383102.1" - /locus_tag="SLNWT_RS23750" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5158" - /product="MFS transporter" - /protein_id="WP_063778692.1" - /transl_table=11 - /translation="MSGPGSGGPGTAAVPGAAPPGAAGAPDPRRWFALVVILVAGFMDL - LDVTIVNVVLPSVLADLDAAYTHGEWIVAGYVLGFAALMITGGRLGDILGRRKVFLAGV - AGFTAASLLCGLADGPGALIAARFLQGAMAGLMVPQILAIIHVTFPAEERGKVLGIWGG - VLGAASAAGLVAGGLLAEADPYGLGWRAVFLVNVPVGAAALLAAWFLVPDSRAPERPRL - DPLGALLSAAGILLLVYPLTEGRGLGWPPWTFLLMGAAVLVLGLFVLQQRGRTRADNSP - LMSLRLFRARAFSAGMAVWALFWIALGGFFFIWTLYMQVGLGWPPLRAGLTSSAFAVGC - AAGSGTAVEFFTPRFGRKALLAGALLCGTGFLGYVLVAAHYGPAVAPWQMVAPLLVAGI - GFGLVVAPMIDAVLTEVPVREAGSASGVLGTVQQIGIALGTALAGVLFFQQLDHDAARA - VARAAPALRQELTRAEVPAAERERILDAFADCLADRAAATDPTAEPASCRGPLPSPEVR - ALVIGAGQRATADNFSRTFALTLRWGAGSMGLVFLGLFALPRRVEFRGLDGGGPGPGSG - PSVPGASEGGAAVGPGAGPASGPGKERSAPARSGGQDAGTHPAG" - gene 46203..46688 - /locus_tag="SLNWT_RS23755" - /old_locus_tag="SLNWT_5160" - CDS 46203..46688 - /codon_start=1 - /inference="COORDINATES: similar to AA - sequence:RefSeq:WP_019359898.1" - /locus_tag="SLNWT_RS23755" - /note="Derived by automated computational analysis using - gene prediction method: Protein Homology." 
- /old_locus_tag="SLNWT_5160" - /product="phospholipase" - /protein_id="WP_040253488.1" - /transl_table=11 - /translation="MRRRHVLPLAAAALAMPAALLSTGSASAAPADKPQVLSSFTQTSA - SSYNAWNAARNNQGQWAAYGFDWSTDYCSTSPDNPFGFPFETACARHDFGYRNYKAMGT - FSANKARIDSALYEDLKRVCSRYSGATKTSCDGLAWTYYHAVDIFGIKGFKQLDKAA" -ORIGIN - 1 atgagcaccg tcagggaccc gggtccgctc gccgctcccg tccgtctcgc gccgcgggcg - 61 accgccctgc gggagaccga ggcgctgtgc tcgatgccgg tgagcgccga agcggtcccc - 121 ctgctgcggc ggttcgccag ggacacctcc cggcagtggg acctccccgg cagcgcccag - 181 gaagcggcct gcgtcatcgt caccgaactc gtcaccaacg tcctgctgca cagcggcagc - 241 cgggacgtca ccctgcggat cgtgctcagc gacttcgccc tgaccgtcca tgtcgacgac - 301 gagggccgct ggaagcaccg ccctgccgcc cgcctcgcca ccgaggacgc gggcgcgcgc - 361 tgcggccggg gcctgcaact cgtcgacgcc tacgcggtcg cctgcgatgt ggaccgtacg - 421 gagcgcggga cccgggtgcg ggccgagatc gcggtcgcgg cggcctgagc cccgtacctc - 481 cccggcttcc gcgggccggc cgacggcctc aggccgcctg ggacttgagc ccgtccagca - 541 tgatgtcgat gtagcggcgc cagtccccgc tgcggcggtg cacgatcgag gtcagcccgc - 601 aggtgagcga gaggatgtcc acgctcgcca tgtcctggcg gatgctgccg ccctcctggc - 661 ccttgccgat cagcgccatg agttccgctt cgaggtcctc ccgcagcggg ctgcgcgggc - 721 cctccgagcc gaggctgccc tcggtgacgg cggtggcgaa cccccggtcg cgggactcca - 781 cttcggcgat ccgggtgagc agcagatgca gggcctggag cggctcggcg gagtcgcggc - 841 agaccgtgcg gtagtaggtc aggatctccc cgaagcgctg ctggcccgcg gcgatgacca - 901 tggcctcctt ggtggggaag tgccggtaga gggtgccgat gccgacctcg gcccggcggg - 961 ccacctcgtc catggacacc tcggcgccgc gctccgcgaa gagctcccgc gcggcgttga - 1021 gcacgcgggc ccggttgcgc tcggcgtccg cgcggagccg gggacgggtg ctctgcgcct - 1081 tctcggcgcc ggtcgtcttc tcgctgcctg ccgccatgcg gaacctcctt ccggttgact - 1141 ctactatgcc ccctccgggc ccctcggcgg agcgggcaat cggccaactt gcacacccgg - 1201 cggacgattt ggggtggttg ggtgatcaac cgcgggccgc cgggcggtgg ttgacacccc - 1261 ttcgcgctct cgcctgtact gaaatatcgg aagcggagtc cgattcccgt accggtggcc - 1321 cgagtcggcg ccgccggtac cggtcgcacc cggcggcccg tccgcggcgg caggaccgga - 1381 caggggaacc aagggaacag ggaaggacgt 
acacgatgtc gatgtcccgg gaacgggcga - 1441 gcgcgccgcg ggtgacgccc tcggtggagg ccttcctcgc cgagccgcac ctggccaccc - 1501 tgaccacgct ccgccccgac ggcaccccgc atgtggtcgc cgtccgcttc acctgggacg - 1561 cgcggtcggg gctcgcccgg gtgatgaccg tgcgcgactc ccgcaaggtg cgcaatgtgc - 1621 tcgcggcgcc gggcggccgg gccgcgctct gccaggtcgc cgggttcaaa tgggtcaccc - 1681 tggagggcgc cgccaccgtg tccgaggacc ccgtacgggt caccgagggc gcccgccgct - 1741 acgccgcccg ctacctctcg ccgccgccca atccgccggg ccgggtcgtg gtcgagatcg - 1801 ccgtggaccg ggtgatgagc ctcaacagct gagcgggggc gggcacttcg gccgccgtgc - 1861 gcggatccgt acgcgaggtg tgagcgcgta cggatccgtg cgggacgtag cggtacgcgg - 1921 aggaagcggg gcgcccgggc ggcgccccgc ttcccgtgtg ccgggggagg aggcgcgggc - 1981 ccgcccccgg cggacgggcc cgcgccggag cgctacctgc ccccgccgcc cggcggggtg - 2041 ccgtgcttcc acatcaggcg gaagctcagc gcggacagcc gccagccctc gggggtcctg - 2101 cgggcgcggc cgtccacgaa ggtgccggtc cggaagagcg ggcccagctc cgcggcgttc - 2161 tccggccggt ggacgtgggt cgaggtgcag ttggcgcgca gccgggccgt gtcgcccccg - 2221 ccctcgatct cgacgaaggc gtgggtgccc atgtgctggg tacaggtgaa ggcgtccagg - 2281 gtgcgctggt ggaaggcgcc catgcccgcg gcgccctggt ggccgccgac cgggaaggtg - 2341 accgaggcgt cctcggtgaa caggctccgc gtccagtcgt cgtccagctt ctcgtcgtcc - 2401 agggtgatca ggtaccggtc caggagtccc gcgatttcgg cggtcgattc gcttggcgtc - 2461 atacctgaag gattgcccgc cattcgtggc ctgccaggct tcctgtcacg gatctgacgt - 2521 tcctgtcgaa ggcctgtagt agccacccca aggcctgtac ttgacgactg tttacccctt - 2581 gccgcattcc tgggaagaat gaggcaacac cgtcgggaga gggcagatgg aaaactttga - 2641 cgcggacgtg atcattgtcg gtgccggtcc cacaggactg atgctcgccg gggaactcgg - 2701 gctccacgga atttcggccc tcgcggtcga caggctcgaa gaaccgatcc agcagtcccg - 2761 cgccctcggt ttctccgcgc ggaccatcga ggaattcggc cagcgcggac tcctcgcccg - 2821 tttcggtcag gtcgacgtca tcccgttcgg gcatttcggc ggagtgccgc tcgatttcca - 2881 gatcgtcgag ggcggttcct acggggcccg cggaattccg cagtcgcgca ccgagggcgt - 2941 cctcgccggg tgggcccgcg agaagggcgc cgagatccgc cgcggcgtcg aggtcaccgg - 3001 cctcgacgac gacggcgagg gcgtcaccct ccaggtgcgc accggcgagg 
gcgagtcccg - 3061 gctgcgcggc cggtacgtgg tcggctgcga cggcgcccgc agcgtcgtcc gcaaggccgc - 3121 cgggatcggc ttcccgggca gcgaggcgga gatcgagctg cgcttcgcgg acatctccgg - 3181 gatccagctg cgcccgcggt tcatcggcga gaaggtcccc ggcggcatgg tgatggtgct - 3241 gccgctcggg cccgaccgca gccgcatcat ctacttcgac cgtacgcagc cgctgcgcga - 3301 gtcggccgag ccgatcacct tcgaggaggc ctccgaggcc ttccagcggc tgtgcggcga - 3361 ggacatcagc ggcgccaccc cgcactgggt cagctccacc accgacgtca gccgccaggc - 3421 ggaggcctac cgcagcggcc gggtcttcgt cgcgggcgac gccgcccaca tccatctgcc - 3481 gatcggcgcc cagggtatga gcgccgggat ccaggacgcg gtcaacctcg gctggaagct - 3541 cgctctggac ctgaagggca gggcgcccga ggggctgctc gacacctacc acgaggagcg - 3601 gcacccggtc ggccgccgca tcctcgtcaa caccctcgcc cagcgcagcc tctacctcgg - 3661 cggcgaggag atgaagccgc tggtcgacgt gatgggcgag ctggccgggt acgaggtggt - 3721 ccgcaagcac ctggtcggca tggtcaccgg cctcgacatc cggcactcca ccgtccccgg - 3781 cgagcacccg ctgctcggcc gccgcctgcc cgaccgcgag ctggccgtcg gcggcgagaa - 3841 gaccaccgtc ttcgccctgc tcaccgaggg ccggggcgtc ctgctcgacc tctccggcag - 3901 cgccgaggcc cgcaaggcgg ccgagggcca cgccggccgc gtcgaggtcg tcaccgccga - 3961 aagccacggc atcggcgccg agttggacgc cctgctggtg cgccccgacg gctatgtcgc - 4021 ctgggtcgcc cccgcgggct cgggcgccga ggggctcctg gaggccctcg accactggtt - 4081 cggcgccgcc gactgagccg cccggggccc cgccccgcca cgtaccccct gctctcccac - 4141 cctccgagaa ggaagcgacg acagcatgcc caagatctcc accgaagacg gctacctgac - 4201 cgtgctcaac ctcttcaccg cggacgcccc cgagaagcag gagaagctgc tcggtgagat - 4261 gcgcaagatc gtcgacgccg ccacctacga gggctggatc tccagcaccg tgcacgcggg - 4321 cgtcgaccag ccgggcaccg cgaacttcat ccagtggcgc agcggcgagg acctcgaaaa - 4381 gcggtacgcg ggcgaggagt tcaagcaccg cacgctgccg gtcttcggcg agatgaccac - 4441 ctcgatccgg ctgctgcaga acgacatcgt ctacacccag cgcgccccgg agctgaacgg - 4501 cgtcaccgag atctccccgg accgcgacga ctacaccgtc atcacggtct tcggggtgga - 4561 gaaggagaac caggacgcgc tcgtcgaggc gctctcccag gaccacttcc tgaaggtcga - 4621 cggctaccgc tcgcactccg tcctcaaggg ccgggccgcc cgcggcctcg aaggctcctt - 4681 cgtggtcgcc 
tactcccagt gggcgagcaa ggaggcctac gacgccttca actcccagcc - 4741 ggagggcgag cgttcggccg agcgcaagga ggccgaggcc accgtccgct cgctgatcac - 4801 ctcggtggac tccaacacct accgggtcgt gcacacccgc gccgcgggcg agtgacccac - 4861 cggcccggcc cgggagttcc gggccggcca gccgcggcga cgcccggccc ccgacggggc - 4921 cgggcgttcg ccgtcgttcc gcaccgaagg cccgggccgg acgccgcccg gccccaactg - 4981 ccgtcatctc aacggggaga agacatgttc acgcgcagaa ccgcactccg ctccggcgcc - 5041 gccctcaccg gcaccctcgg cgccgccggg ctcgccgtac cgctgctcgg cggcaccgag - 5101 gccggggccg ccgcgcccgg ggaggccgcc gggcaggccg gggccggggc cgccggcttc - 5161 gacgtctcgg cgctggtgaa gttcacccgg ccgctgcccg cgctgcccgt gctgagcccg - 5221 cgccgccgca ccgcccgcgc ggagacgtac gaactgcgcc agcgggagac ggagtgcgag - 5281 atcgtgccgg gcctgaagac ccgggtgcgg accttcgacg gctgcttcgc cccgccggtg - 5341 atcaaggcgg tacggggccg ccgcaccgtg atccggcagg tcaacgagct gaccgtgccg - 5401 acctcgatcc atctgcacgg cgggcatgtg cccgagtcca gcgacggcgg gccgatggac - 5461 ctggtccagc cgggcgcgag ccgcacgtac acgtacccca acgagcaggc gcacgccaac - 5521 ctctggttcc acgaccacgc ccaccaccag gagtccgaga ccgtcttccg cgggctgacc - 5581 ggccttatct gctcaccgac gagaccgagc agcggctgcc gctgccctcg ggcgcctacg - 5641 acgtgccgat cgcgatccgc gacatccgcc tcgacgaggc cgggcagatc gtctacgcca - 5701 tgaacgacgg caaggaccgc aacctgatgc tggccaacgg cgtcgcctat ccgtatctcg - 5761 ccgtcgccgc ccgcaagtac cgcttccgga tcgtcaacac ctccaatctg cgcaccctcg - 5821 acctgcggct ctccgacggc tcctcctatg tgcagatcgg ctccgacggc ggactgctcg - 5881 cccggccctt caccacctcc tcgctcaccc tctcgtccgg tgaacgcgcc gatatcgtgg - 5941 tcgacttcgc gcggtacgcg gccggcacca ggctcgtcct gaagaacgcg gtggccagcc - 6001 cgcccgggcc cgaggaccag atcggcgacc tcctcgaatt ccgggtcggc gacagggccg - 6061 aggaccgcag ccggatcccg gacaccctgc ggtcgctgcc gccgctcccg ccgccggacc - 6121 gcacccggga gatcgagctc ctgatgggcg cggacggcac tggtctgatc gacggcaagg - 6181 cctaccagga agggcgcgtc gacgcccaga tccccttcgg ctccaccgag ttgtggtcca - 6241 tccgcaacgc caacgaccgc ggcagccaca acttccatgt gcacctggtg cagttcaggg - 6301 tggtggagcg caacggccag ccggtgacgg 
ccggtccgga gagcggcctg aaggacaccg - 6361 tccggctcgc cccgggggag acggtcaagg tgcaggccac cttcggcggc taccgggggg - 6421 acttcgtcta ccactgccac atgatcgacc acgcggccat ggggatgatg gccaccatgc - 6481 gggtcggctg agcgggcggg gccgcgccgc tccgagccct ggcgccacgg gggcgtgccg - 6541 gtgtaccggt acgcccctgg gccatgcccg gaaaccggcg cgcaccccgg cgcccgtacc - 6601 ggcccgggcg ccccggctgt cccggcacca ccccgcgcac ccgctcgcgc ccccgcccca - 6661 gccgcctccc gggtggcgtc cggtcacttc cctgacccgt ccgtgccgct tcctgacgtt - 6721 cgcctggcgg tcctctgaca ttgcgggggc ggctctgcgg tacctgacga ttccgtaccg - 6781 agaaatgcac aagggcgcct tgtaggacgc gggctttgga agaaccattt accacaccgg - 6841 gcgatgtcac cggggggcgg cctccggtaa ggcacttccc cgccactcct tttcaccgag - 6901 tgccggaaaa gtgcctgcgg cgggccgcag aacaccgccg agctcccatg ggcggccgaa - 6961 tggattcgtg aatgcaattc ccgggccggt ttgtgtctcc ggcgcggggg cggcgctttc - 7021 gcgggcgcag ccgagtgccg cacagaccgc aactgccaag gagcgagaag atatgcacag - 7081 cacgctgatc gtcgcccgga tggacctcgg ttcgagcaag gacgtggccg ggctcttcgg - 7141 cgaattcgac gccaccgaaa tgccgcaccg catggggacg cggcgccgcc agctcttcgc - 7201 gtacaagggc ctgtacttcc acctccagga cttcgacgag gacaacggcg gtgagcgcat - 7261 cgaggaggcc aagaccgacc cgcgcttcat cggcatcagc caggacctca agcccttcat - 7321 cgaggcctac gaccccgcca cctggcgctc cccggccgac gcgatggccc agcgcttcta - 7381 cacctgggag gcgtgaggtg cccgggcgca gagtcgtgat caccgggatg gaggtcctcg - 7441 cccccggtgg tgtcggcacc aagaacttct ggagcctgct cagcgagggc cgcaccgcca - 7501 cccgcggcat caccttcttc gatcccgcgc ccttccgctc ccgggtcgcc gccgagatcg - 7561 acttcgaccc gtacgcgcac gggctgagcc cgcacgaggt gcgccgcatg gaccgcgccg - 7621 cccagctggc cgtggtcgcc gcccgcggcg ccctcgccga cagcggcctg gagaccgcgg - 7681 ccctggagcc gcaccgcacc ggcgtcaccg tcggcagcgc ggtcggcgcc accatgggcc - 7741 tggacgagga gtaccgggtg gtcagcgacg gcggccggct cgacctggtc gaccacgcct - 7801 acgcggtgcc gcacctctac aaccacctgg tgcccagctc cttcgccgcc gaggtcgcct - 7861 gggcggtggg cgccgagggc cccagcaccg tggtctccac cggctgcacc tcgggcatcg - 7921 acgccctcgg ctacgccctg gaactggtcc gcgagggctc ggtggacgtg 
atggtcgccg - 7981 gggcctccga cgcccccatc tcgcccatca ccatggcctg cttcgacgcc atcaaggcca - 8041 ccaccccgcg ccacgacgac ccggagcacg cctcgcggcc cttcgacggc acccgcaacg - 8101 gcttcgtgct cggcgagggc agcgccttct tcgtcctgga ggagtgggag tcggcccgcc - 8161 gccgcggcgc gcacgtctac gccgaactcg cgggctacgc cacccgctcc aacgcgtacc - 8221 acatgaccgg actgcgcacc gacggcgcgg agatggccga ggcgatccgg ctcgccctcg - 8281 acgaggcgcg gctcgccccg gaggccatcg actacgtcaa cgcgcacggc tccggcacca - 8341 agcagaacga ccggcacgag acggccgcct tcaagaagag cctcggcgcg cacgcctacg - 8401 cgaccccggt cagctccatc aagtcgatgg tgggccactc cctcggcgcg atcggctcca - 8461 tcgagatcgc cgcctcggcg ctcgcgatgg agcaccacac ggtgccgccg accgccaacc - 8521 tcaccacccc cgacccggag tgcgacctcg actacgtccc cctgcacgcc cgcgagcagc - 8581 gcaccgacgc ggtgctctcg gtcggcagcg gattcggcgg cttccagagc gcgatggtgc - 8641 tcgcccgccc ggagaggagc ccggcatgag cgcaccggcg gtcatcacgg gaatcggtgt - 8701 cgccgcaccc aacggcctgg gcctgcgcga ctactgggcc gccaccctcg gcggcaagag - 8761 cggcatcgcc cgcctcaccc acttcgaccc ctccggctat ccggcccaac tcgcgggcga - 8821 ggtacccggg ttcgtcgccg aggaccacct gccgagcagg ctgatcccgc agaccgaccg - 8881 gatgacccgg atggcgctcg cggcggccga ctgggcgctg gccgacgcgg gcatcacccc - 8941 cgccgaactg ccctccttcg acatgggcgt ggtcaccgcc agctcctccg gcggcttcga - 9001 gttcggccag ggcgagctgc gcaaactctg gagccagggc agccagttcg tctccgcgta - 9061 ccagtccttc gcctggttct acgcggtcaa cagcggccag atctccatcc gcaacggcat - 9121 gaagggcccg agcggggtgg tggtcagcga ccaggccggc gggctcgacg ccctcgccca - 9181 ggcgcggcgg cagatccgcc ggggcacccc gctgatcgtc accggcgcgg tcgacgcctc - 9241 gctctgcccc tggggctggg tggcgcagct ctccggcggc cggatgtcca ccagcgccga - 9301 ggcggcccgc gcctatctgc ccttcgaccg ggaggcccgc ggctatgtgc ccggcgaggg - 9361 cggcgccatc ctgatcatgg aggacgccga ggcggcccgc gcccgcgggg cccgggtgca - 9421 cggccggatc ctcggctacg gcgccacctt cgacccgagg ccgggcagcg gacgcccgcc - 9481 cgcccttcgc cgggccgcgc agacggcgct cgcggacgcg ggcgtggacg ccgccgacat - 9541 cgacgtggtc ttcgcggacg ccgcgggcga accggccgcc gaccgcgccg aggccgaggt - 9601 gctcaccgcg 
ctcttcggga tccgcggcgt cccggtgacc gcgccgaaga ccatgaccgg - 9661 gcggctgtac tcgggggccg cgccgctgga cgtcaccgcg gccctgctcg ccctgcgcga - 9721 ccaggtgatc ccgccgaccg tgcatgtgga gccctgcccc gagtacgggc tcgacctcgt - 9781 cctcgcccag ccgcgccccg cgaagctgcg caccgcgctg gtcctcgccc gcgggcacgg - 9841 cggcttcaac tccgcgctcg tggtccgcgg tcccgagtga accaccctgc cccgccgcgc - 9901 agttgagtgc gcgtcagctc cccgtccccg cgccgccccg ctcgccccgt gacatcccga - 9961 tggaaggaca ccccatggcc accgccgcgt tcaccctcga cgacctgaag cggatcctgc - 10021 tgcaatccgc cggcgccgcc gagggcgtcg acctggacgg cgagatcctc gacaccgagt - 10081 tcgaggtcct cggctacgaa tccctcgccc tcctggagac cggcggcgcc atcgagcgcg - 10141 agtacggcat ctcgctggac gacgaggtca tcaccgacgc ggagaccccg cgcgccctca - 10201 tcgacgccgt caacgcccac ctgtccaccg ccggtgcggc ctgagccgaa ggagccttca - 10261 ccatgaccga gaacacccag gaacacggcc gcctcgccct cgtctcgggc ggcaccagcg - 10321 gtatcgggct ggcgagcgcg cggctgctcg ccgagcaggg gcaccgggtc ttcctcggcg - 10381 cccgggacgc cgaccgggtc gcggcgaccg tcaaggaact ggccggcgag ggcctgccgg - 10441 tggacggcac cgtcctcgac gtgcgcgagg acgcctccgt acgggccttc gtccaggccg - 10501 ccgtggaccg cttcggcacc gtggacgtgc tggtcaacaa cgccggccgc tccggtggcg - 10561 gggtcaccgc ggacatcccc ttcgagctgt gggccgatgt catcgagacc aacctcacca - 10621 gcgtcttccg gatgaccaag gaggtgctga acgcgggcgg catgcgtgcc aagagccggg - 10681 ggcggatcat caacatcgcc tccaccgcgg gcaagcaggg tgtcgtcctc ggcgccccgt - 10741 actcggcctc caagcacggt gtcgtcggct tcaccaaggc gctgggcaac gagctggcgc - 10801 cgaccgggat cacggtgaac gcggtctgcc ccggctatgt cgagacgccc atggcccagc - 10861 gggtgcgcca ggggtacgcc gacgcgtacg acaccagtga ggaggccatc ctggagaagt - 10921 tccaggcgaa gatccccctc ggccgctact ccacgcccga ggaggtcgcc ggactcgtcg - 10981 gctacctcgc ctccgacacc gccgcctcgc tcacctccca ggccctcaac gtctgcggcg - 11041 gactgggcaa cttctgacgt ccgtacggcg atccccgcac cccttcatct gtctggagtt - 11101 gtggctatga cgacccgtga ggtcgagcac gagatcacca tcgcggctcc ggcggcggcc - 11161 gtgtaccggc tgctcgccga ggtggccaac tggccccgca tcttcccccc gaccctctac - 11221 gtggaccgcg 
aggagctggg cccggggcag gagcggatcc acatctgggc caccgccaac - 11281 ggcgaggcga agaactggac ttcgcaccgg acgctggacg aggacgccct gcgcatcacc - 11341 ttccggcagg aggtgagtcc ggagccggtg gcggagatga acgggacgtg gatcatcgag - 11401 ccgcagggcg cctcgtcctc gcgggtgcgg ctgctgcacg ccttcaaggc gatcggtgac - 11461 gatccgcacg acctgctgtg gatcgagacg gcggtcgaca agaacagcac caaggaactg - 11521 gccgggctga aggagaacgt cgaactcgcg catgcagccg aggagttgac gttctcgttc - 11581 accgacacgg tccgtatcga cggtgcggcg aaggacgcgt acgacttcat cgaccaggcc - 11641 gacaagtggg acgaacggct cccgcacgtg gcgcgggtgc ggctcaccga ggacaccccg - 11701 gggctgcagg agctggagat ggacaccagg gccaaggacg gctccaccca caccaccaag - 11761 tcctaccggg tgaccttccc ccaccaccgc atcgcctaca agcaggtcac cctgcccgcg - 11821 ctgatgaccc tgcacaccgg gatctggacc ttcgaggagg accccaccgg cacccacacc - 11881 acggcctcct cccagcacac cgtcaccctg cgcccggaga acatcgagaa gatcctcggc - 11941 cccgacgcga ccgtcgccga cgcccgcgcc tatgtgcaga gcgcgctgtc caccaacagc - 12001 accgccaccc tcggccacgc caagaaccac gcggagcgcc agggctgatg gacaccgcgg - 12061 accgcctgga gacccaggtc atcatcgtcg gcgccggtcc ggtcgggctc ctgctcgccg - 12121 gtgaactccg cctgggcggc gccgaggtgg tggtgctcga acagcgcgag gcgcccacga - 12181 ccgagtcgcg ggcctccacc ctgcacgccc gcaccatgga gatcctcgac agccggggac - 12241 tgctggccgg cctcggcacc ccgccgcagg agccgcgcgg ccacttcggc ggcatcccgc - 12301 tcgatctgac gctgcccagc cgctacccgg gccagtggaa ggtgccgcag ttccgcaccg - 12361 aggaactgct ccaggagtgg gcgctcggcc tcggcgcgga catccgccgc ggccaccagg - 12421 tgcacgcgct gaacccgggc gaccaggcgg agtacgtcga ggccgaggcc accggacccg - 12481 gcggcaggcg cgtcctggtg cgcggccgcc acctggtggc ctgcgacggc gaggagggca - 12541 ccgtccgcag gctgaccggg gtggtcttcc ccgggcagag cgccacccgg gagctgctgc - 12601 gcgccgacgt ggacggcatc gacgtacccg atcggcgctt cgagcggctg ccgcggggcc - 12661 tggccatcgc cgcccggcgg ggcgacgggg tgacccgggt gatggcccat gtcttcggct - 12721 cgaccgccca accccgcacc ggggaggccg agttcgggga ggtcgtggcg gcctggaagc - 12781 aggtcaccgg ggaggacatc tccggcggca ccccgctgtg ggtgaacacc ttcggcgacg - 12841 cctcccggca 
gctggtgcac taccggcgcg ggcgcatcct cttcgcgggc gacgccgccc - 12901 atgtgcagat gccgatcggc gggcaggccc tcaacctcgg cctccaggac gccttcaacc - 12961 tcggctggaa gctcgcccgg cagctgcggg aacccggcgg ggaggcgctg ctcgacagct - 13021 accacaccga gcggcacgcg gtcggccgcc gggtcctcgg caacatcaag gcccaggcca - 13081 tgctgctgct cggcggcccc gaagtggagc cgctgcgcac cctgctggcc gaactcatcc - 13141 gccacgagaa ggtccgcgcg cacctggccg ggatgatcag cggactcgac atccgctacc - 13201 aactcccggg ccccgcgcac cccttgctcg gcgcccggct gccgcacacc gtcctgacga - 13261 gtcctcaggg acgggtgtcc gtcagcgagt tgctgcgcac cggacgcgga gtgtggatca - 13321 acccgggcgt ggacgtgccg gacggggccc gtctcagcac gctcaccggc cgccccgagg - 13381 aggggccgct gaccgacaag gactccgtcc tggtgcggcc cgacgggcat gtcgcctggg - 13441 cgggctccac cgggacccca ccgcccgccg aggcactcgg gcccgggtgg gaagccaccg - 13501 cctgaggaga cccaccgccc cgaaggcacc gcccccactg tgccgggcac cacccgcacg - 13561 cccacacctc acgaagggac cgaaaccatg gcagggacag cacaggggac cgcggtggac - 13621 gccgatgtca tcatcgtcgg cgccggaccg accgggctga tgctcgccgg tgaactccgg - 13681 ctcggcggcg cccgcgtcat cgtcgccgaa cggctcgccg agcccaccgg gcagtcccgc - 13741 gggctcggct tcaccgcccg cgcgatggag atcttcgacc agcgcgggct gctgccccgc - 13801 ttcggccagg gcgagaccct ggagaccagc ccgatgggcc acttcggcgg cctgcagttc - 13861 gacttcacca ccctgcccgg cgcccacttc ggcgcccgcg gcatcccgca gtaccagacc - 13921 gaggcggtac tggaggagtg ggcggccgga ctcggcgcgg acatccgccg cggctgggag - 13981 ttcctggagc tggccgaggg cttcctcacc ggcgagggcg tcgaggtcac cttcggcacc - 14041 cccgagggcg tacgcaccct gcgcgccgcc tatctggtcg gctgcgacgg cggcggcagc - 14101 caggtccgca aggcggccgg tttcgccttc cccggactgc ccgcgacccg cgcgatgttc - 14161 ctcgccgatg tcaccggcct gaacctcaag ccccgcttcc tcggcgagcg cctgccgcac - 14221 gggatggtga tggcggcccc gctcgccgag ggcgtggacc ggatcatcgt ctgcccgcac - 14281 ggcacccccg cccgcgaccg cgacgagagc gtcaccttcg aggaggtcgc cgccgcctgg - 14341 cagcacatca ccggcgagga catcagccac ggcggcgccg actgggtcag ctccttctcc - 14401 gacgccgccc gccaggtcga cagctaccgc cgcggccggg tgctgctcgc cggggacgcc - 14461 gcgcacatcc 
acctccccgc cgggggccag gggctgagca ccggggtgca ggacgccgcc - 14521 aacctcggct ggaagctggc ggccaccgtc gccgggcggg cgcccgcggg gctgctcgac - 14581 agctaccaca ccgagcggca cgcggtcggc agccgcctgc tgatgaacac ccgcgcccag - 14641 ggcttcgtct tcctcggcgg cgaaccggcc gacccgctgc gcacggtctt cgccgaactc - 14701 ctcggccacg aggaggtcaa gcagcacctg gccgggatcg tcagccacct cgacgtgcac - 14761 tacgcggccc ccgagggcgc ccacccgctc accggccacc ggctcggcga gcacatcctg - 14821 gtcggcaagg agggcgagag cgctgtcttc gccgaactgc acggcgggcg tggcctgttg - 14881 ctcgacctcg ctgacgacgc cggggtccgc gcggcgggcg cgggactgac cgaccggctc - 14941 accaccgtca cggccaccct caagtccgcc cccggcgacg ccgaccgcct cgacggcgtc - 15001 cgcgccctcc tggtccgccc ggacggctat gtggcctggg cgggggagac caccgagggg - 15061 ctggcggagg ccgtacgccg atggttcggc gaggcctcgc ccgcctgatc ccgaccgccg - 15121 cgagcaccgg cgcccgcccg cacgggtgcc ggacccccag ggcggtgcgc cgggtacgtg - 15181 gcgcacccgg cacaccgccc gcccccctgc gaggccccgg cctcgcccct tcgaggcctc - 15241 gggagacccg gccatgacgg cgctcggcag cacgcccacc ggcgacacgg acccgcccgc - 15301 accggagccc ccggcaccgg acccgcccgt acccggcgcc ttctccaccg gggtccgccg - 15361 gatcaccctc gacgcgggcg gcctcgacct ctccgcgctg ctgagcgagc ccgagcaggg - 15421 cccgccccgg gccaccgtcg tcgcggtgca cggcggcggc atgagcgccg ggtacttcga - 15481 cgggcaggcc caccccgagc agtccctgat gacgctcggc gcccaactcg gctacaccgt - 15541 cctgtcggtg gaccgccccg gctacggcag ctccgccgcg tggctccccg agggactcac - 15601 cctcggcgag caggcggtgg tgctgcacgc cgccctcgac gacttccgcc ggcactacgc - 15661 ccacggggcc gggctcttcc tgctcgccca ctcgctcggc ggcgccctgg tgatggccac - 15721 cgccgccggg gccgaggcgg accgcgccct gctcggactc gacgtctcgg gctgcggcca - 15781 ccgctacgcc gtcgtgccgg accagggccg gaccacccga aggaacaccc tgcggcactg - 15841 gggcccgctg cggctctacc cgccgaacac cttcgccacg agcaccggcc tggtcgcccc - 15901 ggtcccggcc cgcgaggcgg gtgaactcgc ccgctggccc gagctgttcg ccgccctggc - 15961 gccccggatc agcgtgccgg tgcggctcac cttcgccgag cacgaggcct ggtggcggca - 16021 cggcgaacag gacttggccg acctcgccgc ccaactcacc gcctcaccac gggtcctggt - 16081 ggagcgtcag 
cccgacgccg ggcacaacat cagcctgggc tgggcggccc gcgcgtacca - 16141 tctgcgctcg ctggccttcc tggaggactg cctcacccac accggccggg agtgagcggc - 16201 cgtgccgccc gccggggtct tccgcaccgc ccgccgccga gcggggcccg aggcgtaccc - 16261 ggggccgtcg gccgcacagg gcggcaggca ccgccgcccg cggacgggag gtcccctgtc - 16321 gtgacgtcca cccgcgcccc gctgcccgcg cccggcacct accagctgtg ggtcttcgac - 16381 tccctcacgg aggaggggat cccggccacc cgcgccgagg cgggacccga ggcgctcggc - 16441 cccgaggagc ggcgccgggc ccgcctcttt aggcgccccg ccgaccgcag gcagtacgag - 16501 agcgcccatc tggtcctgcg gcggctgctc gccgaccaca ccggactggc ccccgagcgg - 16561 ctggagttcg gccgcgaggg cgggcggcgc ggcaagcccc gcctgctcgg ctcgccggtg - 16621 ccggtgcact tctcgctctc gcacagccac ggcctcgtcg cgatcgccct cgccgccgat - 16681 ccggtgggcg tggacgtcca gcgggtgccg ggggcgcgca ccgtcgagcg gtgcctgccc - 16741 tcgctgcacc ccgccgagcg ggccgaactc accgccctgc ccgagtcgga gcgcccggac - 16801 gccttcgccc tgctgtggac ccgcaaggag gcctacctca agggactcgg caccgggctc - 16861 gcccggccgc tcgccgcgga ctacctgggc agcggcggcc tcgccgcccg cccgccggac - 16921 tggaccgtgc acaacaccgc cgcccgcccg gggcacgcgg cagccgccgc gctccgtaca - 16981 cccgcgaccg gatgacagcc gggcgcgtac gccaccactg ggggaaggga caccatggcg - 17041 acagccaccg aggacaccca ccacccgcgc gcactcgccg cggaactcgg cgcgcgcaag - 17101 gaggaggccc ggcagggtcc cgacccgcgg gccaccgaac gccagcacgc caagggcaag - 17161 ttgacggcgc gtgagcggat cgacctgctg ctcgacaaga acagcttcac cgaggtcgag - 17221 cagttgcgca ggcaccgggc gaccggcttc ggcctggagg cgaggaagcc gtacaccgac - 17281 ggggtggtga ccggctgggg cacggtcgag ggccggacgg tcttcgtcta cgcccacgac - 17341 ttccggatct tcgggggcgc cctcggcgag gcgcacgccg cgaagatcca caagatcatg - 17401 gacatggcgc tggccgccgg ggcgccgctg gtctcgctca acgacggcgc gggcgcccgg - 17461 atccaggagg gcgtctccgc gctcgcgggc tacggcggca tcttccagcg caacacccgc - 17521 gcctcgggcg tcatcccgca gatctcggtg atgctcggcc cctgcgcggg cggcgccgcc - 17581 tacagccccg cgctcaccga cttcgtcttc atggtccgcg acacctccca gatgttcatc - 17641 accgggcccg atgtcgtcca ggcggtcacc ggcgaggaga tcagccagaa cgggctcggc - 17701 ggcgccgagg 
tgcacgccgg tacctccggg gtggcccact tcgcctacga cgacgaggag - 17761 acctgcctcg ccgaggtccg ctacctgctg tccttcctgc cgtccaacaa ccgcagcatg - 17821 ccgccgcacc tgccgagcgc cgaccccgcc gaccggcccg gcgagcggct caccgaggtg - 17881 gtgccggccg acggcaaccg cgcctacgac gtccgggagg tgatcgagga ggtcgtcgac - 17941 gacggcgagt acctggaggt gcacgcctcc tgggcgccca atctggtctg cgccctggcc - 18001 cgcctcgacg ggcatgtggt cggcgtggtc gccaaccagc cgaacgcctt cgccggggtc - 18061 ctcgacatca gggcgagcga gaagggcgcc cgcttcgtgc agttctgcga ctccttcagc - 18121 atcccgctgg tgaccctggt cgacgtgccg ggcttcctgc cgggcgtgga ccaggagcac - 18181 gagggcatca tccggcgcgg cgccaagctc ctgtacgcct actgcaacgc caccgtgccc - 18241 cgggtctcgg tggtcctccg caaggcctac ggcggcgcct acatcgtgat ggactcgcgc - 18301 tccatcggcg ccgacatcgc gctcgcctgg ccgaccaacg agatcgccgt gatgggggcc - 18361 gagggcgccg ccaacgtggt cttccggcgc gagatcgccg ccgccgcgga ccccggggag - 18421 atgcgcgcgc agaagatcaa ggagtaccgg gaggagctgg tccaccccta ctacgcggcc - 18481 gaacgcggtc tcgtcgacga cgtcatcgac ccccgcgaga cccgcgcggt gctctgccgc - 18541 gcggtcacca tgctggccgc caaggacgcc gacctgcccc gccgcaaaca cggcaaccca - 18601 ccgcagtagc agggcggttg cccctgctca ccaggcggct gcccggctcg cggggcggtc - 18661 gccgcggctc gtacgggagc ggtcgcgcgg gcggaagcgg gcagcgcgta cggaatcggc - 18721 agcgcgtacg gaatcagcag agaggtgagg cgaatgtccg agcggaacac gggtgcggcc - 18781 ggggagccgg agagcggtga gggcggccgg gagaccccct gccgccagtt gctgagggtg - 18841 gtgcgcggca acccggcgcc ggaggaactc gccgtgctct ccgccctgtt gttcgcccgg - 18901 ctctcggcgc cggaggcaca ggcggccggt cccctggggc gggcggtggc cggctggcgg - 18961 cgccccgagc gcggctcgat gttcgacggc ccgcgcacct ggcgcggcac cggatccgcc - 19021 gcgcacccga ccggcgggcg gtagggcccg ggaggccggt ggcgggtgcc ggggtgagcc - 19081 ccgccgcccc gcgtgccccg cgacgcgcgg aggccgcgta cgcgccgggc gtacgcggcc - 19141 tccgcggccg ggagacgggc cgggggcggg gtctcaccgg ccgcccccgg ccgccggggt - 19201 caggcgtcga gggccgccac gatgccgtcc cagagggcga cccgggcgcg cagcgcggcg - 19261 gtcaccgtct cggcggcctc ctgccacttg gcctcgtcct cgccgcacag gtcggcgacc - 19321 atcgccatgg 
ccatcggggt gtgctcctcc ccgtcgacct cgatgtgccg ggccaggtac - 19381 tcgcggaagg tggcgagctt gccgccctgg tcgtcgacct tgatgacctg gtcgaacatc - 19441 tccgggatca ggtcctcgcg gccgaaggcg aaggccgcgg cccggcagtg cagcggggcc - 19501 ccctcgatga agtcgaaggt ggcgttcacg aaggtggcgg ccgccgccgg gaccgaggcg - 19561 ccgaccaggg cggtgcgcac gccctcgccg ccgcggatgc ggtccaggaa gttgttgatc - 19621 acggtgacgt cggcgcccgc ctcggccatg ccgttgacgt acagctcgaa gtggctgatg - 19681 aagccgtcgc cgagctcgtc gctctcctcg accaggacga tgtcgttgat cagccgccgg - 19741 ctctccgagc tgccctgcgg cacccagggc acgtccacgc aggtgaggct gcgctggagg - 19801 ctcttcagga gggacatgaa gtcccagacc gcgaagacat ggttctcgtt gaaggtgttg - 19861 acgtcttcga gcgttgcaag gcggtggtag atcgggtgct tcaccacttc gaggcgggcg - 19921 tcgtcgatga ctttccgcag tttctcgatg gaagcgttct ctttgcccca gtcgtagcgc - 19981 gacacagaaa tgtctcccgt ccaaagaatg ccgtgtgttc gatctgttcc agtgcgttcg - 20041 gcgagcacta tggccgcatc tcacagcgcc cggcaagggg atgtgaggac gggcaatcgg - 20101 ggtgaagcgg gcggctgacg cggtgtccca tggggttttc ccgcggcgcg ctgtgcgact - 20161 gcgggatttc cgcccttgca cgccggggtg ctcttcggcg cggtcggccg tgatcccgcg - 20221 gccgggttcc ggttctgccg ggctccgggc cgaacggctt gtcctggcag gtcagttggg - 20281 ctctgatggg ggagcggcgg tccggttccg cggcggcccg gtgtgaaagt tggaccgcgt - 20341 tgcgccccct ggccgatcgg gggaccatcg gtcgcacttc cctgcggacg gtgattgctg - 20401 tccgattacc gcgaatccag gcggcggtgt tctccgtacc gaatacggga acggcgttcc - 20461 tgcttgtccc cgaaatggga ttccgcatgc gcgcgccgac aggtcggcac accggctcgg - 20521 cgatttctgg tctcttgccg tggacgcgag agaagaagac acgaggggga cttcgaaatg - 20581 ccctgggaaa agaacgaggc ggccggcggg gagacgagcg gacgggacgc gcggatcgcc - 20641 gcacgcgccc gtgaggagaa ctggaagaag cccccgcggc gcatcgagtc cgccgagtgc - 20701 atcacctgcg acagctgcct gcgcggctgc cccgcggagt tcggcgccat cttcgaccgc - 20761 ggcctcgacg tcgtcatcat ccccgagctg tgctcgggct gcccggcctg cgtcctggag - 20821 tgccccgtcg actgcatcta cgtcgacgag gactgggcgc ccaccgacga gagcctgtgg - 20881 aagcacatcg agctgaccgc ggacggtgcc tgatgccctc accggccgaa cgcggcctga - 20941 gccgccgcga 
gatcaacgcg aggaagcggc agagccgcag acccagcagg cacggcagcg - 21001 ccgccggcgc ggcgcccggc cccgactatc cgcgcgagga cggcgtgggc ttccccgggc - 21061 tgctcgaccg cgcctggcgc gcggcgctcg ccgccgggga gctgcccgcc gcggtggacg - 21121 cgctgctcac cctcgacggg cacgtccccg gcgacatcca gctgcgcgcc ctgcgcaccg - 21181 ccgacgaggc cgccctgaag gtgctctgcg gcgcctcctg gcgcggggtg cgcgacggcg - 21241 gccaggcgtc cggcgcgtct gccgagcggg cccaagtccc gccgcaggac gcggtgttcg - 21301 acggggagat cgccctgtcc accaccggcc ggatcctggt ccgggtgccc tcgcagggcc - 21361 cgctcgcgga gagcgggaac ctggtcgccc ccgccctcca ggtgccctgg tccgcggcgg - 21421 atctcgccgc ctaccgcacc gagtcggcgc gggcggcggc ccgctactcc tcggcggtgg - 21481 tcgactgccg ccagtggctc gcggcgcaca gcacccaggc ccgcgaggaa ctgctcgacc - 21541 tgctcaagga cgccgccctg cgcaccgcgc ccttcgtgct ctaccaggag gaccggcagt - 21601 acaccaactt ccgggacccc aacaccctca ccggcaagac cctgtggccc gggcatccgg - 21661 actgcgcgct gagcagcctc gcggggctcc cgctcgacca gtggtcggac agcgaggccg - 21721 tcctggtggt ctgcctgacc ctgctggtgc gctccgcctc gtacgcgcgc atcgaggagg - 21781 ccaacggcac ccagctgacc ccggaccacg tcggccacct cctggagggg gtgcggcgca - 21841 actacaacgc gcactcccgg ggcgaggcgg tgccgcccgc cgcctcggcg cgggtggccg - 21901 acctcgacgc gctggccggg gcgctgcgcg cgcgccggac cgaggtgctc ggcgaggtgc - 21961 agctctaccg ggagatccac ggccccctga tgcacaagat cgagcggacc gccgcccccc - 22021 ggggcgcggc cgcccgccac cgcgaggccg aggtcaccgc ccgcctcacc gaggcgctgc - 22081 cgctcgcggg cgaggacctc ggcgcgctcg ccgcgcacct cgccgagtcc ccggcctggc - 22141 tgaccaagcc gcacggcgag ttccgcaccg ggctcgaggc gctggtgcac gcctcggtgg - 22201 ccgcctccac cgaggccttc gaggccgact tcgcgatgag ccgcggcatg cgctcgctcg - 22261 cggggctgcg ggaggcgctg cgggcgcagg cctgggcgga gatcaccgac tgggggatca - 22321 ccgacttctt ctgctgcgtg gtgcccgacc cggcggcccg ccgccacttc ggcgactcgg - 22381 tggaccggct ggccgacacc gcctgggcga tgtcctcccg gatgcagtac aactcctggc - 22441 acttcatcgc gggcaatctg ccgaaggtgc ccgcggtggt ggcccgggac cacttcgtcc - 22501 cgccgaccct gccggacatc gccttctact ccgaccagca ccaccacggg cacgtcgccg - 22561 ccaaggtccg 
cttcagcatc cgcagcccgc aggcggtgga gatcgacggg cgccgcttca - 22621 acggcttcat ggacctccgg ctgctgcgct gcgagggcac ccccttcggc gaacaggacc - 22681 tgctcgccgc ccaccgggtc tccgccttcg tcgccggggc caccggcctc gccgccgaac - 22741 tcgtcgccgc cggtgaggag atcgaggtca cctccttcga ctcggcctgg cacggggagt - 22801 ccgtccgcgc ggccgtgaag gcgcgcggct gagccggatg agcccgtccg aggccggatc - 22861 cgtccgcccc gtcaccagcg aggagaccca gttgaccgcc tacggcatcg ccgcgacccg - 22921 ggcgctgctc ggccgcgggg agcgcaccgc caccgagcac ctcgccgccc acctcgccgc - 22981 gatcgaggaa cgcgaccccg gcctcggcgc cttcgtcgcg gtcgcgggcg agggggcgct - 23041 gcgggccgcc gcggccgccg acgcccggct gcgcgcgctc ggcccggccg ccttccagga - 23101 ccagccgctg ctcggcgtcc cggtctcggt caaggacctc atccagaccg gtgaactccc - 23161 cacccgccgc ggctccttgc tgcccaaccg ccgcccggcc gcggacgccc ccgcggtcgc - 23221 ccggctgaag gccgccgggg cgatcgtcgt cggcaagacc accacctccg agtacggctg - 23281 gagcgccagt accgtcagcc gggtctcgcc gcccacccgc aacccctggg acccggcgta - 23341 ctcggcgggc ggctccagcg ggggagcggc ggcctcggtg gcggccggac tgtgcaccgc - 23401 cgcgctcggc accgacggcg ccggatcgat ccgcatcccg gccgccttct gcggggtggt - 23461 cggctacaag ccctccttcg ggcgggtccc ctacgtcccc gcgggcgccg accggctctc - 23521 ccacctcggc ccgctggccc gcagcgtcga ggacgtgatg gagatcgccg cggtgctgcc - 23581 gggcccgcac cgccaggacc cggactccgg tctcggcgcc ctggagtcgc gtcccgagcg - 23641 gcgcggcctc cgggtcggct ggatcgagtt cccgggcact gcgcccgagg tgcgccgggt - 23701 cagcgaacgc gccctggagg ccctggccgc cctcgggcac caccccgagc gcatcgaggt - 23761 gcccttccgc gacccgtatc cggcgctcct ggacatcctc gccgccgccg aggccgccgg - 23821 tgccgcgccc ggcgacgagg cggacggcga ccccgggcgg ctggcggtgg tacgccacgg - 23881 ccgcgggctc gacggggccg cggtgatgcg cgccgaggag gtccggatgg agctgcgcac - 23941 ccgcctcgcc gcggtgatgg agcgccatga cctcctcgcg atggccaccg tcccggtgga - 24001 gcccttcgcc ccggaggcga tcggtcccga ctgggcgagc gaccccgaga gcctgctctg - 24061 gctcgcctgg agcccggcca cctacccctt caacatgacc ggccagcccg ccgtctcgct - 24121 gcccgcgggc ctcagccgcg ccgggctgcc ggtcggggtc cagctggtgg gccccgtcgg - 24181 cgcggacgcc 
ctggtcctcg acaccgcgcg ggacctggag gcgggactcg gtccgctgcc - 24241 cgaagtaccc cagcgcgtct ccgaaaggat gctctagcga tgtacacccg caagtggtcc - 24301 cggcccgccg ccgaggacgg agtcggccgc agcgacttcg tcgccgagca cggtctgtgg - 24361 gacgagcggc agcgcgccgc ggccgcggag atcgaggccc acctcggcga agtcgacctc - 24421 atacggctgg tgttcggcga tccgcacggg ctcgcccggt ccaagacgct caccgtggag - 24481 gccttccgcg cggccctgcg cggcgggatg gactacagcc cgggcccctt cctcttcgac - 24541 accggccacg cggtcgccgt cgacttcctc tccgacccgg gcgtggacgt ccccgaactc - 24601 ctcggcgcgg gcaacttcgt ggtcgtcccc gacccggtga ccttccagct gctgcccggc - 24661 ggcgaggccc gtaccgcctg ggtgatcggc gaggagtacc tgcccgacgg aaggccgcac - 24721 ccgctctcct cccggcacgt cctgcgcaag gtgatcgcgg cctacgcggc ccaggagtac - 24781 accccggtcc tcggtctgga ggtggagtgg tacctcaccc gcaggctgga gggcccggtg - 24841 gggaacgcgg gcaacggctt cggcctccag ggggaggcac cccgggtggc ggccatgaac - 24901 ccgggctacc agttcaactc cgacaacgcc ttcgcctcgg tggccgcctt cgcccatccg - 24961 ctgagcgcgc tccttcgcca actcggcctg ccgctgcggt cgatggagca cgagtcgggt - 25021 ccggggcaga tcgagaccac cttcgcgccg atgcacgccc tggacaccgc cgacgccatg - 25081 ctgctcttcc gcaccctggt caagcagcgg gccgcgcagg gcggttacca cgccaccttc - 25141 atgtcgctgc cgcgtatcga cggcttcgac ccgagcggct ggcatgtgca ccagtcggtc - 25201 gtcgacaccc gtaccggacg caacctcttc gcccccgacg accccgcggc cccgctctcc - 25261 gccgccggac tcgcctacgc ggagggcctg ttgcggcgcg cccgcgagct gtgcctgctc - 25321 tcggtgccga cggtcaacgg ccaccggcgc ctcggctccg gcttctcgct ctcgcccacc - 25381 cggatcggct ggagcccgga ggaccgcacc gcgatggtcc gggtggtcgg cgcgggcggc - 25441 tcccggcacc tggagaaccg caccggcgaa ccctgcgcca acccctatct cgccctggcc - 25501 gcccagctgt tcgccggtct ggagggcatg aacagcgact ccctcgtgcc gcgccccgcc - 25561 ctcggcccgg acgccgcggg cgccgagacg ctgccgggct ccctcgagga gtccctggcc - 25621 gctttccgcc agggcagccc cgccgatctg ctcggcaccc cgctcgcccg ctgcctggcc - 25681 aagctcaagc agagcgagct ggaccgcttc cgcacctggg ccgagaagga gcagccgccg - 25741 gagggcgagg tcaccgagtg ggagcagcgc gagtacttcg aggccttctg acccggactt - 25801 gggggctcaa 
ctcccttaca cacacggcca gttcgtccac cgactgaggg gcagccaccg - 25861 atgattcccc gctacacccg gcccgagatg gcggaactct tctcggacca ggcacgctac - 25921 gagacctggg tgcgggtgga gatcctcgcc accgaggccc aggtgcggct cggcgccgta - 25981 cccggcagcg cccttgcgga catgcggcgc gcgcccgtgc cgctcgcctc ccgggtcgcc - 26041 gagatcgaga aggagcgcga ccacgaggtg ctctccttcc tcgccgccta ctgcgaggag - 26101 atccccgagg agtcggcccg ctgggtccac ctcggcatga ccagctacga cctggtcgac - 26161 accgcgctcg gccacaccct cgcccgcggc accgacctgc tgctcgacgc ggcccgcgcc - 26221 ctgcgccgga tcctcgccga gcgggccgtg gagcactggg acaccgtctg cgtcggccgc - 26281 acccacgggg tgcacgccga gcccaccacc ttcgggcaca agctcgccgg gtacgccttc - 26341 gcggtggacc gctcgctgac ccggctgcgg gcggcacgcg aggcggtcgc ggtgggcacg - 26401 gtctccggct cggtgggtac gtacgcgctg atcgacccgg cggtggagcg gcacgtcctc - 26461 accgcgctcg gcctcgcggc ggagccggcg ccgagccagg tggtggcgcg cgaccggcac - 26521 gcccagctgg tgcaggcggt ggccgcgctc ggcgccgtgg tcgagcaagt cgccctggag - 26581 atgcggctgt tgcagcgcac cgaggtccgc gaggtggagg agcggcgcac cggcgcctac - 26641 cagggctcca gcgcgatgcc gcacaagcgc aacccgacca ccagcgaacg cctggtcggc - 26701 ctcgcgcggc tgctgcgcgg gcacgccggc accgccctgg agaacgtcgc gctctggcac - 26761 gagcgcgacc tcgcccacca gtccgtggag cgggtgatcc tcccggacag cctgagcgtg - 26821 ggccacttcc aggtgaccat ggccaccgaa ctgctcaccc atctcgccgt cttccccgag - 26881 cggatgcgcg cgcacctgga gcagaccggc gggctcgtct acagctccgc cgtcctcgcc - 26941 gaactgctcg ccacgggcac cgaacgcgag aaggcctacc ggggtgtgca ggcggcggcg - 27001 aaccgcaccc tggcgggcgg cgcggacttc gccgccgcgc tcgccgagga ggggatcgac - 27061 ctcgggccac tgggccccga gcgcttcctc ggccaccatg atgtgatccg cgagcgattg - 27121 gagcagctac gtgacctgga agattgagcg ggtaccgggg gacggcctgg acctggacga - 27181 agtcctcacc gtctaccggg agtcggggct cggcgagcgc cgcccgatcg aggaccggga - 27241 gcgcttcgcg gcgatgctgc gcggggcgaa tctggtggtc gtctgccgta ccgaggaggg - 27301 gcggctgatc ggcatcgccc gcagcgtctc cgacttcagc tatgtcacct acctctccga - 27361 catcgcggtc agcgccgact tccagcgcgc gggcatcggg cgggccctga tcgcggggac - 27421 ccaggccgag 
acccccgggg tgaagatcgt gctcctctcg gcgccggcgg cggtcgacta - 27481 ctacccgcac ctcggcttca cccggcacga gagcgcctgg gtgctccagc cctgaacccc - 27541 cgaggaatcg ggagcaagca gagcgcggcc gtctccccgg ggaggcggcc gagcggtctt - 27601 ccctctttct ctacggtggc tcaggcgctg cccagtttga atccgacgcc gcgcaccgtg - 27661 atgatccatc cgctgtcgcc gagtttgctg cgcagactgc ttacgtgggt atcgacggtt - 27721 cggcgcgacc aggaatctcc ccatacctgc tgcagtaaac gtttgcgggg aatcacggtg - 27781 tcgggattcg aggcgagcag gtgcagaaga tcgaattctt tcctggtgag tccgacctcg - 27841 cgtccgtcca ggctcacttc ccgggagctg gcatcgatct tgaggggccc gtgctggatt - 27901 tcccgtaccc gctgcggctg ttgatggacg cgccgcatca cggcgtcgat ccgggcgagg - 27961 agttcgcgga atccataggg tttgacgagg aaatcgtccg ccccggcctg gagtccgagg - 28021 acccggtcca gctcggtccc gcgggcggtc acgatgatca ccggcaggca gctgacggag - 28081 cggatcgccc cgcatacctc cagtccgtcc aggtccggca gctccagatc gagcaggacg - 28141 agatcgatgt cctccaggga ctgcaaggcg gtgccgccct gctggacgcg cgtagtctca - 28201 tgcccgtggc ggcgcagtcg gcagaccagc gcctcggcgt agtcgctgtc gttgtccacc - 28261 acgaggatcc gctggccggt gggcagtccc gcgaccttgc gggtggtggg gccgaagccc - 28321 tcgtcctccg cgaaccgggg cgagggcatg gcacgctgaa agggaatacc agattccagt - 28381 acggcctcgg tcgagctttg tgccatgtct gtcccccgtg agtcatgagc cccgttcggt - 28441 gaactgatgg gaatccgaag cgaaacggag cgcttacctg caagacgagc ggcatcggaa - 28501 tgcagaaaca cgagcgtcgt caggcactct gcgacgcctc ccgcgtggcg tcgcacggcc - 28561 cagaacacgg ggattcaccc cgcagggcgg acgttacctg attccgtgag acttgcggag - 28621 gggaaacgga cagaagttgt caggcggaga gaatggctac atcgagaccg gcgagacggg - 28681 tggggtccgc gatgatgttc attgcggtga tgcgtccctc ggaaacggtg aagtccatga - 28741 ccacggagag ttgcctgggc gccgccgtgg ccaggccgag acgcccgtcg accagcgccg - 28801 tccgcgccag atgcgcacgt cccgagtaga gaccggcctg cgccgccacg ggctgggcac - 28861 cgacgatctc catgggggcg ccggcggggg tggcggccgc gtccacccgc agcacgacat - 28921 ccgggtcgag cagggcgagc agcgcctcga actccccgcc gcgcgccgcc gcgaggaagg - 28981 cgtcgaccac cgcgcgctgg cgcggcaggt cggagtcggg cgaggtgtcc acggcctgca - 29041 cccggcggcg 
ggcgcggctg gcgagctgac gtgcggcgac gggggtgcgg ccgacgatcg - 29101 gcgcgatctc cccgaagggc acggagaaca tgtcgtgcag gacgaaggcg atccgctccg - 29161 ccgggtcgag ggtgtccagg acgacgagca gggcgagccc gacggagtcc accagctgcg - 29221 cctcgtgcgc cgggtcggtc ggcgcggcgg cctggtcgcg cgggccgtgc tcgggcaggt - 29281 ggtcgccgag cgggtcctcc cggcgcgagg agcgcgagcg cagcatgtcc aggcagatgc - 29341 ggccggccac ggtggtcagc cagccgccga ggttgccgat ctccccggcc tcgctccggc - 29401 tcagccgcag ccaggtctcc tggaccgcgt cgtccgcctc cgccacggaa ccgagcatcc - 29461 ggtaggccac cgcgcgcaga tggggccgct gggactcgaa cttctccgcc agcgccggcc - 29521 attcgccctt gtccaccggt cacatcctcc gctcggctcc cgtcatagcg ttgacggctg - 29581 tcactcagcg tatgtgaagg gaccccgccg cagcaggttc cgcgcgcaag ccgcccggcg - 29641 gggcctccgg gctgcccgcg gccgggcgga cgagccggtg cgcgcggccg gtcctgacct - 29701 cggtaaagtc aacgaggcat atccaccggg cagttggcga gtgctcgcgc cgcagatcac - 29761 ggtgccgggc ggtgtgcgcc cccgcttccc gggcccgctg tccgtgcgcg cggccccgcg - 29821 gcggtcgccg gtcgcccggg cccgccccgc cggaaccggc cgcaggttgg ccggaatccg - 29881 cccctgccca attacccctc ctgacacggc tgttgacacc gctgagcggg gtcccctcta - 29941 atgccgctac cggaactgga ttccgcttcc gcatcgctgt caggaggtgc accttgtctc - 30001 tggccgaaca gttgacctat ccggcagtcg atctcgacga gatcgagtcg tcggccatct - 30061 ggatcgaatc gcacccgatc acccgcgtac ggatcgactc cctcgtcttc gagggctccc - 30121 cgcgtctcgg cggcgaggac cacgaccacg tacgcgtgct cgccgaagcg ggggactccc - 30181 tgcccgcgat caccgtgcac cgccccaccc tgcgcgtcat cgacggcacc caccgggtcc - 30241 gcgcggccct gctcaacggc cgtaccgaga tcgcggcccg gatgctcgac tgcgacgagg - 30301 ccgcggcctt cgtcctgtcc gtcaaggcca acgtcaccca tggactgccg ctcagccgcc - 30361 aggagcgggc cgccgccgcg gcgcggatca tcatgaccca tccgcagtgg tcggaccggg - 30421 cggtcgccgc cgccaccggg atctccgaca agacggtctc ccggatccgc tcccagtcgg - 30481 gcgccgactc cgcgcagtcc gccacccgcc tgggccgcga cgggcggctg cgcccgctcg - 30541 acagcgggca gcgccgccgc cgcgccgccg cgatgttcct ggaccgcccc gacgcgggac - 30601 tgcgcgaggt ggccagggcc accggcctct ccccggcgac ggtacgggac gtgcgccagc - 30661 gcatcgaccg 
cggcgaggac ccggtacccg gccgctaccg cacggcggag agtcccggcg - 30721 gcgccaccgc ggcccggcag cgccccgccg ccggacgcct ggaccgcagg accgtggtgg - 30781 tggaccggca gcggctgctc gccaagctca gcgaggaccc ctcgctgcgc ctcaacgagg - 30841 cgggacggcg cgccctgcgc tggctgcacc actactccgt ggacggaaac ggcatcgaga - 30901 ccctcggcca ggggctgccc tgccactggg cccccgacgt cgccgacctg gcccgcagct - 30961 gcgccgccgc ctgggccgaa ctcgccgagc agctccagca gcgcgccgag taggcaggct - 31021 gccgcaactc ccttctccac ggctcgactt cgcagcggga gagggcaggg acaccgccgc - 31081 ccgcggcacc gtcccgcagc acctcggacc tcggtcgacc ggtccgcgca ccgccccacc - 31141 tcgtacgacc cggtcccgta ccggccggct ccaccccgca ccaccggact cccgggcgag - 31201 ccgccccgcg actcccgcac ctgagcacct cccggaccgc gcaccgcgcc tcccgcgccg - 31261 ccgccccgcc ggtcccgttc cgcgcaccgc cgctcgtgca ccgccgctcc gcgcaccgac - 31321 tgcgtcaact gccctccccg gcagcgcact tggcaccacc ggctccccgc accccgcagg - 31381 cgcgccacac ccgcaccgcg caccgccccg caccgcgtac cgccgcaccg cgcacctccc - 31441 gtaccgcgta ccacgtaccg ccgcaccgcg caccgccccg cacccacccg caccgccaga - 31501 gccccacacg ctcagcaccg ccctatccgc taccgggccc caccccggag ccgtcccagc - 31561 cgctccacgc tccaacgcct ctgcccaccc gggtggttga gcctctttcg gccacccgtc - 31621 ggcggtgccg aggggcggtg ggcgcggggc gggaaccgac gtcatccagg aggcatcccg - 31681 tgtcccagca ccccgagaag gccggtccgc ccggtgcccc tgcgagcggt cccggtaccg - 31741 gtgtgtggtt catcggggcc aggggctccg tcgccaccac cgcggtgacc ggcgcggcgg - 31801 cgctcgccgc cgggctccag ccgccgaccg gactggtcac cgaggcaccg gagttcgcgg - 31861 gcagcgggct gcccgcgctg tcctcgctcg tcttcggcgg gcacgacacc gccgactggc - 31921 cgctgcccaa gcgcgccgag gcgctggccg agggcggggt gctgccgcgc gggctcgccg - 31981 ccgcggtgca gcgcgaactc gccgccgccg acgaggagat ccgccccggc ggaccgctgc - 32041 ccggcgaccg gcgcggcgac gaggagctga tcgccgactt cgccgccgac atcgcggact - 32101 tcacccgccg caccggggtg gcccgcacgg tcgtggtcaa cctggcctcc accgagcccc - 32161 tgcccgaacc caacagcgcc cggctgcccg ccagttcgct gtacgcggcg gccgccctgc - 32221 gcgccggtgc ggcctacgtc aacttcaccc cctcggcggg gctgcaccac cccgcgctcg - 32281 ccgaggccgc 
ggccagcgcc cgggtcccgt acgcgggccg cgacgggaag accggccaga - 32341 ccctgctgcg ctcggtgctc gcgccgatgt tccggcagcg cgccctggac gtgcgggcct - 32401 ggtccgggac caatctgctg ggcggcggtg acggcgccgc cctcgccgac ccggccgccg - 32461 ccgaggcgaa gaacgcgggc aagaaccggg tcctggagga caccctcgga gcactgcccg - 32521 agggcgaggt gcacatcgac gaggtaccgg cgctcggcga gtggaagacc gcctgggacc - 32581 atgtcgcctt cgagggcttc ctcggctccc ggatgatcct gcagaccatc tggcagggct - 32641 gcgactcggc gctcgccgcc cccctggtcc tggacctggc ccggctcgcc gcccgcgccc - 32701 aggaggccgg gctcaccggg caactccccg cgctcggctt ctacttcaag gaccccgacg - 32761 gcggctcctc ggccctggcc gagcagtacg ccgcgctcct cgccttcgcc gcgcggctcg - 32821 gggcccgtcc tgcggaggcc tcgtgagcac cccccgcgac tgggccgaac tcctgcgcgt - 32881 ctccgccctg ctgtccgtgc ccggcgacgc cctcgcgggc gccgcggcca gccgccggcg - 32941 ccccaactcc cgtaccgcgc ttgccttgtg ctcctcgctc tgcctctacg aggcgggcat - 33001 ggcgctcaac gactgggcgg accgcgcgga ggacgccgag gagcgcccgc accgcccgct - 33061 gccctcgggc cgcatcgccc ccggcgccgc gctcgccgcg gcggccgggc tgaccgccgc - 33121 cgggctcggc ctcgccgccc gcgccggacg ccccgccgcg ctgtgcgcca ccgccctcgc - 33181 gggcgccgtc tgggcctacg acctgcgcct gaagcacact gcggccggtc ccgccgcgat - 33241 ggccgccgcg cgcgggctcg acctggtgct cggcgccctc gccaccgcgg gcccgcgctc - 33301 cggcgaggcg gccgggagcg tgctcggccg ggcgctgccg cccgccgcgg tgctcggcgc - 33361 ccacacctgg gcggtgaccg cggtctcccg cgccgagacc cagggcggct cggccggacg - 33421 gccgctcgcc gccctcggca cgacggccgc gctcggcacc ctcctcgccc ccgccggggc - 33481 ccggccgctg cgcctggagc gggcccgcag gctccccgag accccgcggg agctggccca - 33541 ggccgcgctg gccggggcct acgccgccac cgcggggcgg tcctatctgc acgccgcgct - 33601 gaacccctcg ccgccgctga cccagcgggc cgtcggcggc gggatccgcg cgatgatccc - 33661 gctgcaggcg gcgctcgccg cccgctccgg ggccctcgcc accgcggcct cgctcggcgc - 33721 gctggtcccg ctcgcccgca gcctcgcgag gaaggtcagc ccgacatgag catccgactc - 33781 ggctacggca ccaatggact caccgacctg cgcctgcgcg aggccctcac cctgctcgcc - 33841 gaactcggct accagggcgt cggcctgacg ctcgatcaca tgcatctgga cccgctggcg - 33901 cgcgggctga 
gcggccgggc caaggcgctc gcccgcaccc tcggcgcgct cggcctggac - 33961 gtcaccgtgg agaccggcgc ccgctatgtc ctcgacccgc gccgcaagca cgggccgagc - 34021 ctgctcgacc cggacccgga ggcgcgggtg gcccgcgagg cgctcctggt caccgcggtc - 34081 gaggtcgcgg cggaactcgg cgcccacgcc gtgcactgct tcagcggcgt ccggcccgag - 34141 ggcaccgacg agggcacggc ctggcagcgg ctcgccgact ccctcggccc ggtgctcgac - 34201 gcggcgcagc gcgacgggat cccgctcgcc ctggaacccg aacccggcca cctggtcgag - 34261 tcgctggccg acttccaccg gctgcgcgcg ctcctcggcg atcccgaact cctgggcctc - 34321 accctggaca tcgggcactg ccagtgcctg gagcccgcct cgcctgcgga gtgcgtgacc - 34381 gccgcggcgc cctggctgcg gcatgtgcag atcgaggaca tgcggcgcgg ggtgcacgag - 34441 catctgccct tcggcgaggg cgagatcgac ttcccgcccg tgctcgcggc cctggaggcc - 34501 agcggctacc ggggcctgac cgtggtcgaa ctgccgcgcc actcgcacgc cgggcccgaa - 34561 ctcgcccgcc ggtccatgga gttcctgcgc cccctggtcg ccgccgcggc ccgcgaggac - 34621 cgcgccgccg gggcgccgtc gccggtccgc gcccgtcccg taccactgct gaccgggccg - 34681 cccctgcggc aggaagcacc gtcccgtacc tgaggaagca ccatgccgat cactccgatc - 34741 acccctgagg aaccgcgccc cgccccggag cccgcggacg gcaccgaggc cgaactgcgc - 34801 cgagaggccg ccgagttgcg cgagcggctg agcgccgagg gcgccgactg gctggacggg - 34861 gcgctcgccg aggccgcccg ggcggcggcc gagcccgcac ccgcggagtc ccgtgcggtg - 34921 cccggctggg agctgcgctt cgcggcggcg ggccgcgcct gcgggaccga ggccgccgaa - 34981 tccgcccggg tactgctgct gcgcgccgcc cgccccggcc ccgccgccct cacccgcctc - 35041 taccggcacg gcaccggcga ggagcgccgc gccgtgctgc gggccctgcc gcggctgccg - 35101 ctcgcgccgg gggaggggct gccgctggtc gaggacgcgc tgcgcaccaa cgacacccgc - 35161 ctggtcgcgg ccgccgtcgg gccctacgcc gccgcccacc tggacgacca cgcctggcgg - 35221 cacgccgtcc tcaagtgcct gttcacccag gtccccgtgc gggccctggc ccggctgccc - 35281 gagcgggccc gcggcgacgc cgaactcgcc cgcatgctgc gggacttcgc cgccgaacgc - 35341 accgccgccg gacgcgccgt cccggccgac ctcgaccacg tactcgccct gaccgccaag - 35401 gacgcctgat gcgcatcttc gacccgcaca tccatatgac ctcgcgcacc accgacgact - 35461 acgaggcgat gtacgcggcc ggggtgcgcg ccctggtcga gcccgccttc tggctcggcc - 35521 agccccgcac 
ctccccggag agcttcttcg actacttcga cgcgctgctc ggctgggagc - 35581 ccttccgggc cgcgcagtac gggatcgcgc accactgcac cctcgcgctc aacccgaagg - 35641 aggcgaacga cccgcgctgc ctgcccgtcc tcgacgccct cccgcgctac ctggtcaagg - 35701 accatgtggt cgcggtcggc gagatcggct acgacgcgat gaccccggcc gaggacaccg - 35761 cgctcgccgc gcagctcgaa ctcgccgccg agcacggcct gcccgccctg gtgcacaccc - 35821 cgcaccgcga caagctcacc gggctgcgcc gcaccctcga cgtggtcgcc gagtcgaagc - 35881 tgcccaccga gcgggtcctg atcgaccacc tcaacgagac caccgtcaag gaggcccggg - 35941 agagcggcag ttggctcggc ttctccgtct acccggacac caagatggac gagcaccgca - 36001 tggtcgccct gctgaaggag tacggacccg aacgcgtcct ggtcaactcc gccgcggact - 36061 ggggcaagag cgacccgctg aagacccgca aggtcggcga ggccatgctc gccgcgggct - 36121 tcggcgagga cgaggtgcac cgggtgctgt gggagaaccc ggtcgccttc tacgggctca - 36181 gcggccgcct cgacctggag gtccccggca ccgaggccct gcacgagggc aactccctgc - 36241 tgcgcggggg cgaatgagcc gtgcgcttcc gccacccgga cggctccctc gtccacctcg - 36301 cctactgcac caatgtccac cccgccgagg acctggacgg ggtcctcgcc caactgggcg - 36361 cctactgcga gccggtgcgc agacgcctcg gcaccgaacg cctcggcatc ggcctgtggc - 36421 tggcccggga cgccgcccgc gccctgacca ccgaggcctc cgccctgcgc cgcctgcgca - 36481 ccgaactcga ccggcgcggc ctcgaagtgg tcaccctcaa cggcttcccc taccgcggct - 36541 tcggcgccga gaaggtcaag taccgcgtct accagcccga ttggcgggac gccgagcgcc - 36601 tggagtacac cgccgagctg gccgggctgc tcgccgaact gctgccgccg gatgtcaccg - 36661 agggcaccct ctccaccctg ccgctcgcct ggcgcagcga cttcgacgcg gccggtgccg - 36721 ccgcggccga gcggcagctc accgaactgg cccgccgcct ggacgacttg gaggagcgca - 36781 ccggccgctc catccgggtc gccctggagc cggagccggg ctgcgcggtg gagcggaccg - 36841 ccgacgccct cgccccgctc gccgcgctgc ccgcccaccg cttcgggctc tgcctggaca - 36901 cctgccacct ggccacctgc ttcgaggaac cggccgccgc cctcgccgcc ctggagcgcg - 36961 cgggcgccac cgtcccgaag gtgcagctct ccgccgccct gcacgccgag gacccggccg - 37021 acccggcggt acgggccgcg ctcgccgcct tcgacgagcc ccgcttcctg caccagaccc - 37081 gcgccctggc cgagggggtg ctgcacggca ccgacgacct gggcccggcg ctcgcgggcg - 37141 ggacgctgcc 
cgagaccgtg ccctggcgcg cccacttcca cgtaccgctg cacgcgccgc - 37201 ccgccccgcc gctcacctcc acgatggacg tcctgcgtgg ctccctcgat gtgctgctcg - 37261 gtcaagacgc cccgcgcagc cgccacttcg aggtggagac ctacacctgg caggccctgc - 37321 cgcccgaggc gcgaccggcc gacgcggcgc agctcgccga cggtatcgcc gccgaactcg - 37381 ccctcgcccg cggcctcttc cgcgacctcg gcctcaagga gctgccgtga ccgccacccc - 37441 gaccccgctg ctcgtgctcg acgtggtggg cctgacgccc gccctcctgg agcagatgcc - 37501 gcgcctgaag tcccttgccc gcaagggctc ttcggccgga ctcggcaccg tgctgcccgc - 37561 ggtgacctgc gccgcccagt ccaccttcct caccggagcg ccgcccgccg agcacgggat - 37621 cgtcggcaac ggctggtact tccgcgagct gggcgaggtg ctgctctggc gccagcacaa - 37681 cgggctcgtc gcgggcgaca agctctggga cgcggcccgc cgcgcccacc ccggctacac - 37741 ggtcgccaat gtctgctggt ggtacgcgat gggcgcggac accgactgga ccgtcacccc - 37801 gcggccggtg tactacgccg acggccgcaa ggagccggac tgctacaccc gccccgtcga - 37861 gctgcacgac gaactcaccg acgccctcgg caccttcccc ctcttccact tctggggacc - 37921 cggcgccgac ctggtctcca gccggtggat catcgacgcc acccggcacc tcaaccgcac - 37981 ccgccacccg gacctgaccc tctgctacct cccgcacctc gactacgacc tccagcgctt - 38041 cggcccccgc gacccgcgct cgctgcgcgc cgccgccgaa ctcgacgcgg cgctcggccc - 38101 cttgctggac gaggccgagg cggagggccg caccgtggtg gtgctgtccg agtacggcat - 38161 caccgaggtg tcccgccccg tcgacatcaa ccgcgccctg cgccgcgccg ggctcctgga - 38221 ggtgcacacc caggacggca tggagtacct ggacccgatg gcctcccgtg ccttcgcggt - 38281 cgccgaccac cagctcgccc atgtctacgt acggcgcccg gaggacctgg cccgggtgcg - 38341 ggaggtgctc gaagggctcg acggggtcgc cgaactcctc ggcgacgagg gcaagaaggc - 38401 gcacggcctc gaccacccgc gggccgggga actcgtcgcg ctcgcggcgc cggaggcctg - 38461 gttcacgtac tactactggc tggacgacga gcgggcgccg gacttcgcgc agctggtgga - 38521 gatccaccgc aagcccggct acgaccccgc cgaactcttc ctggacccgc tcgaccccta - 38581 tgtgaagctc cgggcggccg gtgcgctggc ccgcaagaag ctcgggatgc gctaccggat - 38641 ggcggtggtc ccgctcgacc cggcgccggt gcgcggcagc cacggcaggc tcccggcccg - 38701 ccccgaggac gggccggtgc tgctctgctc gcgccccggc gccctgccgg gggaggtcgc - 38761 cgccaccgag 
gtcaagtcgc tgctgctcgg gctcgcgggt ctcgccgagg tgcccgccac - 38821 ggggtgaggg ctcagaccgc ggcggcgccc ggccactcgg gggcgagcag cgaccagacc - 38881 tccttgtcgt gccggaagcc gcggttcggg aagtactccc gcagggtgcc gtcgagctgc - 38941 atgcccaccc gctgggcgac cgcgcggctg cgcgcgttgc gggtgctgct gaaccactcg - 39001 acgcggtgca tgccccgctc ggcgaaggcg tagtcgatca ggtgccgcac ggccgcggtg - 39061 atcaagccgt ggccctcgcc cgccggttcg gtccacaccc cgatctcgca gttgccgagc - 39121 cgggtgtcga agtgcacgaa catcaccccg ccgaccaggg tgcccgcccg ccagatcccg - 39181 tagaggcggc cggtgtcggc ggcctgcttg tccgcgtagt cctggagggt ggcccgggcc - 39241 gagtccaggt cggtggagcg ggaggcccag gggatccagg ggtcggtgtg cgggcgggcc - 39301 cggtccatgt gggcgaggaa ctcctcggcc tgccagggtt cgagcgggcg cagcgcggcg - 39361 tcctcggcga gcggtacggc gtacatggcg gtcctcagcg gtcggcgggg gcggacggcc - 39421 cgctccccgg tacataacaa acgttgggta tgtaccctac tcgtatgccg cccgcacgtg - 39481 gagaccatga agcccgccgg agagaggtct ccgaggcggt gtggcaggtg ctcgccgcgc - 39541 ggggcttcgg ggggctgacc ctgcgggccg tggccgcgca gatgggggcc accaccgggc - 39601 tgctcacgca ctacttcccc ggcaagcggg cgctgctcgc gcacgccctg gacgtactgg - 39661 accgccgctc ggccgagcgc ccgcgccccg ccgccgagga ggcgggggag gccgccggtc - 39721 tggtgatgct gcgggcgatg ctgctcgaca tcctgccgct ggacgccgcg agcgcggcca - 39781 gcaaccggat ctgggtcggc tcctgggacg cggcgctcac cgacccggag ctggccgagg - 39841 agcacgccgc ccgctaccgc cgcgcccgcg cgcggatgac cgggtacgtc gcggacgccc - 39901 agcggctcgg cgaactgccg gccggccccg cggccgagga gatcgcggcg gcggcgcaga - 39961 gcttcgtcct cggtcttgtc gtacaggcgc tcttcgcgcc cggggagttc ccgcccgagc - 40021 gccaagtcgc tttgctcgac gcccacttgg cgaaggccgc cgccggggcg gaccgggcgc - 40081 cggggacgcc gccggtcccg gcaggggagt cctgaccggg accggacggg cgcggggcgc - 40141 cgggtgcagt gcgcgcgggc tcagaccggg cgggcctcga tcaccgagat cggggcggcc - 40201 gtctcggtga tcttctccag gcggaagcca ccggcggcga gcacttccgc gtactgcttc - 40261 tcgctgcgct ccttgccgcc gacgagcagc atcagccaca ggtcgaccag cttggccggg - 40321 tgcggcttgt tcggcttgtc gtcgggggtc acgaactcca tgaggaggat ccggccgtcc - 40381 gggtcgatga 
ccttgcggac attgcgcagg atctcgatca cctgctcctc gggccagtcg - 40441 tgcacgatgt gcttgaggag ataggcgtcc ccgcccgcgg gggccgggtc gaagaggccg - 40501 cccttctcca gggtgcagcg gtcggccacg ccctgctcgc gcaggtagtc ggcggcgccg - 40561 ttggtgtcga tccgcgcgtc gaagaggacc ccgcgggcgt ccttcgcctg ctggagcgcg - 40621 gcggcgagca gaccgccgcg ccccgcgccg tagtcgacga tggtgcggaa ccggcggaag - 40681 tcgtaggcgg cgagcagcgg cagggtctcc gtctcggaca tcgcgcccat gcccgcggtg - 40741 aagatctccc cgtactccgg gttggcgtcg atgaactcga aggcgcccat gccgcgcagc - 40801 ttgggcaggc tggcctcgcc ggtgcgcacc gcgtcgacca ggtgcgccca ctcctcccag - 40861 tgggtcgggt gccccatcag caggacggtg gcgcgcatcg actgcggggt gtcggagcgc - 40921 agcgcctgcc ccatcggctt cagcttgaag ctgccgtcgg cgcgctcctc gaagaccgag - 40981 taggtggcga gcaggcgcag cagccggtgc agcgactcgg ggtcggcgcc gacccgctgg - 41041 gccagctggg cggcggtcag cggaccgtcc ttcagctcgt cggcgacctt caactcggcg - 41101 gccacgtaca gggcttgggt gaccatcgag ccctgggaga gttcgagcag cgcgaacggc - 41161 ggcggggcga gcagccgggt cagcttcacc aggccggcgc gcacaccctc cacggcgcgg - 41221 acgactttgg cgggggggag tttgggcatg cgtatcctcc gtggcggtgt cgcggaactc - 41281 gtgcctgcgg gacgtacgga ccgccgcgta cacgggggct gaactggagc cctggcgcag - 41341 gggaaagcct cgaacggagc cgttcgccgg gcggtgcccg ctcaccgaaa ccagcggtgt - 41401 cccgggccga ctgtaggggc gcctcttccc ttgcgccacc gtgtgcagaa agcccgggaa - 41461 ttgcgcaccg gcagttcggc ggagtttccg gtgagcggcc cggtgcgcct tctcgccgag - 41521 ttctcgaccg gggtgtgcaa ccgcgatatt tccgaggtcg cacacttgat ttccgaggtc - 41581 ggacacgtac cgccgcccaa atcccgggaa gagcaggcaa tttcacccgg gacggctgcg - 41641 gccgcgtacg tctatggtga cgccggtcga atgcacgccc cccattccgg gggtgtgcca - 41701 ggaaaaggga gagacatgtc aagagcacac aagccttggg cgggggccct ccttgcggca - 41761 gcggtggtgg cggggctcac ggccaccgcc gcacccagcc aggccgcgca ccgcgcgggc - 41821 cccgaggtcc tcgcgaccaa cctgaacaac ccgcgggaca tcacgctcca ggcggacggt - 41881 tcgatcctcg tcgccgagtc cggcagcggt cccgccacgg cctgtgcgcc gggcacctcc - 41941 tgcctcggct tcaccggctc gatctaccgg gtcaacggca gccagaaggg ccgcgtcgtc - 42001 accgggctgc 
cctccaagct ggaggtccgc gcggacggcg gcgcctcggt cgccggaccc - 42061 aaccaggtcg aggcccgcac cggcggctac accgtctcca gcagcttcgg cggcgacgcc - 42121 gcggaccgca aggcgctggg cgcgggcggc gagaccctcg gcaccctgca catagccaag - 42181 ggcaaggtgc tcggcgacct cgtcgaccac gagacccggc tcgacccgga cggcccgctc - 42241 ggcaacaacg acgtgcactc caacgcgtgg atgttcgccc accacggcaa ggactacctg - 42301 gtcaccgacg cgggcggcaa cgacctgatc cgggtgctcc cggacggcac caccaagacc - 42361 gagttcgtct tcccgaacaa cggcgagaac gagacggtgc ccaccgggat cgtggccgcc - 42421 cccgacggct ccttctacat ctccgacctc agcggccagg ccgcgggcaa gtcccgcatc - 42481 tggcgctacg ttcccggcag cgccccgaag gtcttcgcca ccggtctgac gaacgtcacc - 42541 gacctcgccc tggacggcaa gggcgggctg atcgccctca ccctcaccaa gggctacacg - 42601 gagaccggcc cgctgcccgg cgccctgaac cgcgtcgacc tgaagagcgg caaggcgacc - 42661 gagatcccga ccgccgaccg gctggtcaac tccctcggcc tcgccgtcgg caagggcggc - 42721 gagatctatg tgaccaacaa gacggtgggc accaccggcg aactcctgaa gttccccgcc - 42781 gcgcgccggt gagcaccggc cgccggaact gacaccggcc ggggcgcact tcggccccgg - 42841 ccgatgtcag gatttccccc gccgggtgaa atcccggcag gcccgtctcc ggttccgcac - 42901 agagaacgga caggtcttcc gcgacagcgg ccctcggccg gaaatccggg cgaccatgcg - 42961 gtagggatgt cgcctgcgga tgtcgtgcac ggacatcgtg cacggatgtc gcgtacgtca - 43021 tcgagtacgg cccggagtgc gtatcgccta cggctccgcg ttcggcctcg gagtccggcc - 43081 ggggaatccg cagtcgcaca gcaaaaggga atccggtggg cccgagtacg ctgtggccgc - 43141 tccggtgatc cgcgggaatc cggccttccc ccgcggaagg aagaagtccc ctcgcgcgcc - 43201 ctttccgctc gtattttggg cgtgcgcggc acgtgacacc gcacgcacca tttcgcgtct - 43261 ccgcttttac gccaccgcag gaactcacgc cagagaggga ctcatgacga agatcatcct - 43321 tcccgaggac cgccccgcag gccgccgcgg gttcgagatc gtcctgccca gctccttgac - 43381 cgacggggcc gcctcgctcg tcgaggcgca tgtctccgag gcgatgtccg ggccgccgct - 43441 gcacacccac gcggagtcgg acgagaccta cttcgtcctc ggcggcgcgc tcatcatgat - 43501 catcgacggc aagctcaccg agctgcgcgc cggtggcctc gcccacatca gcaaggacac - 43561 ctcgcacacc tgggccaccc gtcccgacga gggcgcccac ttcctcaccc tgcacctgcc - 43621 gggcggctac 
gagctgtacc acccgaccgc gctccacgcc gagcacgaga agggcggccc - 43681 cctggagcag aaggacctct tcgagctggc ggcccgcttc gactggcgcc tggccggccc - 43741 gcccgagccg caccgcctga ccccgaccgg cgtcctggtc cccgcgggca aggcggacgc - 43801 cgaggcggag gccaccaagg cactcgccac ggcggagtac gaacgcgccc tcgccgcgtc - 43861 catcgaggcc gccgactccg gctcctgagg cgcgagtcgg cggacgggca cggcggaggc - 43921 ggggagcgtc atgggggcgg caccgtgagc gggccggggt ccggcgggcc gggcaccgcc - 43981 gccgtaccgg gcgccgcccc gcccggtgcc gccggggcgc ccgacccccg gcgatggttc - 44041 gccctggtgg tgatcctggt cgccgggttc atggacctgc tcgatgtgac catcgtgaac - 44101 gtggtcctgc cgagcgtcct cgcggacctg gacgccgcct acacgcacgg ggagtggatc - 44161 gtcgccgggt acgtgctcgg cttcgccgcg ctgatgatca ccggcgggcg gctcggcgac - 44221 atcctcggcc gccgcaaggt cttcctcgcc ggggtggccg gattcaccgc ggcctcactg - 44281 ctctgcgggc tcgccgacgg gcccggggcg ctgatcgcgg cccgcttcct gcaaggcgcc - 44341 atggccgggc tgatggtgcc gcagatcctc gcgatcatcc atgtcacctt ccccgccgag - 44401 gagcgcggca aggtcctcgg catctggggc ggcgtactcg gcgccgcctc ggccgcgggc - 44461 ctggtcgccg ggggactgct cgccgaggcg gatccgtacg gactcggctg gcgcgcggtc - 44521 ttcctggtca atgtgccggt cggcgccgcg gccctgctcg ccgcctggtt cctcgtcccg - 44581 gactcccgcg ctcccgagcg gccccggctc gatccgctcg gcgcgctgct gtccgccgcg - 44641 ggcatcctgc tcctggtcta tccgctcacc gaggggcgcg gcctcggctg gccgccgtgg - 44701 accttcctgc tgatgggcgc cgcggtcctg gtgctcgggc tcttcgtgct ccagcagcgc - 44761 gggcgcaccc gggccgacaa ctccccgctg atgtcgctgc gtctgttccg ggcgcgcgcc - 44821 ttctcggcgg ggatggcggt gtgggcgctc ttctggatcg ccctcggcgg cttcttcttc - 44881 atctggaccc tgtacatgca agtggggctc ggctggccgc cgttgcgggc gggactgacc - 44941 agttccgcct tcgcggtggg ctgcgccgcc gggtccggga ccgccgtcga gttcttcacc - 45001 ccgcgcttcg gccgcaaggc cctgctcgcg ggcgccctcc tctgcggcac cggcttcctc - 45061 ggctacgtcc tggtcgccgc ccactacgga cccgccgtcg ccccctggca gatggtcgcc - 45121 ccgctcctcg tcgccggtat cggcttcggg ctggtggtgg cgccgatgat cgacgcggtg - 45181 ctcaccgagg tcccggtgcg cgaggcgggc tcggcctccg gggtcctcgg caccgtgcag - 45241 cagatcggca 
tcgcgctcgg caccgccctc gccggggtgc tcttcttcca gcagctcgac - 45301 cacgacgcgg cgcgtgccgt ggcgcgggcc gcccccgcgc tgcgccagga actcacccgg - 45361 gccgaggtgc ccgccgccga gcgcgagcgg atcctcgacg ccttcgccga ctgcctcgcg - 45421 gaccgcgccg cggcgaccga cccgaccgcc gaacccgcct cctgccgggg cccgttgccc - 45481 tctcccgagg tccgcgcgct ggtgatcggg gccgggcagc gggccaccgc cgacaacttc - 45541 tcccgcacct tcgcgctgac cctcagatgg ggcgcgggca gcatgggcct ggtcttcctc - 45601 ggcctcttcg ccctgccgcg gcgggtggag ttccgggggc tcgacggggg cggtccgggt - 45661 ccggggtccg gaccttccgt gccgggcgcc tcggagggtg gcgctgccgt cggtccgggc - 45721 gccggtccgg cctccggtcc cgggaaggag cgctccgccc ccgcgcggtc cggtggccag - 45781 gacgccggca ctcaccccgc cgggtgatcc ggccgcattc cgtttcccgc gagcccgggg - 45841 cacgccccga tgccgcgcgc cccctcgtcc ccgtaccgcc gcccgtgccg cgcccggtgg - 45901 ggcaaaggcg cgcaccgtac cgtaccggca ccagtcgtgc acacccggca gccggggcat - 45961 tcgccgggag tgggggaagt ctgtccttcg ccggaccatg tccggactgt tctctgacgt - 46021 ttctctgaat ttctgtcagc ggatttgtcc tgaccgacag ttgcccggca acagggcgcg - 46081 aagaattcac ctccggctcg ctgccgcggt ctgttcgcgg gccccgcgag gcggcaggct - 46141 ggggccgcct cgaccgcgta cggcgaggcg ccccacgtcc cccctcacct ccggaggtcc - 46201 ccatgcgccg ccgtcacgtc ctgccgctcg ccgccgccgc gctggcgatg cccgccgctc - 46261 tcctgtcgac cggttccgct tcggccgcac ccgccgacaa gccgcaggtg ctcagctcct - 46321 tcacgcagac cagcgcctcc agctacaacg cctggaacgc cgcccgcaac aaccaggggc - 46381 agtgggccgc ctacggcttc gactggtcca cggactactg cagcacctcg cccgacaacc - 46441 ccttcggctt ccccttcgaa accgcctgtg cgcgccacga cttcggctac cgcaactaca - 46501 aggcgatggg caccttcagc gccaacaagg cccggatcga ctccgccctc tacgaggacc - 46561 tgaagcgggt ctgcagccgc tactccggcg cgaccaagac ctcctgcgac gggctggcct - 46621 ggacctacta ccacgccgtc gacatcttcg gcatcaaggg cttcaagcag ctcgacaagg - 46681 ccgcctga -// diff --git a/tests/unit/data/bigscape/minimal_dataset/JK1_GCF_01/JK1.region01.gbk b/tests/unit/data/bigscape/minimal_dataset/JK1_GCF_01/JK1.region01.gbk deleted file mode 100755 index d7febe529..000000000 --- 
a/tests/unit/data/bigscape/minimal_dataset/JK1_GCF_01/JK1.region01.gbk +++ /dev/null @@ -1,3887 +0,0 @@ -LOCUS Chromosome1 84281 bp DNA linear UNK 14-OCT-2019 -DEFINITION Bacteria strain JK1. -ACCESSION Chromosome1 -VERSION Chromosome1 -KEYWORDS . -SOURCE Bacteria - ORGANISM Bacteria Unclassified. - . -COMMENT ##antiSMASH-Data-START## - Version :: 6.1.1 - Run date :: 2023-02-06 17:22:58 - NOTE: This is a single cluster extracted from a larger record! - Orig. start :: 13276 - Orig. end :: 97557 - ##antiSMASH-Data-END## -FEATURES Location/Qualifiers - CDS 1..690 - /codon_start=1 - /db_xref="UniProtKB/Swiss-Prot:O33341 Putative glutamine - amidotransferase" - /db_xref="UniProtKB/TrEMBL:A0A399CHF0" - /locus_tag="JK1GL000010" - /note="GO_function: GO:0016787 - hydrolase activity" - /product="MULTISPECIES: gamma-glutamyl-gamma-aminobutyrate - hydrolase family protein" - /protein_id="ncbi_JK1GL000010" - /transl_table=11 - /translation="MAVTADATTVNWNIWGDVAVAVLPQPYLDKVTQAGGAPVLLPPLV - EAVESVMERVDALLMSGGADIDPALYGARPGEFVFPPHPARDAAELAALAVAERRGIPV - LGVCRGLQLISITRGGTLDQHLPEHSPAVPGRYEPRTIRVKPDSLLGGALGPSPTVYCH - HHQGIDKLGAGLVATAWSDDGVIEGAEAEDPSAPFLAGLQAHGELGEDTVALFEAFIEA - AKAGPRR" - protocluster 1..84281 - /aStool="rule-based-clusters" - /category="PKS" - /contig_edge="False" - /core_location="[47298:63009]" - /cutoff="20000" - /detection_rule="(t2ks and t2clf)" - /neighbourhood="35000" - /product="T2PKS" - /protocluster_number="1" - /t2pks_malonyl_elongations="8|9 (Score: 1286.8; E-value: - 9.9e-215)" - /t2pks_molecular_weights="acetyl-CoA_8 (Da): 414.403" - /t2pks_molecular_weights="acetyl-CoA_9 (Da): 456.440" - /t2pks_product_classes="angucycline" - /t2pks_starter_units="acetyl-CoA (Score: 0.0; E-value: 0)" - /tool="antismash" - proto_core 34023..49733 - /aStool="rule-based-clusters" - /tool="antismash" - /cutoff="20000" - /detection_rule="(t2ks and t2clf)" - /neighbourhood="35000" - /product="T2PKS" - /protocluster_number="1" - /t2pks_malonyl_elongations="8|9 (Score: 1286.8; 
E-value: - 9.9e-215)" - /t2pks_molecular_weights="acetyl-CoA_8 (Da): 414.403" - /t2pks_molecular_weights="acetyl-CoA_9 (Da): 456.440" - /t2pks_product_classes="angucycline" - /t2pks_starter_units="acetyl-CoA (Score: 0.0; E-value: 0)" - cand_cluster 1..84281 - /SMILES="" - /candidate_cluster_number="1" - /contig_edge="False" - /detection_rules="(t2ks and t2clf)" - /detection_rules="AfsA" - /kind="neighbouring" - /product="T2PKS" - /product="butyrolactone" - /protoclusters="1" - /protoclusters="2" - /tool="antismash" - region 1..84281 - /candidate_cluster_numbers="1" - /candidate_cluster_numbers="2" - /contig_edge="False" - /product="T2PKS" - /product="butyrolactone" - /region_number="1" - /rules="(t2ks and t2clf)" - /rules="AfsA" - /tool="antismash" - mRNA 1..690 - /locus_tag="JK1GL000010" - /note="MULTISPECIES: gamma-glutamyl-gamma-aminobutyrate - hydrolase family protein" - gene 1..690 - /locus_tag="JK1GL000010" - mRNA complement(992..2509) - /locus_tag="JK1GL000012" - /note="MULTISPECIES: NAD(P)-binding protein" - gene complement(992..2509) - /locus_tag="JK1GL000012" - CDS complement(992..2509) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A3R9UBU6" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1050:monooxygenase FAD-binding (Score: 497.4; E-value: - 8.3e-151)" - /gene_functions="biosynthetic-additional (t2pks) OXY - (Score: 492.0; E-value: 4.7e-150)" - /gene_kind="biosynthetic-additional" - /locus_tag="JK1GL000012" - /note="GO_function: GO:0071949 - FAD binding" - /product="MULTISPECIES: NAD(P)-binding protein" - /protein_id="ncbi_JK1GL000012" - /transl_table=11 - /translation="MAKGAIVVGAGPVGLMLAGELRLGGVDVVVYDKLPGPSGESRGVG - FTRRAAEVFEQRGLLERFGDVEWAQGHFGGVRIDFGKLDDNHFSVRGVPQFRTEEILEN - WLKELGVPVLRNHEVTGYRERPDGVVVEYEGPDGHGEDTAQYLVGCDGARSLVRTLAGI - DFKGWGATRGMYMADLVGAGVRQRPIGEKVPGGMVMAFNLENGVDRIVIHDENLRPPED - KSALRFTDIADAWQRMTGESLHHAEVRWISSFTDTTRQAEHYRSGRVFLAGDATHIHMP - AGAQGMSVGVQDAANLGWKLAAAINGWAPEGLLDTFESERHPVGEKLMRNTRAQTRLYL - 
TGDEMEPLRAVMRELVELPEAARHLAGIVSGVDIRYDMGPGDHPLLGLRLAPGHELLLE - DGGRTRVAELLHPARGVLLVTGAADDAARVRGAAAGWDDRVRTVVGEWAEPVTGDRPAA - VLLRPDGHVAWAAPDGVELLGRALERWFGRGRDTAGSRAHAVGAAGV" - mRNA complement(2542..3522) - /locus_tag="JK1GL000011" - /note="MULTISPECIES: alpha/beta hydrolase" - gene complement(2542..3522) - /locus_tag="JK1GL000011" - CDS complement(2542..3522) - /codon_start=1 - /db_xref="COG:COG0596 Pimeloyl-ACP methyl ester - carboxylesterase" - /db_xref="UniProtKB/TrEMBL:A0A399CRL9" - /gene_functions="biosynthetic-additional - (rule-based-clusters) Abhydrolase_6" - /gene_functions="biosynthetic-additional - (rule-based-clusters) PF00561" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1262:haloalkane dehalogenase (Score: 153.4; E-value: - 1.3e-46)" - /gene_kind="biosynthetic-additional" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000011" - /note="GO_function: GO:0003824 - catalytic activity" - /product="MULTISPECIES: alpha/beta hydrolase" - /protein_id="ncbi_JK1GL000011" - /sec_met_domain="Abhydrolase_6 (E-value: 2.5e-15, bitscore: - 56.4, seeds: 455, tool: rule-based-clusters)" - /sec_met_domain="PF00561 (E-value: 3.1e-22, bitscore: 78.2, - seeds: 48, tool: rule-based-clusters)" - /transl_table=11 - /translation="MTLNRRTMLALGTGATALAMTGTATAAHAREHTGSVPSDSELARS - LPGGFRSRCATVNGVRLHYVTGGHGRPLLLVPGWPQTWWAYRKVMPQLARTHRVIAVDL - RGMGGSDKPAGGYDKKTMAADLHALVRHLGHRQVDIAGHDIGAMVAFAFAANHPEATRR - LALLDTPHPDESEYDLRLLYRPGTGTALWWWAVNQLQQLPEQLMCGRMRHVIDWLFAHS - LADQNLVGEADREIYAHAYNSPQAIRAGTGWYQACHQDIADLAGYGRLTMPVLGIGGNF - TYEDLQRKLTAQATDVRMVRASKSVHYLPEEEPEVVAGALLDFFG" - mRNA complement(3561..4397) - /locus_tag="JK1GL000013" - /note="MULTISPECIES: NAD(P)H-binding protein" - gene complement(3561..4397) - /locus_tag="JK1GL000013" - CDS complement(3561..4397) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A454W167" - /gene_functions="other (smcogs) SMCOG1199:NmrA family - protein (Score: 213.1; E-value: 9.8e-65)" - /gene_kind="other" - 
/inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000013" - /product="MULTISPECIES: NAD(P)H-binding protein" - /protein_id="ncbi_JK1GL000013" - /transl_table=11 - /translation="MTVLVTGSRGKVGSLLVQVLHERGVAVRAGSSNPEKLSLPAGTES - VRLALDTPADFAAALDGVDSVFLYAEPAAVDAFVAQAEKAGVEHVVIMSADAVLRPSAA - DDPIAAPHLAVEQALAASSLTSTPLNCGALAGNALPWAWSLKARGAVGLPYPDSHADPV - NERDIAEAACAVLTDPALRGRSYHLTGPQSLTFAEHVAIIAAAAGRDIPVERIPPQVWR - ANKPDFMPDDIADALLKLWAASTAPVPLTDHVEQLTGHPARPFTVWADQHAGAFRA" - mRNA complement(4636..6432) - /locus_tag="JK1GL000014" - /note="MULTISPECIES: monooxygenase" - gene complement(4636..6432) - /locus_tag="JK1GL000014" - CDS complement(4636..6432) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A454W161" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1050:monooxygenase FAD-binding (Score: 497.8; E-value: - 6.2e-151)" - /gene_functions="biosynthetic-additional (t2pks) OXY - (Score: 494.4; E-value: 8.7e-151)" - /gene_kind="biosynthetic-additional" - /locus_tag="JK1GL000014" - /note="GO_function: GO:0071949 - FAD binding" - /product="MULTISPECIES: monooxygenase" - /protein_id="ncbi_JK1GL000014" - /transl_table=11 - /translation="MTAAGSVTAAGSASARRRLEPSPTRLGRRHRPRSAAAAPAPRPPA - GTDTWSHAPPPPPAPPRPGPGPRRGGPLLRGPALRLQRRSIGEVFPGAWLPPRTRERFT - NDLREEYFMAKGAIVVGAGPVGLMLAGELRLGGVDVVVYDKLPAPSGESRGLGFTSRTA - EVLDQRGLLDELGEFRWGRHGHFGGVRIDFTLLEESHFGVMGLAQSRTEQLLGDWTARL - GVPVLRGREVTGFEETEDGVVVRYDGPDGPGEDHAQYLIGCDGGRSTVRRLAGIAFPGD - EATRGMYLADVTGADIRPRPIGERVEGGGMVLSVGLGDGYDRIVIHEPGVRPHHGEGTL - TFTEVADAWQRMTGESIHHGHTRWMTALTNATGLAEQYRSGRVLLAGDAAHDHAPLGAQ - GVSVGLQDAVNLGWKLAATINGWAPDGLLDTYHAERHPLGEQLLRNVHAQSLLYLSGEE - MEPLRAVMRELVRIPDAARYLAGQVSGLHIRYDVGAGEHPLLGLRLPLQRALQRADGTR - VRVAELLHEARGVLIVTGDPSTVHKTAADWSDRVDVVAGTWAEDGGPEAVLLRPDGHVV - WAAPDGGDVTDALTRWFGAAAV" - mRNA complement(6579..8087) - /locus_tag="JK1GL000015" - /note="MULTISPECIES: MFS transporter" - gene complement(6579..8087) - /locus_tag="JK1GL000015" - CDS complement(6579..8087) - /codon_start=1 - 
/db_xref="COG:COG2271 Sugar phosphate permease" - /db_xref="UniProtKB/TrEMBL:Q1RQU5" - /gene_functions="transport (smcogs) SMCOG1005:Drug - resistance transporter, EmrB/QacA (Score: 405.2; E-value: - 4.8e-123)" - /gene_kind="transport" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000015" - /note="GO_component: GO:0005887 - integral component of - plasma membrane; GO_component: GO:0016021 - integral - component of membrane; GO_function: GO:0022857 - - transmembrane transporter activity; GO_process: GO:0055085 - - transmembrane transport" - /product="MULTISPECIES: MFS transporter" - /protein_id="ncbi_JK1GL000015" - /transl_table=11 - /translation="MAASDATTARSASGAGLSPGLILAFVCMGQFMVFTDVSIVNLALP - SIQEGLGMSEVSLNYIVTAYATVLGGFLLLGGRLADTFGRRRLIQIGFVIFALASLTSG - LAENGTMLIASRAVQGFGAALITPAALAILTNTFAEGPERNKALGVWGSLSGIASIVGV - ILGGVLADTWGWEWIFWINVPIGLGAAVLAPRILPESKAEERGKFDTLGAVTLTAGLLL - LIFTLGEATTVGWDTFRTIGSLVGVVALLTAFVVIEAKVASPMMPLRIFRLKTMRVANI - SAVLVFGTFGSLFFFASLFMQQAFGYSPLKAGFAYVPLAFSVAAGAGIASGLVTKMAAR - PVVMMGLTLTVAGLLLMWRAPADGSYVVDLLAPFILLGLGCGMVFVTLQIAAFVGVTDE - DAGVGAGLINTSQEAGGALGLAVVATIAYSGMSTEMAATGGKPELIAEVHEAANHDAFL - SGAMLGTVALLVVTFLMPRGKQSMSSAPAEAGEGPALVKADAEK" - mRNA complement(8210..8947) - /locus_tag="JK1GL000016" - /note="hemerythrin domain-containing protein" - gene complement(8210..8947) - /locus_tag="JK1GL000016" - CDS complement(8210..8947) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A399CNC7" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000016" - /product="hemerythrin domain-containing protein" - /protein_id="ncbi_JK1GL000016" - /transl_table=11 - /translation="MSMSDPAQSPGARMYEEFVAIHAVLRRGTRLVVDAYERLADGHDT - DTATLVDAGRWLLAFTHAHHKAEDDLFWPVLEALYPDARAQLKELSDDHVVLDRRLNAL - ETAIDALDEATQAARATGGTDGARAGAEAARQVHQVLDGHLTAEEAVVEDLFPGVPADD - IDRLREAFVQGSPRFGLHFMFGLLDDPEPARGRDLLTENFPPQLRAAGPRLISQYEAGI - QGLRGGPGDDSGRPVTSAGPRSS" - mRNA complement(9126..10688) - /locus_tag="JK1GL000017" - /note="MFS transporter" - gene 
complement(9126..10688) - /locus_tag="JK1GL000017" - CDS complement(9126..10688) - /codon_start=1 - /db_xref="COG:COG0477 MFS family permease" - /db_xref="UniProtKB/TrEMBL:A0A429NHX3" - /gene_functions="transport (smcogs) SMCOG1005:Drug - resistance transporter, EmrB/QacA (Score: 417.7; E-value: - 7.5e-127)" - /gene_kind="transport" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000017" - /note="GO_component: GO:0005887 - integral component of - plasma membrane; GO_component: GO:0016021 - integral - component of membrane; GO_function: GO:0022857 - - transmembrane transporter activity; GO_process: GO:0055085 - - transmembrane transport" - /product="MFS transporter" - /protein_id="ncbi_JK1GL000017" - /transl_table=11 - /translation="MMTTVEDPASAAQGRPAGTSVRVLLIPLVAAMMLSQLDTMIVGTA - LPTVTAELGGLEHVSWVVTAYTLATAVSTPVWGRLGDVRDRKNVLLAAIVVFLAGSALS - GAAQDMGQLIGFRAVQGLGAGGLMAGVMAIVGELVPPRERGRYQGLISGAMAVAMIGGP - MAGGAVTDHLGWRWAFYLNLPLGALALAMIWRLLRLPRRSRVARVDTLGAALLTVGISA - TVLLTTWGGTRYAWDSAAVVLLAAAAGAALWAFVRRQARTADPIMPLHMFQVRNFTLMS - VIGFLTGFVMFGVLLFLPLYQQAVQGASATNSGLLLLPMLAALIAASLVAGRVTTVSGR - YKVFPVTGGALLCAGAWLLSRMDTSTSRPTAALSMAVLGAGLGCLTQTVTVVAQNSVEL - RDIGAASAAVTLFRTLGSCFGVAVMGTLFNREVLRVTAERAPGVPALDNARLDAQSLER - LEPALHEAYRHATAAGTHVAFLLCAGVGAAVLGAGLLVREVALRRAGQDTARPAVSRAP - GGH" - mRNA complement(10723..11481) - /locus_tag="JK1GL000018" - /note="MULTISPECIES: response regulator transcription - factor" - gene complement(10723..11481) - /locus_tag="JK1GL000018" - CDS complement(10723..11481) - /codon_start=1 - /db_xref="UniProtKB/Swiss-Prot:A0QTK2 DNA-binding response - regulator MtrA" - /db_xref="UniProtKB/TrEMBL:A0A399CJS4" - /gene_functions="regulatory (smcogs) SMCOG1008:response - regulator (Score: 157.2; E-value: 7.8e-48)" - /gene_kind="regulatory" - /locus_tag="JK1GL000018" - /note="GO_function: GO:0003677 - DNA binding; GO_process: - GO:0000160 - phosphorelay signal transduction system; - GO_process: GO:0006355 - regulation of transcription, - 
DNA-templated" - /product="MULTISPECIES: response regulator transcription - factor" - /protein_id="ncbi_JK1GL000018" - /transl_table=11 - /translation="MSAQTLPELRTSTSQLIRLVQDGTAPAPAAPAPGGRRILVVDADV - GPGDSLVTQLRRYGHEPVAVQCGGQALQAHADADLVLLALELPDLDGLEVCRAIRAVSR - VPVVIVTARQSELDCVLGLQAGADDYVTKPYGLRELMARIEAVMRRTHWQPAARRYIRR - GRLHIDVDSREVTVDGSGVALTRKEFDLLCLLASHPDTVIPRKHLLKQVWGDSWSQRTV - DTHVSSLRGKLGGSGWIVTVRGVGFKLGAG" - mRNA complement(11666..12070) - /locus_tag="JK1GL000019" - /note="MULTISPECIES: GNAT family N-acetyltransferase" - gene complement(11666..12070) - /locus_tag="JK1GL000019" - CDS complement(11666..12070) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A454W040" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000019" - /note="GO_function: GO:0008080 - N-acetyltransferase - activity" - /product="MULTISPECIES: GNAT family N-acetyltransferase" - /protein_id="ncbi_JK1GL000019" - /transl_table=11 - /translation="MNWTIERAEGKDLDLDEVLAVYRSSGLGERRPVEDRDRMKAMLTG - ANLVLVARDGDGALIGIARSVSDFSYVTYLSDIAVDGRLQRSGIGRALIDATRKEAPTA - KIVLLSAPAATAYYPHIGFTQHNSAWVLNP" - mRNA complement(12054..13340) - /locus_tag="JK1GL000020" - /note="MULTISPECIES: adenylosuccinate lyase" - gene complement(12054..13340) - /locus_tag="JK1GL000020" - CDS complement(12054..13340) - /EC_number="4.3.2.2" - /codon_start=1 - /db_xref="COG:COG0015 Adenylosuccinate lyase" - /db_xref="UniProtKB/Swiss-Prot:P74384 Adenylosuccinate - lyase" - /db_xref="UniProtKB/TrEMBL:A0A454W043" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1063:argininosuccinate lyase/adenylosuccinate lyase - (Score: 140.4; E-value: 1.5e-42)" - /gene_kind="biosynthetic-additional" - /locus_tag="JK1GL000020" - /note="GO_function: GO:0003824 - catalytic activity; - GO_function: GO:0004018 - N6-(1,2-dicarboxyethyl)AMP - AMP-lyase (fumarate-forming) activity; GO_process: - GO:0009152 - purine ribonucleotide biosynthetic process" - /product="MULTISPECIES: adenylosuccinate lyase" - /protein_id="ncbi_JK1GL000020" - 
/transl_table=11 - /translation="MIPRYTLPEMADLFADQSRYATWVKVEILASEAQAGLGRVPAAAV - EDMRRARVPLAARVAEIEKERDHEVLSFLAAYCEDIPEDSARWVHLGMTSYDLVDTALG - HTLARATDLLLAAARRLRATLVGKALEHWDTVMVGRTHGVHAEPTTFGHKLGVHAFAVD - RSITRLTAAREAVAVGTVSGSVGTYALIDPEVERHVCDALGLGVEPVPSQVVARDRHAQ - LMQAVAALGACIEQIALELRLLQRTEVREVEEHRTGAYQGSSAMPHKRNPTTSERLCGL - ARLLRGYADTALENVALWHERDLAHQSVERVILPDSLSVGHFQTVMAADLINSLTVRPE - RMRAHIDTTDGLIHSSAVLADLLARGVERERAYRGVQAAADHTLATGEHFAAGLAREGI - DVESLEPERFLTRHDVIRTRLETLRELDD" - mRNA complement(13437..14957) - /locus_tag="JK1GL000021" - /note="MULTISPECIES: glutamine synthetase" - gene complement(13437..14957) - /locus_tag="JK1GL000021" - CDS complement(13437..14957) - /EC_number="6.3.1.2" - /codon_start=1 - /db_xref="COG:COG0174 Glutamine synthetase" - /db_xref="UniProtKB/TrEMBL:A0A429NHX7" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000021" - /note="GO_function: GO:0003824 - catalytic activity; - GO_function: GO:0004356 - glutamate-ammonia ligase - activity; GO_process: GO:0006542 - glutamine biosynthetic - process; GO_process: GO:0006807 - nitrogen compound - metabolic process" - /product="MULTISPECIES: glutamine synthetase" - /protein_id="ncbi_JK1GL000021" - /transl_table=11 - /translation="MYARSWSSPAPDGSVGRPSFVTDHGLWDDERVAAAERVEAALDEV - DFVRLVFGDPHGLARSKTLTADAFRSVLRNGMNFSPGPFLFDTGHAVAVDFLGDHGIGV - DEIAGAGNFVLVPDPVTFQVLPERGPRTAWVLGDEYLRDGTPHPLSSRAVLRRVVNRYA - ALGLQPVLGLEVEWYLTRRLDDEPGNQGNGFGLQGQAPRVTAVNAGYQFNLDAAYDTVA - PITGPLGLHLRKLGLPLRSMEHESGPGQVETTFSPMTALDTADAMLLFRTVTKRFCARR - GHHASFMSQPRLDAADPSGWHLNQSVVDLATGRNLFSAEGLSGGLSPNGKAYAEGLLTW - ARELFLLSVPTVNGYRRLAAEHALAPTRLGWSFEDRTAMLRVVGSGAGAHIENRVGEPC - ANPYLNIAAQLFAGLEGLTAQPADPQTAPRGEAPTETQPQTVPQTLAEALDAFRTGRAD - QLLGAPLAACMTKLKESELGRFTAWSSQTAPAPGQVTDWEQREYFGVY" - mRNA complement(14962..16371) - /locus_tag="JK1GL000022" - /note="MULTISPECIES: amidase" - gene complement(14962..16371) - /locus_tag="JK1GL000022" - CDS complement(14962..16371) - /EC_number="6.3.5.6" - /EC_number="6.3.5.7" - 
/codon_start=1 - /db_xref="COG:COG0154 Asp-tRNAAsn/Glu-tRNAGln - amidotransferase A subunit or related amidase" - /db_xref="UniProtKB/TrEMBL:A0A429NHY2" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1105:amidase (Score: 416.1; E-value: 3.3e-126)" - /gene_kind="biosynthetic-additional" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000022" - /note="GO_function: GO:0004040 - amidase activity" - /product="MULTISPECIES: amidase" - /protein_id="ncbi_JK1GL000022" - /transl_table=11 - /translation="MTARGIRRTKELLSRRELTVVEHVQDVLAAVRERDHLGAYVAVAG - DEAIRAAARADELIRDRGREAWWDLPLLGVTVSVKDLLQTRDLPTTRGSLLPNGRPAQD - APAVARLRAAGAIVVGKTTTSEFGWSASTVGRLAPPTRNPYDPSRSAGGSSGGAAASVA - AGLCEGALGTDGSGSIRIPAAFCGVVGYKPSFGRVPYYPNGADRLAHQGPIAATVADAA - LLGQVIAGPHPTDPDSGLGSLDSPRDMRSLRIGWIEYEGTDPEIRRVTEAARDVLLDEG - HLVEEVQVRCHNLYPAVVDILAATEAAGTRPEDEELIDPGRLHVVRHGRTLSGVAVIQA - EEIRQNLRATLRSVMDDYDLLAMATVPVEPFDAGAIGPDWAADVRDLLWLAWAPASYPY - NMTGQPAASLPAGLTSSGLPAGVQLVGPVGADDLVLTVARRLEAMLPPLPQPPAAPPVA - ASTGTTGERTF" - mRNA complement(16491..18431) - /locus_tag="JK1GL000023" - /note="hypothetical protein" - gene complement(16491..18431) - /locus_tag="JK1GL000023" - CDS complement(16491..18431) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A3R9U297" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000023" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000023" - /transl_table=11 - /translation="MPERGESRRAANARKRISRRPSRLGLVAGATLKPDRVREADAGFP - GLLKRVWRRAEQTEDLRSFVEVLLTLDGHVPADVQLRALSAAEEAALAALCGLSWRATA - TAAPAARGDAAPATAAPGDGTSGDAEETVFSGEIALATSGRIVLRVPSAAPLKADGLVG - GVRRVPWTRATLDAYRAQLRRAEDRVARTVADCRGWLAEQGAEGRGELLEQAKEAALRT - APFVLYQQGRQYTNFRDHNTLTGKTLWPGHPDCALSSLQDLPLELWSDHDVQLVVCLTL - LIRSAGPGRVEEANGTQLTVDHVAHMLERIRVGYNAALGRDQVPPAASATVADLHELAV - SLRSHRGEVAREAQLYREIHGALMHKIEKVAGPCADLARAREDAVTARLTSRLPLRGDN - LAELGEALAAAPGWLAAPHGDFATGLEALVYESAAAATEAFEADFAMSRGMRSLPDLIT - ALREERWAEICDWEITRFFCCVVPDPSAARHFGDSTAALADAAWAMSSRMQYNSWHFIA - 
GNLPKAPEVVDRDHFVPPTIPDVAFYSDQHHHGHVNNNVRFSIRSPQSVVVDGRRFNGF - VDLRLLRCDGAPFGEQDLLAAHRVSAFTARATGLVAELAAAGEQIEVTAFDSPWHWSAV - TGGADPATRAS" - mRNA complement(18440..18766) - /locus_tag="JK1GL000024" - /note="MULTISPECIES: 4Fe-4S ferredoxin" - gene complement(18440..18766) - /locus_tag="JK1GL000024" - CDS complement(18440..18766) - /EC_number="7.2.1.2" - /codon_start=1 - /db_xref="COG:COG1149 MinD superfamily P-loop ATPase, - contains an inserted ferredoxin domain" - /db_xref="UniProtKB/TrEMBL:A0A399CKM6" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000024" - /product="MULTISPECIES: 4Fe-4S ferredoxin" - /protein_id="ncbi_JK1GL000024" - /transl_table=11 - /translation="MKKIASSAALSGRVERIAQRDRPDNWKKPPRRIEKSECITCDTCL - RSCPAEFGAIFDRGLDVVIIPELCSGCPACVLECPVDCIYVDEDWTPTDDAMWNHIELT - AKGA" - mRNA complement(18897..20342) - /locus_tag="JK1GL000025" - /note="alkaline phosphatase family protein" - gene complement(18897..20342) - /locus_tag="JK1GL000025" - CDS complement(18897..20342) - /codon_start=1 - /db_xref="COG:COG1524 Predicted pyrophosphatase or - phosphodiesterase, AlkP superfamily" - /db_xref="UniProtKB/TrEMBL:A0A429NFG1" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000025" - /note="GO_function: GO:0003824 - catalytic activity" - /product="alkaline phosphatase family protein" - /protein_id="ncbi_JK1GL000025" - /transl_table=11 - /translation="MTPTTSSGGPVPLLVLDVVGLTPRLLDHMPHLKRLGQSGSRAPLG - TVLPAVTCAAQSTFLTGTYPSEHGIVGNGWYFRELGDVLLWRQHNGLVTGDKLWDAARR - AHPGYSVANICWWYAMGADTDITVTPRPVYYADGRKEPDCYTRPAALHDELTDRLGTFP - LFHFWGPGADLVSSQWIIDATRHIMHTRHPDLTLCYLPHLDYDLQRYGPDDPRSHKAAT - DLDTALAPLLDDARAEGRTVVALSEYGITPVSRPVDINRALRRAGLLEVHTQDGMEYLD - PMASRAFAVADHQIAHVYVRRPEDLDATRAALDGLPGIETLLDDEGKKAHHLDHPRAGE - LVAVAEPDAWFTYYYWLDDARAPDFAQLVEIHRKPGYDPVELFMDPLDPYVKVKAATAL - ARKKLGMRYRMAVVPLDASPVRGSHGRLPASDDDGPLLICSIPRAVGDRVAATDVKQLL - LRLAGLESAAAREEPRPRTGTTV" - mRNA complement(20339..21514) - /locus_tag="JK1GL000026" - /note="TIM barrel protein" - gene 
complement(20339..21514) - /locus_tag="JK1GL000026" - CDS complement(20339..21514) - /codon_start=1 - /db_xref="COG:COG1082 Sugar phosphate isomerase/epimerase" - /db_xref="UniProtKB/TrEMBL:A0A399CJC3" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000026" - /note="GO_function: GO:0008270 - zinc ion binding" - /product="TIM barrel protein" - /protein_id="ncbi_JK1GL000026" - /transl_table=11 - /translation="MRFRHPDGSTVHLAYCTNVHPAETLDGVLAQLRDHCEPVRRRLGR - DRLGIGLWLAKDAAHALATDPSALRGLRTELDRRGLEVVTLNGFPYEGFGAEEVKYRVY - KPDWADPERLEHTTSLARVLAGLLPDDVTDGSISTLPLAWRTAWDETRADKARAALATL - GERLDALHELTGRSIRIGLEPEPGCVVETTHDAIAPLGAIGHDRIGICVDTCHLATSFE - DPHTALDALTAARVPVVKSQLSAALHAEHPSRPEVRDALAAFAEPRFLHQTRTTAATAG - LRGTDDLDEALAGGGPLPDTAPWRAHFHVPLHADPAAPLTSTLPVLKSALSRLVGGARP - LTRHLEVETYTWQALPAQLRPRGRAQLTDGIAAELMLARDLLTDLGLKELP" - mRNA complement(21518..22393) - /locus_tag="JK1GL000027" - /note="MULTISPECIES: hydrolase TatD" - gene complement(21518..22393) - /locus_tag="JK1GL000027" - CDS complement(21518..22393) - /codon_start=1 - /db_xref="COG:COG1099 Predicted metal-dependent hydrolase, - TIM-barrel fold" - /db_xref="UniProtKB/TrEMBL:A0A399CKK9" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000027" - /note="GO_function: GO:0016788 - hydrolase activity, acting - on ester bonds" - /product="MULTISPECIES: hydrolase TatD" - /protein_id="ncbi_JK1GL000027" - /transl_table=11 - /translation="MRIFDPHIHMTSRTTDDYEAMHAAGVRAVVEPAFWLGQPRTSPAS - FCDYFDALLGWEPFRAAQYGIAHHCTIALNPKEANDPRCTPVLAELPRYLVKDRVVAVG - EIGYDSMTPAEDTALAAQLQLAADHGLPALVHTPHRDKLAGLRRTLDVVRESALPTDRV - LVDHLNETTVKEAKDSGAWLGFSVYPDTKMDEARMVALLREYGPEKVLVNSAADWGRSD - PLKTRKVGDLMLEEGFGEDDVDRVLWRNPVAFYGLSGRLDLDVTATAPTHEGNSVLRGA - PAAEPLPTGA" - mRNA complement(22395..22994) - /locus_tag="JK1GL000028" - /note="MULTISPECIES: sugar phosphate isomerase" - gene complement(22395..22994) - /locus_tag="JK1GL000028" - CDS complement(22395..22994) - /codon_start=1 - /db_xref="COG:COG1082 Sugar phosphate 
isomerase/epimerase" - /db_xref="UniProtKB/TrEMBL:A0A399CHG5" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000028" - /product="MULTISPECIES: sugar phosphate isomerase" - /protein_id="ncbi_JK1GL000028" - /transl_table=11 - /translation="MTVVHTPPDADLPGEFAGLGTDARRWLTAARASATARDTDWELRF - AEAGRRCGTEHADAARVLLLAAARPDAETVTLLYHRGTAAERRAVLLALDGLDTEPAHA - LPLVEDALRANDTTLLAAALGPYAARHLDAHQWRHAVLKCLFTGVPVATVANLAARARA - DAELARMLRAYAAERTAAHRDIPADLDRVLALTQEQ" - mRNA complement(22991..23836) - /locus_tag="JK1GL000029" - /note="MULTISPECIES: TIM barrel protein" - gene complement(22991..23836) - /locus_tag="JK1GL000029" - CDS complement(22991..23836) - /codon_start=1 - /db_xref="COG:COG1082 Sugar phosphate isomerase/epimerase" - /db_xref="UniProtKB/TrEMBL:A0A454W1I9" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000029" - /product="MULTISPECIES: TIM barrel protein" - /protein_id="ncbi_JK1GL000029" - /transl_table=11 - /translation="MSPLRLGYGTNGLTDLRLEDALRLLADLGYDGVGLTLDHMHLDPL - APDLAARTRHVARQLHRLGLAVTVETGARYVLDPRRKHGPSLLDDDPDARWARVRLLIR - SVRVAADLGAHAVHCFSGPRPAGLDQDTAWKRLADALGPVLDAAEDTGVPLAVEPEPGH - LLATLTDFHRLRTELGDPEPLGLTLDIGHCQCLEPLPPADCVRAAAPWLRHVQIEDMRR - GVHEHLPFGDGEIDFPPVLDALAATGYQGLTVVELPRHSHAGPELAAQSMRFLRNGGTR - " - mRNA complement(23833..24789) - /locus_tag="JK1GL000030" - /note="prenyltransferase UbiA" - gene complement(23833..24789) - /locus_tag="JK1GL000030" - CDS complement(23833..24789) - /EC_number="2.5.1.39" - /codon_start=1 - /db_xref="COG:COG0382 4-hydroxybenzoate - polyprenyltransferase" - /db_xref="UniProtKB/TrEMBL:A0A454W1H9" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000030" - /note="GO_component: GO:0016021 - integral component of - membrane; GO_function: GO:0016765 - transferase activity, - transferring alkyl or aryl (other than methyl) groups" - /product="prenyltransferase UbiA" - /protein_id="ncbi_JK1GL000030" - /transl_table=11 - /translation="MSAQRPAHGPARDGHLHAWAELLRAPAAFTVPGDVLAGTAAAGTR - 
PTGRTALAAGASLCLYEAGMALNDWADREEDATARPHRPLPSGRVRPGAALAAAGLLSA - AGLALAACAGRRALAVAGPLAATVWAYDLGLKHTPAGPAAMAAARSLDLLLGAAAGPGA - VRRAIVPAAFLGSHTLAVSLVSRRETEGGSSTAPLTALAAAGALTTVLAGRPTAHPAPD - ASTGAPTPATPPADKAARAVRAALAASYAATFARPLAHAALNPSPELTQRAVGAGVRAT - IALQSGLMARAGAPGTGVLTAALAPLAAHLARKVSTT" - mRNA complement(24786..25901) - /locus_tag="JK1GL000031" - /note="MULTISPECIES: myo-inositol-1-phosphate synthase" - gene complement(24786..25901) - /locus_tag="JK1GL000031" - CDS complement(24786..25901) - /EC_number="5.5.1.4" - /codon_start=1 - /db_xref="COG:COG1260 Myo-inositol-1-phosphate synthase" - /db_xref="UniProtKB/TrEMBL:A0A454W1J4" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000031" - /note="GO_function: GO:0004512 - inositol-3-phosphate - synthase activity; GO_process: GO:0006021 - inositol - biosynthetic process; GO_process: GO:0008654 - phospholipid - biosynthetic process" - /product="MULTISPECIES: myo-inositol-1-phosphate synthase" - /protein_id="ncbi_JK1GL000031" - /transl_table=11 - /translation="MTSADETRTGVWLVGARGSVATTAVSGCAALAAGLLPPTGMVTET - PPFADCGLPALASLVFGGHDTATTPLPKRAEELAAQGVLPPWLPTAVQGELAAADEHIR - PGGPVPGDRRATEELIADFATDLRTFARTTGVARTVVVNVASTEPDPAHGAWPASSLYA - AAALRAGCPYVNFTPSTGLSHPQLAGAARASGLPYAGRDGKTGQTLLRSVLGPMFAQRA - LAVRAWSGTNLLGGGDGAALADPAAAAAKNAGKERVLTDTLGTRVEGEVHIDDVPALGD - WKTAWDHVAFDGFLGTRMVLQTIWQGCDSALAAPLVLDLARLLARAHERGLSGPLGELG - FYFKDPDAEGSALAEQYTRLLTLAGRLGGTR" - mRNA complement(26152..27273) - /locus_tag="JK1GL000032" - /note="ScyD/ScyE family protein" - gene complement(26152..27273) - /locus_tag="JK1GL000032" - CDS complement(26152..27273) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A429NH62" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000032" - /product="ScyD/ScyE family protein" - /protein_id="ncbi_JK1GL000032" - /transl_table=11 - /translation="MANSRNSWTKILLAAGAAGAVAVPLTAGPVQAQPQAHRHGHTHTH - TRTEATVTVVASQLNNPRGVTALGDGGVLVAEAGAGLADCPVDQTCVGTTGSVYKVKGS - 
FQGRVATGLASTAKGVAPGAPISANGPSDVVPDRFGGYVVVSGLGGTTESRAALGEGAQ - TLGTVFRTRDHKVLADLTDHETRLNPDGGDVHANPWRLTRSGSGYLATDAGANTVVRGN - ADGTTATEYLLPKNELPTGAAETVPTGIAKAADGTVYVADMSGGRVGASRVWKIAPGQQ - PEILATGMTNLIDLDLDRDGDLIALSYSAAALAGPPQPGALFEIDADSGAVTEIPTGDQ - LKQPTGVAVDPCGKVYVTNNTLGTNGQLVRVNR" - mRNA 27631..28602 - /locus_tag="JK1GL000033" - /note="MULTISPECIES: hydroxyneurosporene methyltransferase" - gene 27631..28602 - /locus_tag="JK1GL000033" - CDS 27631..28602 - /codon_start=1 - /db_xref="COG:COG1414 DNA-binding transcriptional - regulator, IclR family" - /db_xref="UniProtKB/TrEMBL:A0A399CND7" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1042:O-methyltransferase (Score: 322.9; E-value: - 4e-98)" - /gene_functions="biosynthetic-additional (t2pks) MET - (Score: 266.1; E-value: 1e-81)" - /gene_kind="biosynthetic-additional" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000033" - /note="GO_function: GO:0008168 - methyltransferase - activity; GO_function: GO:0008171 - O-methyltransferase - activity" - /product="MULTISPECIES: hydroxyneurosporene - methyltransferase" - /protein_id="ncbi_JK1GL000033" - /transl_table=11 - /translation="MGVMVTRAVHVAAELKVAEALAEGPLSADELAGRVGADADALGRV - LRLLASNGVFATRPDGAFELTPMADALRADHPMSMRGIALLMGHPIHWEDWSGFPETVV - TGEPALPKLRGMHAFEFLTKNAEYGQVFFQGMGSMSASETEPILAAYDFSQFGTVVDFC - GGQGALLAGILGAAPGCEGVLFDPRVEENGAAEFLAAQGVADRTKRVAGDLFDVPPGGA - DAYVLKHIVHDWPEEQALRILRNVRAAIKPGGKLLIAEMVIPEQGDQPHSGKLVDLWLM - LLVGGRERTPGQYADLLARAGFRLERVVETAAAISLVEAVPV" - mRNA complement(28804..30318) - /locus_tag="JK1GL000034" - /note="FAD-binding protein" - gene complement(28804..30318) - /locus_tag="JK1GL000034" - CDS complement(28804..30318) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A399CJT3" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1050:monooxygenase FAD-binding (Score: 551.4; E-value: - 3.7e-167)" - /gene_functions="biosynthetic-additional (t2pks) OXY - (Score: 570.9; E-value: 5.2e-174)" - 
/gene_kind="biosynthetic-additional" - /locus_tag="JK1GL000034" - /note="GO_function: GO:0071949 - FAD binding" - /product="FAD-binding protein" - /protein_id="ncbi_JK1GL000034" - /transl_table=11 - /translation="MEGTAADTDVIVVGAGPTGLMLAGELRLGGARVVVIEKLAAPTGQ - SRGLGFTARAMETFDERGLLPRFGQGETLATSPVGHFGGAQFDFTVLEDAHFGARGIPQ - GDTEAVLEGWAGELGADIRRGWEFVSLTDGFLDGDGVEITVRTPQGEERTLRASYLAGC - DGGSSRVRRAAGFDFLGTDATQGMYLADITGVELTPRFLGERLNNGMVMAAPLSQGVWR - IIVCPDGRPAHDRERTVTFEEVAAAWQDITGEDISHGGASWVSSFTNATRQASEYRRGR - VFLAGDAAHIHLPAGGQGLSTGVQDAANLGWKLASVIRGDAPRELLDTYHAERHPVGAR - LLMNTRAQGIVFLGGAESDPLRELMAELVRYDDVKRHLAGIVSHLDIRYDLADTATGPT - HPLLGRRMPPRLLVGADGETRIARLLHAGHGVLLDLADDETVRATAAGHADRVDVVTAV - AKPTDGPDALAGATAVLIRPDGYVAWTGTCAQGLETALERWFGPPR" - mRNA complement(30421..31896) - /locus_tag="JK1GL000035" - /note="FAD-dependent oxidoreductase" - gene complement(30421..31896) - /locus_tag="JK1GL000035" - CDS complement(30421..31896) - /codon_start=1 - /db_xref="UniProtKB/Swiss-Prot:Q5YTV5 Rifampicin - monooxygenase" - /db_xref="UniProtKB/TrEMBL:A0A3R9U1U9" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1050:monooxygenase FAD-binding (Score: 556.6; E-value: - 9.8e-169)" - /gene_functions="biosynthetic-additional (t2pks) OXY - (Score: 585.0; E-value: 2.9e-178)" - /gene_kind="biosynthetic-additional" - /locus_tag="JK1GL000035" - /note="GO_function: GO:0071949 - FAD binding" - /product="FAD-dependent oxidoreductase" - /protein_id="ncbi_JK1GL000035" - /transl_table=11 - /translation="MAADALTTDVVVVGAGPVGMMLAGELAHGGVGVVVVEKRRAPSTE - SRASTLHARTMEILDSRSLLPEFGDPPNEPRGHFGGIPLDLTLPSSHPGQWKVPQTRTE - VILGEWALSLGAELQCKHELTALDDSGDLVEAEAAGPDGRTLRLRCRYLVACDGEESTV - RRLIGADFPGRDATRELLRADVAGIDIPGRRFERLEHGLAIAARRPDGVTRVMVHEFGS - AARARPHGDVSFEEITAVWKRVTGEDISGGTPLWANAFGDASRQLTRYRHGRVLFAGDA - AHRQMPVGGQALNLGMQDAFNLGWKLALVVRGKAPQTLLDSYHDERHEVGRQVLANIRA - QSLLLLGGPEVEPLRDLLTELIGQEDVRRRLAGMISGLDVRYDVGGPAHPLLGARLPCT - EVRARRRLLTTTQLVRSGGGVLLDLTGRPGRPPAVLDGWADRVTALDAQPSPGSSLQGT - 
DRVLVRPDGHVAWAGPGTDGLAEALTRWFGPPR" - mRNA complement(31900..32844) - /locus_tag="JK1GL000036" - /note="cyclase" - gene complement(31900..32844) - /locus_tag="JK1GL000036" - CDS complement(31900..32844) - /EC_number="4.2.1.-" - /NRPS_PKS="Domain: Polyketide_cyc2 (4-146). E-value: - 2.2e-16. Score: 52.4. Matches aSDomain: - nrpspksdomains_JK1GL000036_Polyketide_cyc2.1" - /NRPS_PKS="Domain: Polyketide_cyc2 (157-310). E-value: - 2.8e-09. Score: 29.3. Matches aSDomain: - nrpspksdomains_JK1GL000036_Polyketide_cyc2.2" - /NRPS_PKS="type: other" - /codon_start=1 - /db_xref="UniProtKB/Swiss-Prot:P41178 hypothetical protein" - /db_xref="UniProtKB/TrEMBL:A0A399CFS4" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1128:cyclase/dehydrase (Score: 454.2; E-value: - 3.6e-138)" - /gene_functions="biosynthetic-additional (t2pks) CYC C7-C12 - (Score: 472.7; E-value: 9.4e-145)" - /gene_kind="biosynthetic-additional" - /locus_tag="JK1GL000036" - /product="cyclase" - /protein_id="ncbi_JK1GL000036" - /transl_table=11 - /translation="MTTREVEHEITIGAPADAVYQLLADVTNWPRIFPPTIHVDRTEAD - GDHERIHIWATANGQAKEWTSRRTLDRENLTITFRQEIPAAPVKHMGGTWIIEPLADDR - SRVRLLHDYSAVGDDPHDLLWIEQAVDKNSTSELAALKVNVEAAHAAATEELTFSFTDT - VHIDGAAKDVFDFINEAQLWAERLPHVAVVRLSEDTPGLQELEMDTRAKDGSVHTTKSY - RVVFPHHKIAYKQVTLPALMTLHTGEWTFTEGDEATTASSQHTVTLNTANIARILGQDA - TVADARAYVHTALSTNSRATLAHAKAYAEQKKG" - aSDomain complement(31915..32373) - /aSDomain="Polyketide_cyc" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_JK1GL000036_Polyketide_cyc2.2" - /domain_subtype="Polyketide_cyc2" - /evalue="2.80E-09" - /label="JK1GL000036_Polyketide_cyc2.2" - /locus_tag="JK1GL000036" - /protein_end="310" - /protein_start="157" - /score="29.3" - /tool="antismash" - /translation="FSFTDTVHIDGAAKDVFDFINEAQLWAERLPHVAVVRLSEDTPGL - QELEMDTRAKDGSVHTTKSYRVVFPHHKIAYKQVTLPALMTLHTGEWTFTEGDEATTAS - SQHTVTLNTANIARILGQDATVADARAYVHTALSTNSRATLAHAKAYAE" - aSModule 31915..32832 - 
/domains="nrpspksdomains_JK1GL000036_Polyketide_cyc2.1" - /domains="nrpspksdomains_JK1GL000036_Polyketide_cyc2.2" - /incomplete - /locus_tags="JK1GL000036" - /tool="antismash" - /type="unknown" - aSDomain complement(32407..32832) - /aSDomain="Polyketide_cyc" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_JK1GL000036_Polyketide_cyc2.1" - /domain_subtype="Polyketide_cyc2" - /evalue="2.20E-16" - /label="JK1GL000036_Polyketide_cyc2.1" - /locus_tag="JK1GL000036" - /protein_end="146" - /protein_start="4" - /score="52.4" - /tool="antismash" - /translation="EVEHEITIGAPADAVYQLLADVTNWPRIFPPTIHVDRTEADGDHE - RIHIWATANGQAKEWTSRRTLDRENLTITFRQEIPAAPVKHMGGTWIIEPLADDRSRVR - LLHDYSAVGDDPHDLLWIEQAVDKNSTSELAALKVNVE" - mRNA complement(32884..33672) - /locus_tag="JK1GL000037" - /note="MULTISPECIES: SDR family NAD(P)-dependent - oxidoreductase" - gene complement(32884..33672) - /locus_tag="JK1GL000037" - CDS complement(32884..33672) - /EC_number="1.1.1.-" - /NRPS_PKS="Domain: PKS_KR (8-164). E-value: 7.1e-11. Score: - 34.2. 
Matches aSDomain: - nrpspksdomains_JK1GL000037_PKS_KR.1" - /NRPS_PKS="type: other" - /codon_start=1 - /db_xref="UniProtKB/Swiss-Prot:P41177 Monensin polyketide - synthase putative ketoacyl reductase" - /db_xref="UniProtKB/TrEMBL:A0A3R9UGD4" - /gene_functions="biosynthetic-additional - (rule-based-clusters) adh_short" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1001:short-chain dehydrogenase/reductase SDR (Score: - 259.1; E-value: 6.8e-79)" - /gene_functions="biosynthetic-additional (t2pks) KR C9 - (Score: 472.0; E-value: 1.1e-144)" - /gene_kind="biosynthetic-additional" - /locus_tag="JK1GL000037" - /note="GO_function: GO:0016491 - oxidoreductase activity" - /product="MULTISPECIES: SDR family NAD(P)-dependent - oxidoreductase" - /protein_id="ncbi_JK1GL000037" - /sec_met_domain="adh_short (E-value: 1.4e-33, bitscore: - 115.1, seeds: 230, tool: rule-based-clusters)" - /transl_table=11 - /translation="MTDTTTQRVAVVTGATSGIGLASARLLGRQGHQVFIGARNAENVA - ATVKELQGEGIDADGTVVDVRDTESVNAWIQAAVDRFGSVDVVVNNAGRSGGGPTADIA - DELWDDVIDTNLNSVFRVTRAALTIGGLRAKDRGRIINVASTAGKQGVVLGAPYSASKH - GVVGFTKALGNELAPTGITVNAVCPGYVETPMAQRVRQGYAAAYDTSEDAILEKFQAKI - PLGRYSTPEEVAGLVGYLASDTAASITSQALNVCGGLGNF" - aSDomain complement(33181..33648) - /aSDomain="PKS_KR" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_JK1GL000037_PKS_KR.1" - /evalue="7.10E-11" - /label="JK1GL000037_PKS_KR.1" - /locus_tag="JK1GL000037" - /protein_end="164" - /protein_start="8" - /score="34.2" - /specificity="KR activity: inactive" - /specificity="KR stereochemistry: C1" - /tool="antismash" - /translation="VAVVTGATSGIGLASARLLGRQGHQVFIGARNAENVAATVKELQG - EGIDADGTVVDVRDTESVNAWIQAAVDRFGSVDVVVNNAGRSGGGPTADIADELWDDVI - DTNLNSVFRVTRAALTIGGLRAKDRGRIINVASTAGKQGVVLGAPYSASKHG" - CDS_motif complement(33580..33642) - /aSTool="nrps_pks_domains" - /database="abmotifs" - /detection="hmmscan" - /domain_id="nrpspksmotif_JK1GL000037_0001" - /evalue="6.00E-05" - 
/label="PKSI-KR_m1" - /locus_tag="JK1GL000037" - /protein_end="31" - /protein_start="10" - /score="15.7" - /tool="antismash" - /translation="VVTGATSGIGLASARLLGRQG" - mRNA complement(33685..33954) - /locus_tag="JK1GL000038" - /note="MULTISPECIES: acyl carrier protein" - gene complement(33685..33954) - /locus_tag="JK1GL000038" - CDS complement(33685..33954) - /NRPS_PKS="Domain: ACP (12-83). E-value: 9.1e-13. Score: - 40.2. Matches aSDomain: nrpspksdomains_JK1GL000038_ACP.1" - /NRPS_PKS="type: other" - /codon_start=1 - /db_xref="COG:COG0236 Acyl carrier protein" - /db_xref="UniProtKB/Swiss-Prot:P41174 Monensin polyketide - synthase acyl carrier protein" - /db_xref="UniProtKB/TrEMBL:A0A399CG47" - /gene_functions="biosynthetic-additional - (rule-based-clusters) PP-binding" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1129:acyl carrier protein (Score: 114.7; E-value: - 2.6e-35)" - /gene_functions="biosynthetic-additional (t2pks) ACP - (Score: 127.3; E-value: 3.8e-40)" - /gene_kind="biosynthetic-additional" - /locus_tag="JK1GL000038" - /product="MULTISPECIES: acyl carrier protein" - /protein_id="ncbi_JK1GL000038" - /sec_met_domain="PP-binding (E-value: 3.6e-06, bitscore: - 26.1, seeds: 164, tool: rule-based-clusters)" - /transl_table=11 - /translation="MASKSFTLDDLKRTLREAAGVAEGVDLDGDILDTEFEVIGYESLA - LLEAGSLIEREYGISLDEEAVGEANTPRSFIEVVNAQLAPAKAA" - aSDomain complement(33706..33918) - /aSDomain="ACP" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_JK1GL000038_ACP.1" - /evalue="9.10E-13" - /label="JK1GL000038_ACP.1" - /locus_tag="JK1GL000038" - /protein_end="83" - /protein_start="12" - /score="40.2" - /tool="antismash" - /translation="RTLREAAGVAEGVDLDGDILDTEFEVIGYESLALLEAGSLIEREY - GISLDEEAVGEANTPRSFIEVVNAQL" - mRNA complement(34023..35234) - /locus_tag="JK1GL000039" - /note="MULTISPECIES: ketosynthase chain-length factor" - gene complement(34023..35234) - /locus_tag="JK1GL000039" - CDS 
complement(34023..35234) - /EC_number="2.3.1.-" - /EC_number="2.3.1.260" - /EC_number="2.3.1.235" - /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (48-401). E-value: - 9.4e-31. Score: 98.9. Matches aSDomain: - nrpspksdomains_JK1GL000039_PKS_KS.1" - /NRPS_PKS="type: PKS/NRPS-like protein" - /codon_start=1 - /db_xref="COG:COG0304 3-oxoacyl-(acyl-carrier-protein) - synthase" - /db_xref="UniProtKB/Swiss-Prot:Q02062 Actinorhodin - polyketide putative beta-ketoacyl synthase 2" - /db_xref="UniProtKB/TrEMBL:A0A399CKN5" - /gene_functions="biosynthetic (rule-based-clusters) T2PKS: - t2clf" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1093:Beta-ketoacyl synthase (Score: 672.2; E-value: - 3.4e-204)" - /gene_functions="biosynthetic-additional (t2pks) CLF 8|9 - (Score: 704.2; E-value: 9.9e-215)" - /gene_kind="biosynthetic" - /locus_tag="JK1GL000039" - /note="GO_function: GO:0003824 - catalytic activity" - /product="MULTISPECIES: ketosynthase chain-length factor" - /protein_id="ncbi_JK1GL000039" - /sec_met_domain="t2clf (E-value: 4.4e-207, bitscore: 686.3, - seeds: 26, tool: rule-based-clusters)" - /transl_table=11 - /translation="MTASVVVTGLGVVSPNGMGVKDYWAATLGGKHGIGRITRFDPTGY - PARLAGQIEDFDAEELLPSRLLPQTDRVTRLALVAADWALADAGADPAHLPEFDMGVIT - ASAAGGFEFGQGELQALWSQGSQYVSAYQSFAWFYAVNSGQISIRNGMKGPSGVVVSEG - AGGLDAVAQARRQIRRGTPLIVTGGVDASICPWGWVAQLACGRLTTSDEPDHAYLPFDR - DANGYVPGEGGAILIAEDADAARARGVRPYGEIAGYGATIDPRPGSGREPNLAKAIETA - LADADVNAADIDVVFADGAGDPAGDLAEARAVSTVFGDRGVPVTVPKTMTGRLYSGGAP - LDLAAAFLALRDGVIPPTVHIDPCADYPLDLVLGEPRPAELRTALVLARGAGGFNSAMV - VRAA" - aSDomain complement(34032..35090) - /aSDomain="PKS_KS" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_JK1GL000039_PKS_KS.1" - /domain_subtype="Iterative-KS" - /evalue="9.40E-31" - /label="JK1GL000039_PKS_KS.1" - /locus_tag="JK1GL000039" - /protein_end="401" - /protein_start="48" - /score="98.9" - /tool="antismash" - 
/translation="LAGQIEDFDAEELLPSRLLPQTDRVTRLALVAADWALADAGADPA - HLPEFDMGVITASAAGGFEFGQGELQALWSQGSQYVSAYQSFAWFYAVNSGQISIRNGM - KGPSGVVVSEGAGGLDAVAQARRQIRRGTPLIVTGGVDASICPWGWVAQLACGRLTTSD - EPDHAYLPFDRDANGYVPGEGGAILIAEDADAARARGVRPYGEIAGYGATIDPRPGSGR - EPNLAKAIETALADADVNAADIDVVFADGAGDPAGDLAEARAVSTVFGDRGVPVTVPKT - MTGRLYSGGAPLDLAAAFLALRDGVIPPTVHIDPCADYPLDLVLGEPRPAELRTALVLA - RGAGGFNSAMVVR" - CDS_motif complement(34539..34577) - /aSTool="nrps_pks_domains" - /database="abmotifs" - /detection="hmmscan" - /domain_id="nrpspksmotif_JK1GL000039_0002" - /evalue="1.20E-04" - /label="PKSI-KS_m4" - /locus_tag="JK1GL000039" - /protein_end="232" - /protein_start="219" - /score="15.0" - /tool="antismash" - /translation="FDRDANGYVPGEG" - CDS_motif complement(34746..34769) - /aSTool="nrps_pks_domains" - /database="abmotifs" - /detection="hmmscan" - /domain_id="nrpspksmotif_JK1GL000039_0001" - /evalue="9.90E+01" - /label="PKSI-KS_m4" - /locus_tag="JK1GL000039" - /protein_end="163" - /protein_start="155" - /score="-2.9" - /tool="antismash" - /translation="SGVVVSEG" - mRNA complement(35231..36484) - /locus_tag="JK1GL000040" - /note="beta-ketoacyl-acyl-carrier-protein synthase family - protein" - gene complement(35231..36484) - /locus_tag="JK1GL000040" - CDS complement(35231..36484) - /EC_number="2.3.1.-" - /EC_number="2.3.1.260" - /EC_number="2.3.1.235" - /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (1-389). E-value: - 9.4e-53. Score: 171.4. 
Matches aSDomain: - nrpspksdomains_JK1GL000040_PKS_KS.1" - /NRPS_PKS="type: PKS/NRPS-like protein" - /codon_start=1 - /db_xref="COG:COG0304 3-oxoacyl-(acyl-carrier-protein) - synthase" - /db_xref="UniProtKB/Swiss-Prot:P41175 Putative polyketide - beta-ketoacyl synthase 1" - /db_xref="UniProtKB/TrEMBL:A0A454W1H2" - /gene_functions="biosynthetic (rule-based-clusters) T2PKS: - t2ks" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1022:Beta-ketoacyl synthase (Score: 482.3; E-value: - 2.3e-146)" - /gene_functions="biosynthetic-additional (t2pks) KS (Score: - 773.1; E-value: 1.4e-235)" - /gene_kind="biosynthetic" - /locus_tag="JK1GL000040" - /note="GO_function: GO:0003824 - catalytic activity" - /product="beta-ketoacyl-acyl-carrier-protein synthase - family protein" - /protein_id="ncbi_JK1GL000040" - /sec_met_domain="t2ks (E-value: 7.1e-244, bitscore: 808.0, - seeds: 25, tool: rule-based-clusters)" - /transl_table=11 - /translation="MITGIEVIAPGGVGRENFWNLLSNGRTATRGITFFDPAPFRSRVA - AEADFDPYEHGLTPQEVRRLDRAAQFAVVASRGAVADSGLDIPSLDPHRVGVTVGSAVG - ATMGLDQEYRVVSDGGRLDTVDHTYAVPHLYDYMVPSSFAAEVAWAVGAEGPSTVVSTG - CTSGIDSVGYAVELVREGSADVVIAGSSDAPISPITMACFDAIKATTPRHDEPECASRP - FDKTRNGFVLGEGTAFFVLEELDSARKRGAHIYAEIAGYATRSNAYHMTGLRPDGVEMA - EAIDLALGEARLNPQSIDYINAHGSGTKQNDRHETAAFKRSLGDHAYRTPVSSIKSMVG - HSLGAIGSIEIAASALAMEYDVVPPTANLHTPDPECDLDYVPLVARDQLIDAVLTVGSG - FGGFQSAMVLATPERSLV" - aSDomain complement(35318..36481) - /aSDomain="PKS_KS" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_JK1GL000040_PKS_KS.1" - /domain_subtype="Iterative-KS" - /evalue="9.40E-53" - /label="JK1GL000040_PKS_KS.1" - /locus_tag="JK1GL000040" - /protein_end="389" - /protein_start="1" - /score="171.4" - /tool="antismash" - /translation="ITGIEVIAPGGVGRENFWNLLSNGRTATRGITFFDPAPFRSRVAA - EADFDPYEHGLTPQEVRRLDRAAQFAVVASRGAVADSGLDIPSLDPHRVGVTVGSAVGA - TMGLDQEYRVVSDGGRLDTVDHTYAVPHLYDYMVPSSFAAEVAWAVGAEGPSTVVSTGC - 
TSGIDSVGYAVELVREGSADVVIAGSSDAPISPITMACFDAIKATTPRHDEPECASRPF - DKTRNGFVLGEGTAFFVLEELDSARKRGAHIYAEIAGYATRSNAYHMTGLRPDGVEMAE - AIDLALGEARLNPQSIDYINAHGSGTKQNDRHETAAFKRSLGDHAYRTPVSSIKSMVGH - SLGAIGSIEIAASALAMEYDVVPPTANLHTPDPECDLDYVPLVARDQL" - mRNA complement(36499..36828) - /locus_tag="JK1GL000042" - /note="MULTISPECIES: TcmI family type II polyketide - cyclase" - gene complement(36499..36828) - /locus_tag="JK1GL000042" - CDS complement(36499..36828) - /codon_start=1 - /db_xref="UniProtKB/Swiss-Prot:P23159 hypothetical protein" - /db_xref="UniProtKB/TrEMBL:A0A399CJD3" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1225:Polyketide synthesis cyclase (Score: 161; - E-value: 1.3e-49)" - /gene_functions="biosynthetic-additional (t2pks) CYC - C4-C17/C2-C19 (Score: 199.8; E-value: 9.5e-62)" - /gene_kind="biosynthetic-additional" - /locus_tag="JK1GL000042" - /note="GO_process: GO:0030639 - polyketide biosynthetic - process" - /product="MULTISPECIES: TcmI family type II polyketide - cyclase" - /protein_id="ncbi_JK1GL000042" - /transl_table=11 - /translation="MHSTLIVARMAATSSNDVAQLFADFDATEMPHRMGTRRRQLFSYR - GLYFHLQDFDEDNGGELIEAAKADPRFVRISEDLKPFIEAYDPTTWRSPADAMATRFYS - WEASR" - mRNA complement(37086..37784) - /locus_tag="JK1GL000041" - /note="hypothetical protein" - gene complement(37086..37784) - /locus_tag="JK1GL000041" - CDS complement(37086..37784) - /codon_start=1 - /db_xref="COG:COG2329 Heme-degrading monooxygenase HmoA and - related ABM domain proteins" - /db_xref="UniProtKB/TrEMBL:A0A454W1H6" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000041" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000041" - /transl_table=11 - /translation="MPIISAEDKHLTVLNLFTTDTPEKQAKLIEEMTKIVNAAAYEGWM - SSTVHSGVDGYGTLNFIQWRSGEDLEKRYAGEEFKHRTLPVFGEITTSIRLMQNEVAHT - LTSDALGGKIEIGPDRDDYTVFTLFPVTPEGQDEAVDALGPGQAFLADVPGFRAHVVLK - GLRARGLEGSFVISYSQWDSKEAFEVYRDQAPEEQADARKAAVARVRAVVTGEPYLNTY - RVVHTRSAGE" - mRNA complement(37841..39313) - /locus_tag="JK1GL000043" 
- /note="MULTISPECIES: monooxygenase" - gene complement(37841..39313) - /locus_tag="JK1GL000043" - CDS complement(37841..39313) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A454W1G7" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1050:monooxygenase FAD-binding (Score: 529.6; E-value: - 1.4e-160)" - /gene_functions="biosynthetic-additional (t2pks) OXY - (Score: 512.5; E-value: 2.7e-156)" - /gene_kind="biosynthetic-additional" - /locus_tag="JK1GL000043" - /note="GO_function: GO:0071949 - FAD binding" - /product="MULTISPECIES: monooxygenase" - /protein_id="ncbi_JK1GL000043" - /transl_table=11 - /translation="MEFYDSDVIVVGAGPTGLMLAGELRLAGVSVVVLDKLSEPIQESR - ALGFSARTIEEFAQRGLMDRFGEVGVIPVGHFGGVPLDYRVIEGGSYGARGIPQARTEG - VLGGWARELGADIRRGCEVTGIEQTDASVTVTAAGADGPFSLRARHVVGCDGARSIVRK - LAGIGFPGTEPAIELRFADLAGVALRPRFSGERVAGGMVMVIPMGPDRCRVIYFDSSEP - LRTSPDPITFDEVAQTWQRLTGEDVSGATPLWVSSTTDVSRQADRYRHGRVFLAGDAAH - IHLPIGAQGMSAGVQDAVNLGWKLALDIKGQAPEGLLDTYHAERHPVGARILTNTLAQR - ILYLGGDEITPMREVLAELMGAHESVQRHLAGMVTGLDIRHDVGEGDHPLLGRRLPDRE - LVVDGEKTPFYALLRTARPVLLELGGDHGLRTAAAGWADRVDLVAAEFDGCEAPVDGIL - VRPDGYVAWVAGLGAGPDGLTAALGRWFGPTA" - mRNA 39480..39962 - /locus_tag="JK1GL000044" - /note="MULTISPECIES: nuclear transport factor 2 family - protein" - gene 39480..39962 - /locus_tag="JK1GL000044" - CDS 39480..39962 - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A399CRN6" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000044" - /product="MULTISPECIES: nuclear transport factor 2 family - protein" - /protein_id="ncbi_JK1GL000044" - /transl_table=11 - /translation="MTSSLTTDQSASVSAAESSAQVAGLLHRYLVSLDDERLDDAWTAG - LFTEDAVVAFPVSRHEGADGMAEYHRSALSAFAATQHLGSPAVVDVDGDRAVFRANLIS - THVHHPRHTPPEGDLPPLFATGTFVNGEARRTARGWRLSLLAFRLLWADGSPPPAR" - mRNA complement(40155..40571) - /locus_tag="JK1GL000045" - /note="MULTISPECIES: pyridoxamine 5'-phosphate oxidase" - gene complement(40155..40571) - /locus_tag="JK1GL000045" - CDS complement(40155..40571) - /codon_start=1 - 
/db_xref="UniProtKB/TrEMBL:A0A454W1F9" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000045" - /note="GO_function: GO:0048037 - cofactor binding" - /product="MULTISPECIES: pyridoxamine 5'-phosphate oxidase" - /protein_id="ncbi_JK1GL000045" - /transl_table=11 - /translation="MPSMPRPDAVTVPDSVQAFLTGTALVAAFTTMRPDGTPHVAPVRF - TWDADAQLARVMTVSSSRKARNLLATPGAPVALCQVDGFRWVTLEGTGTVVTDPERVAL - GARLYAKRYWSAPPTPSDRVVIEIAVDRVLSLNA" - mRNA complement(40814..40960) - /locus_tag="JK1GL000046" - /note="hypothetical protein" - gene complement(40814..40960) - /locus_tag="JK1GL000046" - CDS complement(40814..40960) - /codon_start=1 - /locus_tag="JK1GL000046" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000046" - /transl_table=11 - /translation="MHEGDDERHEGDTARCARAVHGGPPPLRLAGAEEREDEDGRVIVR - SID" - mRNA complement(40995..42485) - /locus_tag="JK1GL000047" - /note="hypothetical protein" - gene complement(40995..42485) - /locus_tag="JK1GL000047" - CDS complement(40995..42485) - /NRPS_PKS="Domain: Condensation_DCL (38-314). E-value: - 1e-48. Score: 157.8. 
Matches aSDomain: - nrpspksdomains_JK1GL000047_Condensation_DCL.1" - /NRPS_PKS="type: NRPS-like protein" - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A454W1I0" - /gene_functions="biosynthetic-additional - (rule-based-clusters) Condensation" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1127:condensation domain-containing protein (Score: - 260.3; E-value: 6.5e-79)" - /gene_kind="biosynthetic-additional" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000047" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000047" - /sec_met_domain="Condensation (E-value: 7.1e-28, bitscore: - 96.2, seeds: 42, tool: rule-based-clusters)" - /transl_table=11 - /translation="MAWHSRPRALRGPGTARPPGVPALWPHLDLLGDFGGRRGAGRHVE - QLVWRWHGPLDTERFAAAWQSVVDRESVLRAALAPGPRPHLVLHEHAHGDVVRHRAGGA - GWDRLLERDRRRGLDPSRPCPLRVTLVERTDDPAGAGPVTRVVLTFHHALLDAWSVCLL - MQELCRAYLAGGELPGGERRPDLRDWAGWLQRQDPAGARDFWRGAVPDGPVAVLPARPG - PRTRQRGRGRTEVRLSPAEAERLHRWAALRAVPDSSALETVWALLLYRAAGPGGAATVG - FGVTVSGRGITLDCAERLPGPLRNCLPMVVRVDPGETVGRLLTALRDRALDMAAYEWVS - TRRIHRWTGRCPDGELLQSVVSVDSLPRPPGNLRNELADAGIALEPEPAHGACPDLPVA - LLVRPGGDGRLTFCVDHDRNRISDADARLLAGHCARLLRHLPGTDEATTNGAVLDVLAG - EALPRIAPRPSRPRPAGSWLRPRSTSFGAAVDRAASHP" - CDS_motif complement(41508..41567) - /aSTool="nrps_pks_domains" - /database="abmotifs" - /detection="hmmscan" - /domain_id="nrpspksmotif_JK1GL000047_0004" - /evalue="3.90E+01" - /label="C2_LCL_024-062" - /locus_tag="JK1GL000047" - /protein_end="326" - /protein_start="306" - /score="-3.2" - /tool="antismash" - /translation="LPMVVRVDPGETVGRLLTAL" - aSDomain complement(41544..42371) - /aSDomain="Condensation" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_JK1GL000047_Condensation_DCL.1" - /domain_subtype="Condensation_DCL" - /evalue="1.00E-48" - /label="JK1GL000047_Condensation_DCL.1" - /locus_tag="JK1GL000047" - /protein_end="314" - /protein_start="38" - /score="157.8" - /tool="antismash" - 
/translation="GAGRHVEQLVWRWHGPLDTERFAAAWQSVVDRESVLRAALAPGPR - PHLVLHEHAHGDVVRHRAGGAGWDRLLERDRRRGLDPSRPCPLRVTLVERTDDPAGAGP - VTRVVLTFHHALLDAWSVCLLMQELCRAYLAGGELPGGERRPDLRDWAGWLQRQDPAGA - RDFWRGAVPDGPVAVLPARPGPRTRQRGRGRTEVRLSPAEAERLHRWAALRAVPDSSAL - ETVWALLLYRAAGPGGAATVGFGVTVSGRGITLDCAERLPGPLRNCLPMVVRVD" - CDS_motif complement(41559..41645) - /aSTool="nrps_pks_domains" - /database="abmotifs" - /detection="hmmscan" - /domain_id="nrpspksmotif_JK1GL000047_0003" - /evalue="6.10E-06" - /label="C5_DCL_263-294" - /locus_tag="JK1GL000047" - /protein_end="309" - /protein_start="280" - /score="18.7" - /tool="antismash" - /translation="GFGVTVSGRGITLDCAERLPGPLRNCLPM" - CDS_motif complement(41973..42038) - /aSTool="nrps_pks_domains" - /database="abmotifs" - /detection="hmmscan" - /domain_id="nrpspksmotif_JK1GL000047_0002" - /evalue="4.90E-08" - /label="C3_DCL_135-156" - /locus_tag="JK1GL000047" - /protein_end="171" - /protein_start="149" - /score="25.5" - /tool="antismash" - /translation="FHHALLDAWSVCLLMQELCRAY" - CDS_motif complement(42255..42356) - /aSTool="nrps_pks_domains" - /database="abmotifs" - /detection="hmmscan" - /domain_id="nrpspksmotif_JK1GL000047_0001" - /evalue="3.80E-10" - /label="C2_DCL_024-062" - /locus_tag="JK1GL000047" - /protein_end="77" - /protein_start="43" - /score="32.1" - /tool="antismash" - /translation="VEQLVWRWHGPLDTERFAAAWQSVVDRESVLRAA" - mRNA complement(42690..43436) - /locus_tag="JK1GL000048" - /note="MULTISPECIES: 4'-phosphopantetheinyl transferase - superfamily protein" - gene complement(42690..43436) - /locus_tag="JK1GL000048" - CDS complement(42690..43436) - /EC_number="2.7.8.-" - /NRPS_PKS="Domain: ACPS (113-174). E-value: 6.1e-12. Score: - 37.3. 
Matches aSDomain: nrpspksdomains_JK1GL000048_ACPS.1" - /NRPS_PKS="type: other" - /codon_start=1 - /db_xref="COG:COG2091 Phosphopantetheinyl transferase" - /db_xref="UniProtKB/TrEMBL:A0A399CJU2" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1012:4'-phosphopantetheinyl transferase (Score: 140.4; - E-value: 8.9e-43)" - /gene_kind="biosynthetic-additional" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000048" - /note="GO_function: GO:0000287 - magnesium ion binding; - GO_function: GO:0008897 - holo-[acyl-carrier-protein] - synthase activity" - /product="MULTISPECIES: 4'-phosphopantetheinyl transferase - superfamily protein" - /protein_id="ncbi_JK1GL000048" - /transl_table=11 - /translation="MREDLFRHGNALVCTTWSEWLPSVLTTPRLRELLGDDWQRYRRTR - DAAVRYRFAASRMLIKYTAAAALAVPPEYLDLAYRLGGRPYLRGFDQIELSLSHTGDVM - AVGLSRIGRIGVDVEPAERPVRLDLLETQVFTPAEARELAELPEGERTAHALRLWTLKE - AYSKALGQGLRFGFKEFGFRQGRLSAPDGSRVTRDEWGFATYPVMDRFLLSVACHNAGL - STAGDTSVGTMLDQGFLSAMTDTGQQ" - aSDomain complement(42915..43097) - /aSDomain="ACPS" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_JK1GL000048_ACPS.1" - /evalue="6.10E-12" - /label="JK1GL000048_ACPS.1" - /locus_tag="JK1GL000048" - /protein_end="174" - /protein_start="113" - /score="37.3" - /tool="antismash" - /translation="IGVDVEPAERPVRLDLLETQVFTPAEARELAELPEGERTAHALRL - WTLKEAYSKALGQGLR" - mRNA complement(43588..45402) - /locus_tag="JK1GL000049" - /note="acyl-CoA dehydrogenase" - gene complement(43588..45402) - /locus_tag="JK1GL000049" - CDS complement(43588..45402) - /codon_start=1 - /db_xref="COG:COG1960 Acyl-CoA dehydrogenase related to the - alkylation response protein AidB" - /db_xref="UniProtKB/TrEMBL:A0A3R9SSA2" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1006:acyl-CoA dehydrogenase (Score: 155.1; E-value: - 4.6e-47)" - /gene_kind="biosynthetic-additional" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000049" - 
/note="GO_function: GO:0016627 - oxidoreductase activity, - acting on the CH-CH group of donors; GO_function: - GO:0050660 - flavin adenine dinucleotide binding; - GO_process: GO:0055114 - oxidation-reduction process" - /product="acyl-CoA dehydrogenase" - /protein_id="ncbi_JK1GL000049" - /transl_table=11 - /translation="MTAALDTAAGPTGQAPDPRSTTPTPAPEHTTPESQHITRAPEPER - AARLEAALGDPFDPVNPHGHLALVRADDTREAPHATEALLTEHGLSAEFVPHDLGGRLR - DLEELARVLRPLFRRDLALGYGFGITSLFAASSVWTAGDTHQRAALADVLLGGGRVAIV - HREVAHANAILRREVRAQRPAGGGFLLNGSKDAVMNADRTDTFVVYARTSAGSGSASHS - VLLLPGPPASGEVRRLARVEMPGMRGARFHGLRLADVRLPDSALVGSLGEGVTLALRSF - QISHCLIPGTVLAGVDSVLRLAVRAATENRPDGRPARRWHKALSGVFADLLACDAMAVT - GLRALSLVPQHAHLLAAAVKYTMPDLLREDLEELAAVLGARGYDRGPLYGGFQKLARDL - PVAGLGHSGTAVCQAVLVPQLPALARTAWFRTAEPSAALFLPGAPLPPLDHRRLTHSGT - DDPLTATLIGAAERLAARTGTQPLHAALAALARALVEELRVLRARCAALPAAGSTVFDP - LACALADRYALLLCAAACLGVWEGQADGDGFLADPAWAVLVLSRIGRRLGIAVPETPAD - AEQAVLAEALGRCRHGRSLDLYDTPLAG" - mRNA complement(45399..46259) - /locus_tag="JK1GL000050" - /note="MULTISPECIES: cyclase" - gene complement(45399..46259) - /locus_tag="JK1GL000050" - CDS complement(45399..46259) - /EC_number="4.2.1.-" - /NRPS_PKS="Domain: Polyketide_cyc2 (2-127). E-value: - 2.5e-11. Score: 36.0. Matches aSDomain: - nrpspksdomains_JK1GL000050_Polyketide_cyc2.1" - /NRPS_PKS="Domain: Polyketide_cyc2 (138-245). E-value: - 1e-07. Score: 24.3. 
Matches aSDomain: - nrpspksdomains_JK1GL000050_Polyketide_cyc2.2" - /NRPS_PKS="type: other" - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A399CG55" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1128:cyclase/dehydrase (Score: 266.8; E-value: - 4.2e-81)" - /gene_functions="biosynthetic-additional (t2pks) CYC C7-C12 - (Score: 256.3; E-value: 6.9e-79)" - /gene_kind="biosynthetic-additional" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000050" - /product="MULTISPECIES: cyclase" - /protein_id="ncbi_JK1GL000050" - /transl_table=11 - /translation="MLYGLIADATVWPLFFPPSVHVEQLDFDGTRERLRMWAVAGDRIS - SWVSHRRLDVGQRRVEFRQERPSAPVETMTGLWTVEPLGDGSRVTLEHAFTVVGDAPAD - AAWTERVTRANSRAQLQRLAWLAERWTRLDDLVMSFEDTVRVNVPAELVFDFLYRAGDW - PDDLAGTRPLTVQEDTPGIQVLALDGRSATGGEAVRISFPAAGRLVHKHTRTSGPLAAY - TGEWTIEPQPGAGLDVTVRHDVLLNDDAALDQDAARRVCDEVGRAGRRLLEHAVRHASD - AVRVL" - aSDomain complement(45525..45845) - /aSDomain="Polyketide_cyc" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_JK1GL000050_Polyketide_cyc2.2" - /domain_subtype="Polyketide_cyc2" - /evalue="1.00E-07" - /label="JK1GL000050_Polyketide_cyc2.2" - /locus_tag="JK1GL000050" - /protein_end="245" - /protein_start="138" - /score="24.3" - /tool="antismash" - /translation="SFEDTVRVNVPAELVFDFLYRAGDWPDDLAGTRPLTVQEDTPGIQ - VLALDGRSATGGEAVRISFPAAGRLVHKHTRTSGPLAAYTGEWTIEPQPGAGLDVTVRH - DVL" - aSModule 45525..46253 - /domains="nrpspksdomains_JK1GL000050_Polyketide_cyc2.1" - /domains="nrpspksdomains_JK1GL000050_Polyketide_cyc2.2" - /incomplete - /locus_tags="JK1GL000050" - /tool="antismash" - /type="unknown" - aSDomain complement(45879..46253) - /aSDomain="Polyketide_cyc" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_JK1GL000050_Polyketide_cyc2.1" - /domain_subtype="Polyketide_cyc2" - /evalue="2.50E-11" - /label="JK1GL000050_Polyketide_cyc2.1" - /locus_tag="JK1GL000050" - 
/protein_end="127" - /protein_start="2" - /score="36.0" - /tool="antismash" - /translation="YGLIADATVWPLFFPPSVHVEQLDFDGTRERLRMWAVAGDRISSW - VSHRRLDVGQRRVEFRQERPSAPVETMTGLWTVEPLGDGSRVTLEHAFTVVGDAPADAA - WTERVTRANSRAQLQRLAWLA" - mRNA 46599..46835 - /locus_tag="JK1GL000051" - /note="hypothetical protein" - gene 46599..46835 - /locus_tag="JK1GL000051" - CDS 46599..46835 - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A454W1G8" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000051" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000051" - /transl_table=11 - /translation="MRRFRPRRCVRGLWEGLVAYGRLCLAGETDRYDHPPRPRVRWHRP - PPGHPERVRDDMPLTDLERRLARELTDEDHDVR" - mRNA complement(47200..48465) - /locus_tag="JK1GL000052" - /note="ketosynthase chain-length factor" - gene complement(47200..48465) - /locus_tag="JK1GL000052" - CDS complement(47200..48465) - /EC_number="2.3.1.-" - /EC_number="2.3.1.260" - /EC_number="2.3.1.235" - /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (85-416). E-value: - 4.3e-25. Score: 80.3. 
Matches aSDomain: - nrpspksdomains_JK1GL000052_PKS_KS.1" - /NRPS_PKS="type: PKS/NRPS-like protein" - /codon_start=1 - /db_xref="COG:COG0304 3-oxoacyl-(acyl-carrier-protein) - synthase" - /db_xref="UniProtKB/Swiss-Prot:Q02062 Actinorhodin - polyketide putative beta-ketoacyl synthase 2" - /db_xref="UniProtKB/TrEMBL:A0A454W1F8" - /gene_functions="biosynthetic (rule-based-clusters) T2PKS: - t2clf" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1093:Beta-ketoacyl synthase (Score: 579.4; E-value: - 5.2e-176)" - /gene_functions="biosynthetic-additional (t2pks) CLF 8|9 - (Score: 582.6; E-value: 8.2e-178)" - /gene_kind="biosynthetic" - /locus_tag="JK1GL000052" - /note="GO_function: GO:0003824 - catalytic activity" - /product="ketosynthase chain-length factor" - /protein_id="ncbi_JK1GL000052" - /sec_met_domain="t2clf (E-value: 5.9e-170, bitscore: 564.0, - seeds: 26, tool: rule-based-clusters)" - /transl_table=11 - /translation="MTKATQAPEPARPAGAQGPRQTLVTGIGVAAPNGLGTRAWWDAVL - CGRTGLGPITRFDASGYPVRIAGEIPGFVDEDHIPSRLLPSTDRGTRIALVAAEEALRD - ANVSPADLPAYGAGVITASSAGGAEFGERGLAALWSKGAQHVSAYQSFASFHAAAPAQI - SIRHRLRGHGSTVVSEQAGGIDALARARRRIRDGACLMVTGGIDSTLCAWGWAAHLADG - RLSPATEPARAYRPFAATADGHAVGEGGALLVLEDARAAARRGATGYGVIAGCAATFDG - PDRPTLRQAAELALADAGLAPEHVDVVFADGAAERRADLVESQALCALFGPYGVPVTVP - KTMTGRLGAGGSALDVAAALLALREKVVPPTTGTGRVADDCPLDLVTGAPRELPRLRVA - LVLARGRGGFNSAAVLRAPQAQ" - aSDomain complement(47218..48210) - /aSDomain="PKS_KS" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_JK1GL000052_PKS_KS.1" - /domain_subtype="Iterative-KS" - /evalue="4.30E-25" - /label="JK1GL000052_PKS_KS.1" - /locus_tag="JK1GL000052" - /protein_end="416" - /protein_start="85" - /score="80.3" - /tool="antismash" - /translation="STDRGTRIALVAAEEALRDANVSPADLPAYGAGVITASSAGGAEF - GERGLAALWSKGAQHVSAYQSFASFHAAAPAQISIRHRLRGHGSTVVSEQAGGIDALAR - ARRRIRDGACLMVTGGIDSTLCAWGWAAHLADGRLSPATEPARAYRPFAATADGHAVGE - 
GGALLVLEDARAAARRGATGYGVIAGCAATFDGPDRPTLRQAAELALADAGLAPEHVDV - VFADGAAERRADLVESQALCALFGPYGVPVTVPKTMTGRLGAGGSALDVAAALLALREK - VVPPTTGTGRVADDCPLDLVTGAPRELPRLRVALVLARGRGGFNSAAVLR" - mRNA complement(48462..49733) - /locus_tag="JK1GL000053" - /note="MULTISPECIES: beta-ketoacyl-acyl-carrier-protein - synthase family protein" - gene complement(48462..49733) - /locus_tag="JK1GL000053" - CDS complement(48462..49733) - /EC_number="2.3.1.-" - /EC_number="2.3.1.260" - /EC_number="2.3.1.235" - /NRPS_PKS="Domain: PKS_KS(Iterative-KS) (3-396). E-value: - 4.8e-49. Score: 159.2. Matches aSDomain: - nrpspksdomains_JK1GL000053_PKS_KS.1" - /NRPS_PKS="type: PKS/NRPS-like protein" - /codon_start=1 - /db_xref="COG:COG0304 3-oxoacyl-(acyl-carrier-protein) - synthase" - /db_xref="UniProtKB/Swiss-Prot:P16538 Tetracenomycin C - polyketide putative beta-ketoacyl synthase 1" - /db_xref="UniProtKB/TrEMBL:A0A399CKM9" - /gene_functions="biosynthetic (rule-based-clusters) T2PKS: - t2ks" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1022:Beta-ketoacyl synthase (Score: 423.8; E-value: - 1.3e-128)" - /gene_functions="biosynthetic-additional (t2pks) KS (Score: - 659.9; E-value: 3.3e-201)" - /gene_kind="biosynthetic" - /locus_tag="JK1GL000053" - /note="GO_function: GO:0003824 - catalytic activity" - /product="MULTISPECIES: beta-ketoacyl-acyl-carrier-protein - synthase family protein" - /protein_id="ncbi_JK1GL000053" - /sec_met_domain="t2ks (E-value: 6.8e-200, bitscore: 663.1, - seeds: 25, tool: rule-based-clusters)" - /transl_table=11 - /translation="MNRVVITGIGVVAPGAVGTAGFWDLLTVGRTATRRVTLFDACGYR - SRVAAEVDFTPAAHGFDLADTERLDRAAQFALVAAREAVADSGVADRIGRNPLRTGVSL - GSAIGCTTSLATQYAILSDCGTTWTLDHTEAAESLYDYFVPSSLAATVARDRGAQGPVA - LVSSGCTSGLDAVGHGADLIREGSADIVVAGGTEAPIVPIAMACFDRLRLTSSRNDDPA - TASRPFDRTRDGFVLGEGAAVLVLEELEHARRRGARPYAELSAVTAHSSAHHMTGLRPG - ALEMADAIRAALDQARLNPADVDYISAHGAGTRHNDRHETHALKESLGGSAHRVPVSSI - KSMIGHALGAAGALDLAASALAIRHDTVPPTANLHEPDPTCDLDYTPLFAREQRTSTVL - TVASGFGGFHTAAVLTRPQLKEAA" - 
aSDomain complement(48546..49724) - /aSDomain="PKS_KS" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_JK1GL000053_PKS_KS.1" - /domain_subtype="Iterative-KS" - /evalue="4.80E-49" - /label="JK1GL000053_PKS_KS.1" - /locus_tag="JK1GL000053" - /protein_end="396" - /protein_start="3" - /score="159.2" - /tool="antismash" - /translation="VVITGIGVVAPGAVGTAGFWDLLTVGRTATRRVTLFDACGYRSRV - AAEVDFTPAAHGFDLADTERLDRAAQFALVAAREAVADSGVADRIGRNPLRTGVSLGSA - IGCTTSLATQYAILSDCGTTWTLDHTEAAESLYDYFVPSSLAATVARDRGAQGPVALVS - SGCTSGLDAVGHGADLIREGSADIVVAGGTEAPIVPIAMACFDRLRLTSSRNDDPATAS - RPFDRTRDGFVLGEGAAVLVLEELEHARRRGARPYAELSAVTAHSSAHHMTGLRPGALE - MADAIRAALDQARLNPADVDYISAHGAGTRHNDRHETHALKESLGGSAHRVPVSSIKSM - IGHALGAAGALDLAASALAIRHDTVPPTANLHEPDPTCDLDYTPLFAREQRTS" - mRNA complement(49730..50509) - /locus_tag="JK1GL000055" - /note="MULTISPECIES: thioesterase" - gene complement(49730..50509) - /locus_tag="JK1GL000055" - CDS complement(49730..50509) - /NRPS_PKS="Domain: Thioesterase (15-242). E-value: 9.4e-38. - Score: 122.7. 
Matches aSDomain: - nrpspksdomains_JK1GL000055_Thioesterase.1" - /NRPS_PKS="type: other" - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A399CHI6" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1004:thioesterase (Score: 181.7; E-value: 2.1e-55)" - /gene_kind="biosynthetic-additional" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000055" - /note="GO_function: GO:0016788 - hydrolase activity, acting - on ester bonds; GO_process: GO:0009058 - biosynthetic - process" - /product="MULTISPECIES: thioesterase" - /protein_id="ncbi_JK1GL000055" - /transl_table=11 - /translation="MASRSRDREAGTARITLTCLAHAGAGVASYRGWSAAVGPGIDVAA - LPLPGRDSRRREPRLTERAGLLADFLPTLLQTARRGPYALYGHSMGALVGYTLTRALAD - SGLPPLFLAVGACPPPHTTTVLADAADLPDEDLLPLLDEIGSLPPGASASPGGLWRRTF - LPVLRDDLRLARSLRNAALDPVTGGPLDVPVLVFAGRDDPLAAPAALRHWQQWTTNLIE - LHTVAGGHFFASSSSLAQHVGRACRGHVTALPTGGGR" - aSDomain complement(49784..50464) - /aSDomain="Thioesterase" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_JK1GL000055_Thioesterase.1" - /evalue="9.40E-38" - /label="JK1GL000055_Thioesterase.1" - /locus_tag="JK1GL000055" - /protein_end="242" - /protein_start="15" - /score="122.7" - /tool="antismash" - /translation="TLTCLAHAGAGVASYRGWSAAVGPGIDVAALPLPGRDSRRREPRL - TERAGLLADFLPTLLQTARRGPYALYGHSMGALVGYTLTRALADSGLPPLFLAVGACPP - PHTTTVLADAADLPDEDLLPLLDEIGSLPPGASASPGGLWRRTFLPVLRDDLRLARSLR - NAALDPVTGGPLDVPVLVFAGRDDPLAAPAALRHWQQWTTNLIELHTVAGGHFFASSSS - LAQHV" - CDS_motif complement(50204..50272) - /aSTool="nrps_pks_domains" - /database="abmotifs" - /detection="hmmscan" - /domain_id="nrpspksmotif_JK1GL000055_0001" - /evalue="3.80E-07" - /label="NRPS-te1" - /locus_tag="JK1GL000055" - /protein_end="102" - /protein_start="79" - /score="22.6" - /tool="antismash" - /translation="RGPYALYGHSMGALVGYTLTRAL" - mRNA complement(50767..51588) - /locus_tag="JK1GL000054" - /note="MULTISPECIES: AfsR/SARP family transcriptional - regulator" - gene 
complement(50767..51588) - /locus_tag="JK1GL000054" - CDS complement(50767..51588) - /codon_start=1 - /db_xref="COG:COG3629 DNA-binding transcriptional activator - of the SARP family" - /db_xref="UniProtKB/Swiss-Prot:P25047 Regulatory protein - DnrI" - /db_xref="UniProtKB/TrEMBL:A0A399CRP3" - /gene_functions="regulatory (smcogs) - SMCOG1041:transcriptional regulator, SARP family (Score: - 327.7; E-value: 3e-99)" - /gene_kind="regulatory" - /locus_tag="JK1GL000054" - /note="GO_function: GO:0003677 - DNA binding; GO_function: - GO:0005515 - protein binding; GO_process: GO:0000160 - - phosphorelay signal transduction system; GO_process: - GO:0006355 - regulation of transcription, DNA-templated" - /product="MULTISPECIES: AfsR/SARP family transcriptional - regulator" - /protein_id="ncbi_JK1GL000054" - /transl_table=11 - /translation="MEIKVLGALNAEFEGISVVPSAGKPRQILALLALYPGRVVPVPTL - MEEIWGTDLPQSSMTTLQTYILQLRRLLGTAMGPDVPGSAKDVLATRYGGYLLQIPAEA - VDAFTYERLVTEGRQAYEDGEDERAATVLRRALDLWDGPALVDVRVGPVLEIEAMRLEQ - SRLVARERRIDADLRLGRHVELIAELTDLIARHPQHEGLHSQAMVALYRSGRQAAALDV - YRRLRQRLIDELGVEPSPQLQRLHQAMLAVDPRLDIVAGPRRTSTFDLYAA" - mRNA 52329..53318 - /locus_tag="JK1GL000056" - /note="AfsR/SARP family transcriptional regulator" - gene 52329..53318 - /locus_tag="JK1GL000056" - CDS 52329..53318 - /codon_start=1 - /db_xref="COG:COG3629 DNA-binding transcriptional activator - of the SARP family" - /db_xref="UniProtKB/Swiss-Prot:P16922 Transcriptional - regulator RedD" - /db_xref="UniProtKB/TrEMBL:A0A454W7A1" - /gene_functions="regulatory (smcogs) - SMCOG1041:transcriptional regulator, SARP family (Score: - 320; E-value: 6.6e-97)" - /gene_kind="regulatory" - /locus_tag="JK1GL000056" - /note="GO_function: GO:0003677 - DNA binding; GO_function: - GO:0005515 - protein binding; GO_process: GO:0000160 - - phosphorelay signal transduction system; GO_process: - GO:0006355 - regulation of transcription, DNA-templated" - /product="AfsR/SARP family transcriptional regulator" - 
/protein_id="ncbi_JK1GL000056" - /transl_table=11 - /translation="MIRAGGCGIGCFPGKGEMEFRILGSVQIHDERFGVRVVPAGAKQR - ALLGALLVRAGQAVPAECLVEELWGGQPPVNAANALQAHVARLRRLLPAPGPGGPRHVW - LRTSPLGYTLSLGPAVTDAQRFHRLVGQGRELAATAPGRAVEVLREGLALWRGPALQGS - GQGPICSAEAALLEESRLRALEVLYDVCLRADRCAEITGELEELVAVHPLRERFHEQLM - TALHRCGRRAEALSTYDRARRRLARDLGIGPGQVLSRRREAILRSCEPAADSADRAGAG - TAGQGGDELGVLREELVRLRGHVELLRRQQRELSEQVARLTAHHPCGP" - CDS complement(53334..54149) - /codon_start=1 - /db_xref="COG:COG3629 DNA-binding transcriptional activator - of the SARP family" - /db_xref="UniProtKB/Swiss-Prot:P25047 Regulatory protein - DnrI" - /db_xref="UniProtKB/TrEMBL:A0A399CPF0" - /gene_functions="regulatory (smcogs) - SMCOG1041:transcriptional regulator, SARP family (Score: - 316.1; E-value: 9.8e-96)" - /gene_kind="regulatory" - /locus_tag="JK1GL000057" - /note="GO_function: GO:0003677 - DNA binding; GO_function: - GO:0005515 - protein binding; GO_process: GO:0000160 - - phosphorelay signal transduction system; GO_process: - GO:0006355 - regulation of transcription, DNA-templated" - /product="MULTISPECIES: AfsR/SARP family transcriptional - regulator" - /protein_id="ncbi_JK1GL000057" - /transl_table=11 - /translation="MDIEVLGALSVREHGVSVVPTAPKPRQVLALLALNADQVVPVAAL - VDELWGENPPRSARTTLQTYVLQLRELMAQALAHGPDERCTAKDILATVPGGYRLQTRG - GHVDYREFDQRAGLGYRAMDAEDYAGAARRLADALALWNGQALTDIQAGLRIDTEVKRL - EEARLCALDQRIEADLRLGRHRELLSELTVLVNQYRMHESLHGQFMLALHRSGRRGEAL - NVYQRLRSTLVHELGLEPSAALSRLQRSILMARPETPAAAGGSGRLVTR" - protocluster 53334..62701 - /aStool="rule-based-clusters" - /category="other" - /contig_edge="False" - /core_location="[70693:71686](+)" - /cutoff="20000" - /detection_rule="AfsA" - /neighbourhood="5000" - /product="butyrolactone" - /protocluster_number="2" - /tool="antismash" - proto_core 57418..58410 - /aStool="rule-based-clusters" - /tool="antismash" - /cutoff="20000" - /detection_rule="AfsA" - /neighbourhood="5000" - /product="butyrolactone" - /protocluster_number="2" - cand_cluster 53334..62701 - 
/candidate_cluster_number="2" - /contig_edge="False" - /detection_rules="AfsA" - /kind="single" - /product="butyrolactone" - /protoclusters="2" - /tool="antismash" - mRNA complement(53334..54149) - /locus_tag="JK1GL000057" - /note="MULTISPECIES: AfsR/SARP family transcriptional - regulator" - gene complement(53334..54149) - /locus_tag="JK1GL000057" - mRNA complement(54551..55162) - /locus_tag="JK1GL000058" - /note="helix-turn-helix transcriptional regulator" - gene complement(54551..55162) - /locus_tag="JK1GL000058" - CDS complement(54551..55162) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A454W7A3" - /gene_functions="regulatory (smcogs) SMCOG1057:TetR family - transcriptional regulator (Score: 65.9; E-value: 1.1e-19)" - /gene_kind="regulatory" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000058" - /note="GO_function: GO:0003677 - DNA binding" - /product="helix-turn-helix transcriptional regulator" - /protein_id="ncbi_JK1GL000058" - /transl_table=11 - /translation="MRTREALIRSAAEIFHDEGFHAAALTTISSRAGVSNGALHFHFAS - KAALADAVEEAAADVLRAVCGRWDGGPPGVLQCLVNATHELACALQNDVVLRAGFELSR - EAGRQPRTDLRLCWQNWVTDMVGRAGRGGELRESVAPESAVAAVVAATSGFEVLGMRNQ - AWLSRSTVAQFWLLLLPALAPAPHAGLWQAEGSWTGTATG" - mRNA complement(55195..56883) - /locus_tag="JK1GL000059" - /note="propionyl-CoA carboxylase beta chain" - gene complement(55195..56883) - /locus_tag="JK1GL000059" - CDS complement(55195..56883) - /EC_number="6.4.1.3" - /EC_number="2.1.3.15" - /codon_start=1 - /db_xref="COG:COG4799 Acetyl-CoA carboxylase, - carboxyltransferase component" - /db_xref="UniProtKB/Swiss-Prot:I3R7F1 Propionyl-CoA - carboxylase, carboxyltransferase subunit" - /db_xref="UniProtKB/TrEMBL:A0A2W6PRG9" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1059:acetyl-CoA carboxylase, carboxyl transferase, - (Score: 732.8; E-value: 3.8e-222)" - /gene_kind="biosynthetic-additional" - /locus_tag="JK1GL000059" - /note="GO_function: GO:0016874 - ligase activity" - /product="propionyl-CoA carboxylase 
beta chain" - /protein_id="ncbi_JK1GL000059" - /transl_table=11 - /translation="MRAELPEPKPHRWFVTVKRRPGRAMREGQIVTILNDIPRVALPAE - PADARGRVAELHGVRAQALAGPSEKATAAQHAKGKLTARERIELLLDAGSFREVEQLRR - HRATGFGLEARKPYTDGVITGWGTVEGRTVFVYAHDFRIFGGALGEAHATKIHKIMDMA - IAAGAPLVSLNDGAGARIQEGVSALAGYGGIFQRNTRASGVIPQISVMLGPCAGGAAYS - PALTDFVFMVRDTSQMFITGPDVVKAVTGEEITQNGLGGADVHAETSGVAHFAYDDEET - CLAEVRYLLSMLPQNNREFPPCTPCSDPQSRRSEALLDLVPADGNRPYDMARVIEEIVD - DGEYLEVHEGWARNIICALARLNGQVVGIVANQPQALAGVLDIEASEKAARFVQMCDAF - NIPLVTFLDVPGFLPGVDQEHGGIIRHGAKLLYAYCNATVPRISLILRKAYGGAYIVMD - SQSIGADLTYAWPTNEIAVMGAEGAANVIFRRQIAEAEDPDAVRARMVKEYRAELMHPY - YAAERGLVDDVIDPAETREVLIESLAMLRTKDADVPSRKHGNPPQ" - mRNA complement(56915..57121) - /locus_tag="JK1GL000060" - /note="MULTISPECIES: acyl-CoA carboxylase subunit epsilon" - gene complement(56915..57121) - /locus_tag="JK1GL000060" - CDS complement(56915..57121) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A454W782" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000060" - /product="MULTISPECIES: acyl-CoA carboxylase subunit - epsilon" - /protein_id="ncbi_JK1GL000060" - /transl_table=11 - /translation="MAEPERAVPAVRIERGRAGAEELAALTAVLYALTARRDEGPGGRE - RSGAAPWRPGHRAGAYRSPYCWR" - mRNA 57418..58410 - /locus_tag="JK1GL000061" - /note="2-oxo-3-(phosphooxy)propyl 3-oxoalkanoate synthase" - gene 57418..58410 - /locus_tag="JK1GL000061" - CDS 57418..58410 - /EC_number="2.3.1.277" - /codon_start=1 - /db_xref="UniProtKB/Swiss-Prot:P18394 putative A-factor - biosynthesis enzyme" - /db_xref="UniProtKB/TrEMBL:A0A454W7E0" - /gene_functions="biosynthetic (rule-based-clusters) - butyrolactone: AfsA" - /gene_kind="biosynthetic" - /locus_tag="JK1GL000061" - /product="2-oxo-3-(phosphooxy)propyl 3-oxoalkanoate - synthase" - /protein_id="ncbi_JK1GL000061" - /sec_met_domain="AfsA (E-value: 3.3e-24, bitscore: 83.5, - seeds: 34, tool: rule-based-clusters)" - /transl_table=11 - /translation="MATSAFPATHPALGQEPVLPAGTPRLRPSLFRYPNLTTTVPKELV - 
HRAAVAEVMLTDWERVDDTRFKVAAQWPRGHSFFTPIDGRYHDPLIAAETIRQVGSLLG - HAEFGVPFGHHYLLHDLSLRVDPHHLMIHQAPASLDLDVTCEDLKMRGGRLAALRYEAV - VRRDGHTAATGVFSFSCVSPTVYRRLRPPHVFADGHRPLPLTAPAAPQSVGRMSPADVV - LSPTEDPHRWQLRLDTQHPVLFDHPGDHVPGMVLLEAARQAAAGALGRTSLLPLGLTSE - LVQYAELDIPCIIEAAPHPTHSPGLTTVHITGHQRGQTVFTCTVTAADA" - mRNA complement(58433..59041) - /locus_tag="JK1GL000062" - /note="NAD(P)H-binding protein" - gene complement(58433..59041) - /locus_tag="JK1GL000062" - CDS complement(58433..59041) - /EC_number="1.3.1.113" - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A454W7B3" - /gene_functions="other (smcogs) SMCOG1199:NmrA family - protein (Score: 192.5; E-value: 1.8e-58)" - /gene_kind="other" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000062" - /product="NAD(P)H-binding protein" - /protein_id="ncbi_JK1GL000062" - /transl_table=11 - /translation="MRAAADAGVEHVVKLSAAAVEDAGADDLITRWQRESEELLRSSGL - AWTLLRPRSFMSNSLGWAAEVRAEGVVRELFGASLNACVDPGDVAEVAVRALTGPGHAG - RAYVLTGPEAVSAVQRTARLSCVLGRPLRFEELGWEEARARWGRRYPPAVVEALLRSAV - RQREGAKAGVDGTFARLVGRPARSFGQWAADHVAGFSGR" - mRNA 59436..60077 - /locus_tag="JK1GL000063" - /note="TetR/AcrR family transcriptional regulator" - gene 59436..60077 - /locus_tag="JK1GL000063" - CDS 59436..60077 - /codon_start=1 - /db_xref="COG:COG1309 DNA-binding transcriptional - regulator, AcrR family" - /db_xref="UniProtKB/TrEMBL:A0A454W784" - /gene_functions="regulatory (smcogs) SMCOG1057:TetR family - transcriptional regulator (Score: 89.2; E-value: 7.5e-27)" - /gene_kind="regulatory" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000063" - /note="GO_function: GO:0003677 - DNA binding" - /product="TetR/AcrR family transcriptional regulator" - /protein_id="ncbi_JK1GL000063" - /transl_table=11 - /translation="MPAQERAIRTRQNIMLAAATVFNERGYKAATIADILTTAGVTKGA - LYFHFPSKDDLAQEVLATQNRNLTIPERPSKTQELIDVVMLHTHRLQTDPMVRAAVRLT - MDQLSTEFDRTGPFRQWADLTRQRLEQARDQGELLPHVNPTETADVLVGAYAGIQSMSH - ALTDYTDLTTRANALLRHLLPTITLPSILTSLDLNENRGAHVYTEIHTTT" - 
mRNA complement(61157..62014) - /locus_tag="JK1GL000064" - /note="hypothetical protein" - gene complement(61157..62014) - /locus_tag="JK1GL000064" - CDS complement(61157..62014) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A454WJI8" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000064" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000064" - /transl_table=11 - /translation="MKAGAIVVAAVTGSVVLSGCGDGDGSQAKRDGVSPSASSSAGTQE - QGTVEVRAAYDKTAEAESARMTIKMKLAAEGKTITSDGKGVLDLAEGDSVMTLTVQDKT - IEQRVVDQVLYQKIPGEKALGGKPWIKIDLEKVAAQQGLSNQQIGDPAQTAAYARAITN - KDVTKAGTEEIDGANTTQYKVSVDVSKLPGGEQLSKQVGPTLPMHVWLDDKGRLRRQQI - EMTLKAPASASAKPEGSASPQQLQMSTVMEFSDFGTEVNAEAPPAGQVADMTDQSLQGS - QQHS" - mRNA 62297..62701 - /locus_tag="JK1GL000065" - /note="hypothetical protein" - gene 62297..62701 - /locus_tag="JK1GL000065" - CDS 62297..62701 - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A2A2DC84" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000065" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000065" - /transl_table=11 - /translation="MNVQVPADPSGRLLWASPALPGAVHDVRAAREHDIVRKLTDAGIT - CWTDKGYRGAGGTVRVPLGPSGDTSRGQKDVNRSHAKKWVLVEQAAATLNAWRLLRNLR - CSTSGVTSLVRSVVTVHLASTDGKGSMTTF" - mRNA complement(63194..66505) - /locus_tag="JK1GL000066" - /note="MULTISPECIES: Wall-associated protein" - gene complement(63194..66505) - /locus_tag="JK1GL000066" - CDS complement(63194..66505) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A429NJW2" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000066" - /product="MULTISPECIES: Wall-associated protein" - /protein_id="ncbi_JK1GL000066" - /transl_table=11 - /translation="MWRDRRTHRTALVSAITAAAVVIAAAPGLAATPKPELPEPESPWT - KPTKVEAPATPAGTVKAPTSEAEAKPSAEVAAWRAAQKARAAGAERAKTSASRSAAVDA - AVAGYVPEGQGEVPWHQILDTRLNDALVARVNVSNGNLMLAATDFDIAGVGQKLQLTRT - YNSLEAPWGKVSQRWWQAYERYLQINDGEVDVFDTTGSLLRFTANADGTYTTPTGYSKD - LKKNADGTYTLTDRKSGTKDTYNEHGTLTKVTDKNKGTITVDQHDEGAEHKGFKLTETR - 
SGRWIDLVKTDASQWQAKDHTGRTAVLDLDAAGNLAKVTDTTGKATAYEYDSSRRLTKV - TTPEGTVTLFTYDSHNRVTSMQRATGTSGSGHTGPTWRYDYTAATPSDAGTTTVTDPDG - DETIYTHNADGEVTKVTDPLGHSRHATYKNHLTQTAIDAMGTGTDGTGGNTTTYGWDDR - NNPVSQKLPMGATASVSAYQTIAGTDLPSDMTGANGRKDSFKYDTNGNTLSVTTSGTAG - TTREYTYNKDTPTCGGFEGQRCTAKDGNGKVTSFTYDDQGNLIKVTPPAPLGETTYTYD - ALGRVETVKDGRGITTVYAYDSRDRVHEVSSTNFTVTYSYDGDGNVKSRTDASGTTKWD - YDKLNRESVRTLQNGAQTALAYTPGGDVDFYTDPTGTTDYTWDKAGRLDYLTAPDGKKT - DFDYNNNDKRTKTVYPGGTTQTVTIDKNGRPQAIKTTSGTQTFVDLTYSYANAGKDTTK - IRTRTDNLTKLKTTYTYDSQDRLSYALEADAAGTRKASWLYCWDKAGNLTSRDGSKNTC - PGGTTYTYNDASELTGKNGSTTGWSYDKLGNETAAADNTPRTDESWTDYSQLSGITAGG - KTYDLVHAGTTNAERTKLGSTWFHHTALGLASTTTNGVDTGFIREPAGTLNSMTTGGKS - YYYLTDATGNVLGLADDTGKRTHTYTYGPTGLPRTTPTEAVPQPYRYAGAYADPTGLYK - MGHRYYDPTLGRFTQPDPSGQETNPYLYAAGDPINNMDPSGLGFLDSVSNFLEDTNDIW - GAVTGCVAGVGAAAETGIIAAASTFGPWGTAGAVVTSCAVGGVLGYNNAEIITYG" - mRNA 67026..67361 - /locus_tag="JK1GL000067" - /note="hypothetical protein" - gene 67026..67361 - /locus_tag="JK1GL000067" - CDS 67026..67361 - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A429NJP0" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000067" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000067" - /transl_table=11 - /translation="MKDAPAMSTPGRHTPCSRSSRHHVPAQRLTRFVQQAGRLLCWSLT - AGMTTAALDLLITPEAAWWHMMWPLPWYLTCLSAPLWATLRAHEKAAHQQAPEEDNDIP - CEWEQAA" - mRNA complement(67729..67908) - /locus_tag="JK1GL000068" - /note="hypothetical protein" - gene complement(67729..67908) - /locus_tag="JK1GL000068" - CDS complement(67729..67908) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A454W205" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000068" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000068" - /transl_table=11 - /translation="MQVAWRAGEMSGVTVVFVAACALWLVLWRRRTGRGCLAWPLVVLL - CGATGVLIMAAMAG" - mRNA complement(67919..68248) - /locus_tag="JK1GL000069" - /note="hypothetical protein" - gene complement(67919..68248) - /locus_tag="JK1GL000069" - CDS 
complement(67919..68248) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A1Y2PQM0" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000069" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000069" - /transl_table=11 - /translation="MDESKMPEETPLMGPDGKVVKEANGKTLMVKTRVEFSESEAPMFG - PRAGEKRSVSTDAEGRETEIIEAVPSVPPAQGRKELGSRTMMSRLLEAVCALTMRARCA - PRMGR" - mRNA complement(68739..68951) - /locus_tag="JK1GL000071" - /note="hypothetical protein" - gene complement(68739..68951) - /locus_tag="JK1GL000071" - CDS complement(68739..68951) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A1A9CFR1" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000071" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000071" - /transl_table=11 - /translation="MRLRAYAILCIYALMLVNGIPRIADAPFETVMACSSVGFGFAAAA - AVLFLLSARKDSSARTAGPVAPWEG" - mRNA 68965..69090 - /locus_tag="JK1GL000070" - /note="hypothetical protein" - gene 68965..69090 - /locus_tag="JK1GL000070" - CDS 68965..69090 - /codon_start=1 - /locus_tag="JK1GL000070" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000070" - /transl_table=11 - /translation="MRIHGGVHPASIATGIGSMSVVDTASAIQWYSGFPFIPTPS" - mRNA complement(69802..70122) - /locus_tag="JK1GL000072" - /note="hypothetical protein" - gene complement(69802..70122) - /locus_tag="JK1GL000072" - CDS complement(69802..70122) - /codon_start=1 - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000072" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000072" - /transl_table=11 - /translation="MAFNVYKAAQWAMESHKGKGLIAGNRLDQDEVIAPERIPGIDAEV - IKNFRTMSEATERGVGQVLDSSKWTILVNDAWLLGGAHYMAQVVETVYGRPRQSMVCAF - SR" - mRNA 70261..70440 - /locus_tag="JK1GL000073" - /note="hypothetical protein" - gene 70261..70440 - /locus_tag="JK1GL000073" - CDS 70261..70440 - /codon_start=1 - /locus_tag="JK1GL000073" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000073" - /transl_table=11 - 
/translation="MSALLGSVAFPADNRRHADIARTYVASVRPRPGGGEIVLKLGDSL - LKPGVLDAWAPSGQ" - misc_feature 70270..70272 - /note="tta leucine codon, possible target for bldA - regulation" - /tool="antismash" - mRNA 70614..71384 - /locus_tag="JK1GL000074" - /note="hypothetical protein" - gene 70614..71384 - /locus_tag="JK1GL000074" - CDS 70614..71384 - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A3M0I621" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000074" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000074" - /transl_table=11 - /translation="MPDAALEALGGWWGQNAVRLTDGTPGAHTVRYTPSRWAHITTWPS - MMASTFQAGDADVSRTQVASIVADALERGACEEALVATYVWGKGKGGSPAGSGPATLHK - ILLGTEGLNAILASVVNTLREQDAEAAYAELRGRIAGFGPSFYSKFLYFAGKSVRAASG - TQPLILDQVLARRMRSLAQAVGRETGYDPDGSIARWVWRDTNWSPHRYAIYLSFMQAAS - RQVAATHSWPSNATPDLLEYALFTTSWVESAEAT" - mRNA complement(72274..73149) - /locus_tag="JK1GL000075" - /note="SDR family oxidoreductase" - gene complement(72274..73149) - /locus_tag="JK1GL000075" - CDS complement(72274..73149) - /EC_number="1.1.1.340" - /NRPS_PKS="Domain: PKS_KR (8-160). E-value: 1.8e-07. Score: - 23.0. 
Matches aSDomain: - nrpspksdomains_JK1GL000075_PKS_KR.1" - /NRPS_PKS="type: other" - /codon_start=1 - /db_xref="COG:COG4221 NADP-dependent 3-hydroxy acid - dehydrogenase YdfG" - /db_xref="UniProtKB/Swiss-Prot:Q82IY9 - 1-deoxy-11-beta-hydroxypentalenate dehydrogenase" - /db_xref="UniProtKB/TrEMBL:A0A454WJJ0" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1001:short-chain dehydrogenase/reductase SDR (Score: - 168.7; E-value: 2.7e-51)" - /gene_functions="biosynthetic-additional (t2pks) KR (Score: - 103.5; E-value: 3.6e-32)" - /gene_kind="biosynthetic-additional" - /locus_tag="JK1GL000075" - /note="GO_function: GO:0016491 - oxidoreductase activity" - /product="SDR family oxidoreductase" - /protein_id="ncbi_JK1GL000075" - /transl_table=11 - /translation="MNWPTGEAALVTGAASGIGFGVAHALVAAGAKVALVDIDEARLAG - AEQSLRDAGGTVLALPFDISETDRWESMADRAEEALGPISILCNVAGVNGGTTVDRTPL - QVWRWVHGVNVDAQFASVAAFLPRFKSRGGRSHIVNTSSISGLIPMAGVAAYTSSKFAS - VGLSMALREELAGTHVGVSLLVPGAVATPINFNAGAAEAKLLGREMDAAVVEKNSALLL - QGADPGRVGEQVVEAMQQGQFMVVTHREWGPFAAHVHREIERAYEEFDGRHGPDPVATA - MAAGEETISS" - aSDomain complement(72670..73125) - /aSDomain="PKS_KR" - /aSTool="nrps_pks_domains" - /database="nrpspksdomains.hmm" - /detection="hmmscan" - /domain_id="nrpspksdomains_JK1GL000075_PKS_KR.1" - /evalue="1.80E-07" - /label="JK1GL000075_PKS_KR.1" - /locus_tag="JK1GL000075" - /protein_end="160" - /protein_start="8" - /score="23.0" - /specificity="KR activity: inactive" - /specificity="KR stereochemistry: C2" - /tool="antismash" - /translation="ALVTGAASGIGFGVAHALVAAGAKVALVDIDEARLAGAEQSLRDA - GGTVLALPFDISETDRWESMADRAEEALGPISILCNVAGVNGGTTVDRTPLQVWRWVHG - VNVDAQFASVAAFLPRFKSRGGRSHIVNTSSISGLIPMAGVAAYTSSK" - CDS_motif complement(72676..72738) - /aSTool="nrps_pks_domains" - /database="abmotifs" - /detection="hmmscan" - /domain_id="nrpspksmotif_JK1GL000075_0002" - /evalue="3.80E-04" - /label="PKSI-KR_m4" - /locus_tag="JK1GL000075" - /protein_end="158" - /protein_start="137" - /score="13.0" - /tool="antismash" - 
/translation="IVNTSSISGLIPMAGVAAYTS" - CDS_motif complement(73054..73122) - /aSTool="nrps_pks_domains" - /database="abmotifs" - /detection="hmmscan" - /domain_id="nrpspksmotif_JK1GL000075_0001" - /evalue="1.50E-03" - /label="PKSI-KR_m1" - /locus_tag="JK1GL000075" - /protein_end="32" - /protein_start="9" - /score="11.2" - /tool="antismash" - /translation="LVTGAASGIGFGVAHALVAAGAK" - mRNA complement(73386..73754) - /locus_tag="JK1GL000076" - /note="hypothetical protein" - gene complement(73386..73754) - /locus_tag="JK1GL000076" - CDS complement(73386..73754) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A454WJH3" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000076" - /note="GO_function: GO:0003677 - DNA binding; GO_process: - GO:0006355 - regulation of transcription, DNA-templated" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000076" - /transl_table=11 - /translation="MALRLTDASTPAVDAADLGAMLLLAQTYDPEHPHEDVRALARLDR - RSADVLRTLVEADSVRSAAAELGMHHSTVQARHEALTHTLGYDPRSNVGRMRYIAAALL - LRLTDPVPPTRPGSPWNT" - mRNA complement(73739..74398) - /locus_tag="JK1GL000077" - /note="hypothetical protein" - gene complement(73739..74398) - /locus_tag="JK1GL000077" - CDS complement(73739..74398) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A454WJI3" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000077" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000077" - /transl_table=11 - /translation="MHQLVGRLNSLDPQAGETLRIVSYFDVLITRGAGLDGLLRGAAVL - SGTVAGAKIRGRVTRRDPDGHPVTDDADRRRHSSRRSHADWTVWLERDGEPEPADEMIV - ERLALGVELLDARRSPERGLDAIVDQARSVAERTALLAKRRIDPATPVRVLATAADAPE - ISEAPSAIVPTRYGLLRATLDLSGTIRRPPEPVGFGTRYEPTGPPNPGRRRSWRSD" - mRNA complement(74528..75133) - /locus_tag="JK1GL000078" - /note="acetyl esterase" - gene complement(74528..75133) - /locus_tag="JK1GL000078" - CDS complement(74528..75133) - /EC_number="3.1.1.-" - /codon_start=1 - /db_xref="COG:COG0657 Acetyl esterase/lipase" - /db_xref="UniProtKB/TrEMBL:A0A0N0YWT6" - 
/gene_functions="biosynthetic-additional (smcogs) - SMCOG1066:alpha/beta hydrolase domain-containing protein - (Score: 140.4; E-value: 1.1e-42)" - /gene_kind="biosynthetic-additional" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000078" - /note="GO_function: GO:0016787 - hydrolase activity" - /product="acetyl esterase" - /protein_id="ncbi_JK1GL000078" - /transl_table=11 - /translation="MVSGDQFSGLVQALPWVIEHDAVLVTVDYRLAPEHPDPYPVEDCY - AGLLWTAEHARELGMDPDRLIIAGQSAGGGLAAGVALMARDRQGPALIGQVLMYPMLDD - RDRTVSSAQFDAVGVWDRGSNVMGWTALLGERRGTDDVSAYALPHAPPISRDCHPRSST - AARPRCSGTRTSLTRRPCGTRAYRPNSTSGPVASTGSA" - mRNA complement(75120..77789) - /locus_tag="JK1GL000079" - /note="hypothetical protein" - gene complement(75120..77789) - /locus_tag="JK1GL000079" - CDS complement(75120..77789) - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A2R2WDT7" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1066:alpha/beta hydrolase domain-containing protein - (Score: 200.2; E-value: 7e-61)" - /gene_kind="biosynthetic-additional" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000079" - /note="GO_function: GO:0008270 - zinc ion binding; - GO_function: GO:0016491 - oxidoreductase activity; - GO_function: GO:0016787 - hydrolase activity; GO_process: - GO:0055114 - oxidation-reduction process" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000079" - /transl_table=11 - /translation="MPTHPRPPFHPEAEAALTALAEPMPAVTPGAIPVLRQAALPVVSD - KTLLAAGVTRRDVTVPGHHGAELVASVIARSGHTGTGPGIYHIHGGGMIAGERVIGVSQ - ILPWIVEHDAVAVTVEYRLAPEFPDPCPVEDCYAGLVWTAEHAAELGIDPGRLIIAGAS - AGGGLAAGTALLARDRKGPALIGQVLICPMLGDRDRTVSSPQYEDAGRWVRESNRTGWA - ALLGDRCGTDEVSVYAAPARASDLEGLPPAFIDCGSAEVFRDEDAAYANALMELRRAGR - AACMARRLPRIRHARAGLRHRTGSDRGPERMSRPHSRRTVSGHERAVSRAVASAVLDRT - ERGVGTPGGARRDGPRRQERPPVTGGHGTGKRRRNMKAARFYGREDIRIEEAAEPSPGP - GQVKLRNAFAGICGSDLHFFFYPESLPFSLDEPHPLTGATLPQILGHEFSGTVVETGEG - VTDVRVGDRCAVFPLAVSCGKCAACRRGLPFSCPLMGSLGSNVEGGGLSEFTVCEASKV - 
HVLPDGVDLRMGALVEPMAVGWHAVARSGVRPGGSALVAGAGPIGIGTWFAFKARGVEK - VLVSEPSEDRRAIMAALGARVIDPVNEDLADAVASLTDGDGVDAAVDAAGAGAAVTSAM - AGLVPGGRLVVAALHEHTMDFQPTRLMMGETEIVGAVGYRPEEFDEVIAAMADGFYTPP - AGCGNCRWRALSTPSTRCATASAGRPFCAWAEAPEHSGTDGSRVLSVPGCARPVRTRRA - SGGGHGPRLRRSAVRHEAAHPARLMYTATMRCGRTRSSHVQQRSAPPVRPGARGRTRGP - RGPDPADPDRGHDPRHAPGGTGRGHRRDARDLRSDPTRRHDPGVPGRRNHRLCDRPGGS - SGARAGDLPHARRRHGLR" - mRNA 78186..78578 - /locus_tag="JK1GL000080" - /note="MULTISPECIES: SDR family NAD(P)-dependent - oxidoreductase" - gene 78186..78578 - /locus_tag="JK1GL000080" - CDS 78186..78578 - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A454WJI7" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000080" - /product="MULTISPECIES: SDR family NAD(P)-dependent - oxidoreductase" - /protein_id="ncbi_JK1GL000080" - /transl_table=11 - /translation="MALADIDEERLDDDAKKPAGAGGTAMAVPLDVSDADSSAAAADRA - EEALGPISILRSNPAAPTSRSEPASSTFARMKGILRDFRLKGNSAHYAMLSIARLHNLA - LTGERTLRTAGHLTRVHWEIISGTAL" - mRNA complement(78575..79306) - /locus_tag="JK1GL000081" - /note="MULTISPECIES: class I SAM-dependent - methyltransferase" - gene complement(78575..79306) - /locus_tag="JK1GL000081" - CDS complement(78575..79306) - /EC_number="2.1.1.156" - /codon_start=1 - /db_xref="COG:COG2226 Ubiquinone/menaquinone biosynthesis - C-methylase UbiE" - /db_xref="UniProtKB/TrEMBL:A0A454WJJ2" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1248:methyltransferase (Score: 127.7; E-value: - 8.5e-39)" - /gene_kind="biosynthetic-additional" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000081" - /product="MULTISPECIES: class I SAM-dependent - methyltransferase" - /protein_id="ncbi_JK1GL000081" - /transl_table=11 - /translation="MYEWLIGDDRLTPAKAAAVYYSDVVGSVPPSARVLDCACGTGQLA - VGLASLGLDVVAADASDGMVRRTEKAADEQGVSLRALHARWDELPDHLEDSTFDLVFCV - GNSLGHAEGAAGRLAALAAMSRLLKPGGRLVLHSRNWELVRSAGSRVDVRDRLVRRNDR - DAVVSYYWQIEQRWEQEHFLEIVVAQIEPDGAVRACSERLSIWPYRYEDLVVQLRSVGL - RVESTTFDPESDGYLMVASRD" - mRNA 
complement(79932..80435) - /locus_tag="JK1GL000082" - /note="MULTISPECIES: GNAT family N-acetyltransferase" - gene complement(79932..80435) - /locus_tag="JK1GL000082" - CDS complement(79932..80435) - /codon_start=1 - /db_xref="COG:COG3153 Predicted N-acetyltransferase YhbS" - /db_xref="UniProtKB/TrEMBL:A0A454WJI5" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000082" - /note="GO_function: GO:0008080 - N-acetyltransferase - activity" - /product="MULTISPECIES: GNAT family N-acetyltransferase" - /protein_id="ncbi_JK1GL000082" - /transl_table=11 - /translation="MVRLAQYTKADQEEILGNSDDPFGVAWTGLTWLPKEEHFGIRHHG - RLVAHAGLLRLPVAISDAETEVVGVGGVAVSPAMQGQGFARLVVTAALEHARTMGPQHA - LLFCRPPLVSLYQRLGWHPLDKDVLVEQPEGRLVTMPLRTMVTPLLDDARWPSGPVRLF - SLPM" - mRNA 80441..81022 - /locus_tag="JK1GL000083" - /note="hypothetical protein" - gene 80441..81022 - /locus_tag="JK1GL000083" - CDS 80441..81022 - /codon_start=1 - /db_xref="COG:COG1309 DNA-binding transcriptional - regulator, AcrR family" - /db_xref="UniProtKB/TrEMBL:G2GK72" - /gene_functions="regulatory (smcogs) SMCOG1215:TetR family - transcriptional regulator (Score: 94; E-value: 2.1e-28)" - /gene_kind="regulatory" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000083" - /note="GO_function: GO:0003677 - DNA binding" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000083" - /transl_table=11 - /translation="MPQWTGSQTYPHDDLSADHWPECRARDGSPGSLAAVTAGLVGLRL - IQAHAGRLFTDHGYDAVTVADVAKAAGVSSMTVYRNFPTKGDLVLIDQPAQLIAEHVAA - SSATQPLVRRIGSALIDAATASTSGNGDEQAADERFLLDCLRLMVSTPALRPRHLDSQY - ALQQAIVEALGKDAADPDAAFRAEARERHR" - misc_feature 80567..80569 - /note="tta leucine codon, possible target for bldA - regulation" - /tool="antismash" - mRNA complement(81216..81332) - /locus_tag="JK1GL000085" - /note="hypothetical protein" - gene complement(81216..81332) - /locus_tag="JK1GL000085" - CDS complement(81216..81332) - /codon_start=1 - /locus_tag="JK1GL000085" - /product="hypothetical protein" - 
/protein_id="ncbi_JK1GL000085" - /transl_table=11 - /translation="MRARVAAGMICAVACRRPRSGRISITQKMPRKAPPPWS" - mRNA 81456..81854 - /locus_tag="JK1GL000084" - /note="hypothetical protein" - gene 81456..81854 - /locus_tag="JK1GL000084" - CDS 81456..81854 - /codon_start=1 - /db_xref="UniProtKB/TrEMBL:A0A101MYS4" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000084" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000084" - /transl_table=11 - /translation="MVRRRRRPAGAAPRPPARTPVGSEGQLAGNWRGADGSVLQLAPGG - QAELTRVPAHNDVDEDGDFSLCDGTGTWTREEGNDFQNTDRDGVLVHLDDECGQETYWT - IGGTELKPELFVLFGDPDTGELRILTQP" - mRNA 82128..82394 - /locus_tag="JK1GL000086" - /note="hypothetical protein" - gene 82128..82394 - /locus_tag="JK1GL000086" - CDS 82128..82394 - /codon_start=1 - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000086" - /product="hypothetical protein" - /protein_id="ncbi_JK1GL000086" - /transl_table=11 - /translation="MPWNGYGEQRAMADLTPRHHRGRSAHRQSAQVVVCPGAAPAVGVE - DRAVQGEAVAGVGGLGVVEQDQVQPVTPELLVVVRVGGSGPGR" - mRNA complement(82569..83279) - /locus_tag="JK1GL000087" - /note="MULTISPECIES: alpha/beta hydrolase" - gene complement(82569..83279) - /locus_tag="JK1GL000087" - CDS complement(82569..83279) - /codon_start=1 - /db_xref="COG:COG0596 Pimeloyl-ACP methyl ester - carboxylesterase" - /db_xref="UniProtKB/TrEMBL:A0A454WJG9" - /gene_functions="biosynthetic-additional - (rule-based-clusters) Abhydrolase_6" - /gene_functions="biosynthetic-additional - (rule-based-clusters) PF00561" - /gene_functions="biosynthetic-additional (smcogs) - SMCOG1036:alpha/beta hydrolase fold protein (Score: 90.9; - E-value: 1.9e-27)" - /gene_kind="biosynthetic-additional" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000087" - /product="MULTISPECIES: alpha/beta hydrolase" - /protein_id="ncbi_JK1GL000087" - /sec_met_domain="Abhydrolase_6 (E-value: 2.4e-16, bitscore: - 59.7, seeds: 455, tool: rule-based-clusters)" - /sec_met_domain="PF00561 
(E-value: 5.3e-13, bitscore: 47.9, - seeds: 48, tool: rule-based-clusters)" - /transl_table=11 - /translation="MFLHYWGGSARTWDLVVDRLSGRDVLTVDFRGWSRSSALPGPYTL - GQFADDTLAVLADAGITDYILVGHSMGGKVAQLVAAARPAGLRGMVLVGSAPARPAAQV - TPEYQQALSHAYDCAESVAGARDHVLTATELPEPVKAQIVTDSRTVTDAARTEWPLHGI - TQDITEHTRTVSVPVLVVAGEHDQVEPVGVLRDNLVPYLSHADFVVIPHTGHLIPLEAP - ANLVDAITAFAPTA" - mRNA 83457..84281 - /locus_tag="JK1GL000088" - /note="MULTISPECIES: AraC family transcriptional regulator" - gene 83457..84281 - /locus_tag="JK1GL000088" - CDS 83457..84281 - /codon_start=1 - /db_xref="COG:COG2207 AraC-type DNA-binding domain and - AraC-containing proteins" - /db_xref="UniProtKB/TrEMBL:A0A454WJH6" - /gene_functions="regulatory (smcogs) SMCOG1260:AraC family - transcriptional regulator (Score: 44.3; E-value: 2.8e-13)" - /gene_kind="regulatory" - /inference="similar to DNA sequence:INSD:" - /locus_tag="JK1GL000088" - /note="GO_function: GO:0003677 - DNA binding; GO_function: - GO:0003700 - DNA-binding transcription factor activity; - GO_function: GO:0043565 - sequence-specific DNA binding; - GO_process: GO:0006355 - regulation of transcription, - DNA-templated" - /product="MULTISPECIES: AraC family transcriptional - regulator" - /protein_id="ncbi_JK1GL000088" - /transl_table=11 - /translation="MSVIRQMTYQPAGRPATSVEVMTFGRLRELNDGGTQRADFHVLAV - VDAGPGSVTVDFRHYPLQDRSAVWIPPGAVHRWDDIADVAGHLVLFVPTAPVTHATREL - AASPDPAAHWGIPDADWPFVDTARSHLLFEASAPPSESRTELPEILLSALITRLHPPHA - EALTPQVFRLFRSSVEAHFRRHHDADYYARALGYAPRTLSRAVQQATGRTAKAYIVERI - VLEAKRLLAHDRLTAARCADVLGFPDASNFSAFFRRATGMRPGAWQAMMAAE" -ORIGIN - 1 gtggcggtga ccgccgacgc gacgacagtg aactggaaca tctggggcga cgtggcggtg - 61 gcggtgctgc cgcagccgta tctggacaag gtgacgcagg cgggcggcgc cccggtgctg - 121 ctgcccccgc tcgtggaggc ggtggagtcc gtgatggagc gggtggacgc cctgctgatg - 181 agcggtggcg cggacatcga cccggccctg tacggcgccc ggcccggtga gttcgtcttc - 241 ccgccgcacc cggcgcgtga cgcggcggag ctggccgccc tggccgtggc ggaacggcgg - 301 ggcatccccg tcctcggggt ctgccggggt ctgcagctga tctcgatcac 
ccgcggcggc - 361 accctcgacc agcacctgcc cgagcactcc cccgccgtgc ccggccgtta cgagccgcgc - 421 accatccggg tgaagcccga ctcgctgctg ggcggcgcgc tcggaccgtc gccgaccgtg - 481 tactgccacc accaccaggg catcgacaag ctcggcgccg ggctggtggc caccgcctgg - 541 tcggacgacg gcgtcatcga gggggcggag gccgaggacc cgtcggcgcc cttcctggcc - 601 ggtctgcaag cccacggtga actgggcgag gacaccgtcg cgctgttcga ggcgttcatc - 661 gaggcggcga aggccggacc gcgccgctga ccggccttcg ccgccggccc cggccacagc - 721 acgtgacggc cgccgcccgc ggccccgctc gatgcggggc cgcgggcggc ggccgtctgc - 781 ggtcgtcccg tgcccgggcg cgggacgccg gcgaagaccg gtccggtctc cagtgagcca - 841 ccgcaccgcg ccggcggcgc gggggatgtg accgccgcac gatgcggtgg cggcaccgga - 901 tgggacccga ccctcatctg tctgacgacg cgcgggcctc gtgtgtgacg gggcgggcga - 961 aaccggtgcc ggaccggtgt gcgccggctg gtcagacgcc ggccgcgccg acggcgtgcg - 1021 ccctgctgcc ggcggtgtcc cggccgcggc cgaaccagcg ctccagtgcc cgcccgagca - 1081 gttccacgcc gtccggggcc gcccaggcga catggccgtc ggggcgcagc agcaccgcag - 1141 cgggacggtc cccggtcacc ggctcggccc actcccccac gaccgtgcgg acccggtcgt - 1201 cccagccggc ggcggccccg cggacgcgcg cggcgtcgtc cgccgcgccg gtgaccagga - 1261 gtacaccgcg cgccgggtgg agcagttcgg cgacccgggt gcggccgccg tcctcgagca - 1321 gcagctcgtg gccgggagcc agccgcagac cgagcagcgg atggtcgccg ggacccatgt - 1381 cgtagcggat gtcgacgccg ctgacgatcc cggccaggtg ccgggcggcc tcgggcagtt - 1441 ccaccagttc acgcatgacg gcgcgcagcg gctccatctc gtcgccggtg aggtagaggc - 1501 gggtctgggc gcgggtgttg cgcatcagct tctcgccgac cgggtgccgc tcgctctcga - 1561 aggtgtcgag caggccttcg ggtgcccagc cgttgatggc cgcggccagc ttccagccga - 1621 ggttggcggc gtcctggacg ccgacgctca tgccctgtgc gccggccggc atgtggatgt - 1681 gggtggcgtc gccggcgagg aagacccggc cgctgcggta gtgctcggcc tggcgggtgg - 1741 tgtcggtgaa ggagctgatc cagcggacct ccgcgtggtg cagcgactcg ccggtcatgc - 1801 gctgccaggc gtcggcgatg tcggtgaacc tcagggcgct cttgtcctcg ggcgggcgca - 1861 ggttctcgtc gtggatgacg atccggtcca cgccgttctc caggttgaac gccatcacca - 1921 tgccgcccgg caccttctcg ccgatgggcc gctgccgcac cccggcgccg accaggtcgg - 1981 ccatgtacat gccgcgggtg 
gcgccccagc ccttgaagtc gatgcccgcc agggtccgca - 2041 ccaggctgcg tgccccgtcg cagcccacca ggtactgcgc ggtgtcctca ccgtgcccgt - 2101 ccgggccctc gtactcgacg acgacgccgt ccggcctctc ccggtagccg gtcacctcgt - 2161 ggttgcgcag gacgggcacg cccagttcct tgagccagtt ctcgaggatc tcctcggtgc - 2221 ggaactgggg tacgccgcgg acgctgaagt gattgtcgtc cagcttgccg aaatcgatgc - 2281 gtacgccgcc gaagtggccc tgggcccatt cgacgtcgcc gaagcgttcc agcagaccgc - 2341 gctgctcgaa cacctcggcc gcccggcggg tgaagccgac gccgcgcgac tccccgctgg - 2401 gtccgggcag cttgtcgtag accaccacgt ccacgccgcc gagccgcagt tcaccggcga - 2461 gcatcagccc gaccggaccg gcgccgacga cgatcgcgcc ctttgccatg tcgtactcct - 2521 catgcagatg gatggcgtga gtcagccgaa gaagtcgagc agggccccgg cgacgacctc - 2581 gggctcctcc tcgggcaggt agtgcaccga cttcgacgcc cgcaccatgc gcacgtcggt - 2641 ggcctgcgcg gtgagcttgc gctgaaggtc ctcgtaggtg aagttgccgc cgatgccgag - 2701 tacgggcatg gtcagcctgc cgtagccggc caggtcggcg atgtcctggt ggcacgcctg - 2761 gtaccagccg gtgccggccc ggatggcctg cgggctgttg taggcgtgcg cgtagatctc - 2821 gcggtcggcc tcgccgacca ggttctggtc ggcgagggag tgggcgaaca gccagtcgat - 2881 cacgtggcgc atgcggccgc acatcagctg ttccggcagc tgctggagct ggttgaccgc - 2941 ccaccaccac agggcggttc cggtcccggg ccggtacagc agccgcaggt cgtactcgct - 3001 ctcgtcgggg tgcggggtgt ccagcagtgc cagcctgcgg gtcgcttcgg ggtggttggc - 3061 ggcgaaggcg aacgccacca tggccccgat gtcgtgtccg gcgatgtcca cctgccggtg - 3121 gcccaggtgc cgcaccaggg cgtgcaggtc cgccgccatc gtcttcttgt cgtagccgcc - 3181 cgcgggcttg tccgagccgc ccatgccgcg caggtcgacg gcgatgacgc ggtgggtgcg - 3241 ggcgagctgg ggcatgacct tgcggtacgc ccaccaggtc tgcggccagc cgggcacgag - 3301 cagcaggggc cgtccgtgcc cgccggtcac gtagtgcagg cgcacgccgt tgaccgtggc - 3361 gcagcggctg cggaaaccgc cgggcaggga gcgggccagt tcgctgtcgg agggcacgga - 3421 gccggtgtgt tcgcgggcgt gggcggcagt ggcggtgccc gtcatggcga gggccgtcgc - 3481 tcctgtgccc agggcgagca tcgtgcgtct gttcagcgtc atctacccaa gtcctcgtcg - 3541 cttcgtggcc ggtgggccaa tcaggcgcgg aaggcgccgg cgtgctggtc cgcccatacg - 3601 gtgaaggggc gggccgggtg tccggtgagc tgctcgacgt 
ggtcggtgag cggcaccggc - 3661 gccgtgctgg ccgcccacag cttcagcagc gcgtcggcga tgtcgtccgg catgaagtcc - 3721 ggcttgttgg cccgccacac ctgcgggggg atccgctcga cggggatgtc ccggcccgcc - 3781 gcggccgcga tgatcgcgac gtgctcggcg aaggtgaggg actgcggccc ggtgaggtgg - 3841 tacgaccggc cgcgcagcgc ggggtcggtg aggaccgcgc acgccgcttc cgcgatgtcg - 3901 cgctcgttga ccggatcggc gtggctgtcc gggtagggca ggcccaccgc gccgcgcgcc - 3961 ttcagcgacc acgcccaggg cagggcgttg ccggccagtg cgccgcagtt caggggcgtg - 4021 gaggtgaggg acgacgcggc gagggcctgc tcgacggcga ggtggggggc ggcgatcggg - 4081 tcgtcggcgg ctgaggggcg cagcacggcg tcggcggaca tgatcacgac gtgttccacg - 4141 ccggctttct cggcctgcgc cacgaaggcg tcgaccgccg ccggctcggc gtacaggaag - 4201 acggagtcga caccgtcgag ggcggcggcg aaatcggccg gggtgtcgag tgcgagccgt - 4261 accgactcgg tgcccgcggg cagggacagc ttctcggggt tgctggaacc ggcgcggacg - 4321 gcgacgccgc gttcgtgcag tacctgcacg agcagggagc cgaccttgcc gcggctgccg - 4381 gtgacgagga cggtcatgac agtggccttc cgggggtctg ggggcggggt gaggggcccg - 4441 gcggggtgcc ggcgcggcct gcgcggcgtc gccggtggcg gggagttcgg cggtggcggg - 4501 gtgttcggcc gtggcggggt gttcggccgt ggcggggtgt ccggcggctg ccgggcggtg - 4561 ccgccgggcg gtcggcctgc gggtggcggg ccccggtgtg cgagacggcc ggggcccggc - 4621 gggcctgcgc cggtgtcaga ccgcggccgc gccgaaccag cgggtgaggg cgtcggtcac - 4681 atcgccgccg tccggggccg cccagacgac atggccgtcg ggacgcagca gcaccgcttc - 4741 ggggccgccg tcctccgccc aggtgccggc gacgacgtcg acccggtcgg accagtcggc - 4801 ggcggtcttg tggacggtgg aggggtcgcc ggtgacgatc agcacgcccc gggcctcgtg - 4861 cagcagttcg gcgacccgga cgcgggtgcc gtcggcgcgt tgcagcgcgc gctgcagcgg - 4921 caggcgcagg cccagcagcg ggtgttcgcc ggctccgacg tcgtagcgga tgtgcaggcc - 4981 gctgacctgg ccggccagat agcgggccgc gtcggggatg cgcacgagtt cgcgcatgac - 5041 cgcgcgcagc ggctccatct cctcgccgct gaggtagagc agcgactggg cgtggacgtt - 5101 gcgcagcagc tgctcgccga gcgggtgccg ctcggcgtgg taggtgtcga ggaggccgtc - 5161 gggggcccag ccgttgatcg tcgcggccag tttccagccg aggttgacgg cgtcctggag - 5221 gccgacgctg acgccctgcg cgcccagcgg cgcgtggtcg tgggcggcgt cgccggcgag - 5281 
gaggacgcgg ccgctgcggt actgctcggc gaggccggtg gcgttggtga gggcggtcat - 5341 ccagcgggtg tggccgtggt ggatggactc gccggtcatg cgctgccagg cgtcggccac - 5401 ctcggtgaag gtcagcgtgc cctcgccgtg gtgggggcgg acgccgggct cgtggatgac - 5461 gatccggtcg tagccgtcgc ccaggccgac cgagaggacc atgccgccgc cctcgacgcg - 5521 ctccccgatg ggccgcggcc ggatgtcggc gccggtgacg tccgccaggt acatgccgcg - 5581 cgtcgcctcg tcgcccggga aggcgatgcc ggccaggcgg cgcacggtgc tgcggccgcc - 5641 gtcgcagccg atgaggtact gcgcgtggtc ctcgccgggg ccgtcggggc cgtcgtagcg - 5701 gacgacgacg ccgtcctcgg tctcctcgaa gccggtgacc tcacggccgc ggagcacggg - 5761 cacgcccagg cgggccgtcc agtcgccgag cagctgctcg gtgcgggact gggcgagccc - 5821 catcactccg aagtggctct cctccagcag ggtgaagtcg atgcggacgc cgccgaagtg - 5881 gccgtgccgg ccccagcgga attcccccag ctcgtcgagg agcccacgct ggtcgaggac - 5941 ttcggcggtg cggctggtga agccgaggcc acgcgattcc ccgctgggcg cgggcagttt - 6001 gtcgtagacg accacgtcca cgccgccgag ccgtagctca ccggcgagca tcagtccgac - 6061 cggcccggcg ccgacgacta tcgcgccctt tgccatgaag tactcctcac gcagatcgtt - 6121 ggtgaaccgc tcccgtgtgc gcggcggcag ccaggcacca ggaaagacct caccgatcga - 6181 gcggcgctgc agccggagtg cagggcctct caaaagcggc ccgccccgcc gcgggccggg - 6241 tccggggcgg ggtggcgcgg gcggtggcgg cggggcgtgt gaccaggtgt ccgtgcccgc - 6301 gggcggccgg ggtgcgggcg ccgcggcggc cgagcggggt cggtgacggc ggccgagccg - 6361 ggtcggtgac ggctccagcc ggcggcgagc ggatgccgag ccggccgccg tcaccgagcc - 6421 ggccgccgtc accgggcggg ggcgcggagg cgggcggggc ggggcggcgg gggcgccggg - 6481 gtgcgggcgc ggaacggccc cgccggttcg ggggacgacc ggcggggccg tggactgtgg - 6541 gtccggtgcc gcccgggaaa cgcccgggcg cggtggtgct acttctccgc gtcggccttc - 6601 accagggcgg ggccttcgcc cgcctcggcc ggggccgagc tcatggactg cttgccgcgg - 6661 ggcatcagga aggtgaccac cagcagcgcg accgtgccga gcatggcgcc cgagaggaac - 6721 gcgtcgtggt tggccgcctc gtggacctcg gcgatcagct cgggcttgcc gcccgtcgcg - 6781 gccatctcgg tgctcatgcc gctgtaggcg atggtcgcca cgacggccag gccgagggcg - 6841 ccgccggctt cctggctggt gttgatcagg ccggcgccca ctcccgcgtc ctcgtcggtg - 6901 actccgacga acgcggcgat 
ctgcagggtc acgaagacca tgccgcagcc gaggccgagc - 6961 aggatgaacg gggccagcag gtcgaccacg tagctgccgt cggcgggggc ccgccacatc - 7021 agcagcagac cggcgacggt gagcgtgaga cccatcatca cgaccggacg ggccgccatc - 7081 ttggtgacca ggccggaggc gatgcccgcg ccggccgcga cggagaacgc gagcggcacg - 7141 taggcgaagc ccgccttgag cggcgagtag ccgaacgcct gctgcatgaa gaggctggcg - 7201 aagaagaaca gcgagccgaa ggtgccgaag accagcacgg cggagatgtt cgcgacccgc - 7261 atggtcttca gccggaagat gcgcagcggc atcatcggcg aggcgacctt ggcctcgatg - 7321 acgacgaagg ccgtcagcag cgcgaccacg ccgaccagcg aaccgatggt gcggaaggtg - 7381 tcccagccga cggtggtggc ctcaccgagc gtgaagatca gcagcagcag gccggcggtg - 7441 agggtgaccg ctccgagggt gtcgaacttg ccccgctcct cggccttgct ctcgggcagg - 7501 atgcgcggtg ccagcacggc ggcgcccaga ccgatcggca cgttgatcca gaagatccac - 7561 tcccagcccc aggtgtcggc gagcacaccg ccgaggatca caccgacgat ggacgcgata - 7621 ccggacagcg agccccacac gcccagcgcc ttgttgcgct cgggtccctc ggcgaaggtg - 7681 ttggtcagga tcgccagggc ggcgggggtg atcagtgccg cgccgaagcc ctggacggcg - 7741 cgcgaggcga tgagcatcgt gccgttctcg gcgagaccgg aggtcagcga cgccagcgcg - 7801 aagatcacga agccgatctg gatcagccgg cggcggccga aggtgtccgc cagccgcccg - 7861 cccagcagca ggaagccgcc caggacggtg gcgtaggccg tgacgatgta gttcaggctg - 7921 acctcggaca tgccgaggcc ctcctggatg gagggcagag cgaggttcac gatcgacacg - 7981 tcggtgaaga ccatgaactg gcccatgcag acgaatgcca ggatcagccc ggggctcagg - 8041 cccgcccctg atgctgaccg ggccgtggtg gcgtcggagg cagccatcga ttactcctca - 8101 gaaggtgcag gatcgggtca tcgaacgcgg cccgcgccgg atggggccgg cgggaaccgc - 8161 tgggacagcc gccgggaggg actcggcggc cggagtgggt ccgtcgcagc tatgacgacc - 8221 ggggaccggc ggatgtgacc ggtcggcccg aatcgtctcc gggaccgccc cgcagtccct - 8281 ggatgccggc ctcgtactgg ctgatcagcc ggggtccggc ggcacgcagc tgcggcggga - 8341 agttctccgt cagcaggtcc cggccgcgcg cgggctcggg gtcgtcgagc aacccgaaca - 8401 tgaagtgcag accgaaacgc ggggagccct ggacgaacgc ctcgcgcagc cggtcgatgt - 8461 cgtccgcggg gaccccgggg aacaggtctt ccaccacggc ctcctcggcc gtgaggtgtc - 8521 cgtcgagcac ctggtggacc tgccgggcgg cctcggcgcc 
cgcccgggcg ccgtccgtcc - 8581 cgccggtggc ccgtgcggcc tgcgtcgcct cgtcgagggc gtcgatcgcc gtctccaggg - 8641 cgttcagcct ccggtcgagg accacgtggt cgtccgacag ttccttgagc tgtgcccgcg - 8701 cgtcggggta gagcgcctcc agcacgggcc agaagaggtc gtcctccgcc ttgtggtggg - 8761 cgtgggtgaa cgcgagcagc caccggcccg cgtcgaccag cgtcgcggtg tctgtgtcgt - 8821 ggccgtcggc cagccgctcg taggcgtcca ccaccaggcg cgtgccgcgc cgcagcaccg - 8881 cgtggatcgc gacgaactcc tcgtacatgc gggcgcccgg gctctgggcc ggatcgctca - 8941 tggacactcc cgtttcgcag tggcagggcc gtggccggac acgggtgccg gtgcggtccc - 9001 gtgggccgcg gccagtacac acgggcccgc acgaagcagc ctcgaggaat gctggaggcc - 9061 cgctcccgcc aggccgggca cgctcgagga atgcttgacg ggaagggccc gcccggcgct - 9121 tgccgtcagt ggccgcccgg cgcacgggaa acggccggcc gtgcggtgtc ctggcccgcc - 9181 ctgcgcagcg cgacctcccg cacgagcagt cccgcgccca gcaccgcggc gccgacaccc - 9241 gcgcagagca ggaacgcgac gtgggtgccc gcggcggtcg cgtgccggta ggcctcgtgc - 9301 agggcgggct ccaggcgctc aaggctctgc gcgtccagcc gggcgttgtc cagcgcgggg - 9361 acgccgggtg cccgctcggc cgtcacccgc agcacctcgc ggttgaacag ggtgcccatc - 9421 acggcgaccc cgaagcagct gcccagggtg cggaagaggg tgacggccgc ggaggcggca - 9481 ccgatgtcgc gcagttccac gctgttctgg gcgaccaccg tcacggtctg cgtcaggcag - 9541 cccagccccg cgcccagcac cgccatggac agggccgccg tgggccgcga ggtggaggtg - 9601 tccatccgcg acagcagcca ggccccggcg cacagcaggg caccgccggt caccgggaac - 9661 accttgtagc ggccgctgac cgtggtgacc ctgcccgcca ccagcgacgc cgcgatcagc - 9721 gcggccagca tcggcagcag cagcaggccg gagttggtcg ccgaggcgcc ctggacggcc - 9781 tgctggtaca gaggcaggaa gagcagcacc ccgaacatca cgaagccggt gaggaaaccg - 9841 atcaccgaca tcagcgtgaa gttgcgtacc tggaacatgt ggagcggcat gatcgggtcg - 9901 gcggtgcgcg cctgccgccg gacgaaggcc cacagggcgg caccggccgc cgcggcgagg - 9961 agcacgacgg cggcggagtc ccaggcgtag cgggtgccgc cccaggtggt gagcaggacg - 10021 gtggcggaga tcccgaccgt cagcagcgcc gcgcccaggg tgtcgacgcg ggccacccgg - 10081 ctccgtcggg gcagccgcag cagccgccag atcatcgcca gggcgagcgc gccgagcggc - 10141 aggttgaggt agaaggccca gcgccagccg aggtggtcgg tgaccgcgcc gccggccatg - 
10201 gggccgccga tcatggcgac cgccatcgcg ccggagatca ggccctggta ccggccgcgt - 10261 tcgcggggcg gcaccagctc ccccacgatc gccatgacgc cggccatcag accgccggcg - 10321 cccagtccct gcacggcccg gaacccgatc agctggccca tgtcctgggc cgctccgctc - 10381 agtgccgagc cggccaggaa gaccacgatc gcggcgagca ggacgttctt gcggtcccgt - 10441 acgtccccga gccggcccca cacgggcgtg gagacggccg tggccagggt gtaggcggtg - 10501 acgacccacg acacgtgctc caggccgccg agttccgcgg tgacggtggg cagggccgtg - 10561 cccacgatca tggtgtcgag ctgggacagc atcatcgccg ccaccagcgg gatcaacagc - 10621 acccgtacgg acgtgccggc gggccggccc tgggcggcgg acgccgggtc ctcgacggtc - 10681 gtcatcacgg ctcccggctc gtacgcccgt ggagcgccgg gactatccgg cgcccagttt - 10741 gaatccgacg ccccgcacgg tcacgatcca cccgctgccg cccagtttgc cgcgcaggct - 10801 gctgacgtgg gtgtcgaccg tgcgctggga ccaggagtcc ccccagacct gcttgagcag - 10861 gtgcttgcgc gggatgacgg tgtcggggtg cgaggcgagc aggcacagca gatcgaactc - 10921 cttgcgggtc agcgcgacac cgctgccgtc cacggtgacc tcgcgggagt cgacgtcgat - 10981 gtgcagccgt ccgcggcgga tgtagcggcg ggcggccggc tgccagtggg tgcggcgcat - 11041 gacggcctcg atgcgggcca tcagttcgcg cagcccgtag ggcttggtca cgtagtcgtc - 11101 ggcgcccgcc tggaggccca ggacgcagtc cagttcggac tggcgggcgg tgacgatgac - 11161 gacgggcacc cggctgaccg cgcggatggc ccggcacacc tccagcccgt ccaggtccgg - 11221 cagttccagg gcgagcagca ccagatcggc gtccgcgtgc gcctggaggg cctgtccccc - 11281 gcactgcacg gcgacgggct cgtggccgta tcggcgcagc tgggtgacga gggagtcgcc - 11341 ggggccgacg tcggcgtcca cgacgaggat gcgccgtccg ccgggtgccg gcgcggcggg - 11401 cgcgggcgcc gtgccgtcct ggaccagccg gatgagctgg gacgtggatg tgcggagttc - 11461 cggcagcgtc tgtgccgaca tctgactcat gcctccccca gaggtcctgc acggtccgtg - 11521 gggcgtgggg agcgtcggcc ctatcctgcc gggccggctc ccgccgtgcg ccccgcccca - 11581 cggtaggaac cggtggtcga gccccggtac agcgccgggc cggacggcgt cgagccggtc - 11641 cggtcgcggc gcggccttgg cccggttacg ggttgagcac ccacgccgag ttgtgctggg - 11701 tgaatccgat gtgggggtag taggcggtgg ccgcgggcgc cgacagcagc acgatcttgg - 11761 cggtgggcgc ctccttgcgg gtggcgtcga tcagggcccg gccgatgccc gagcgctgga - 
11821 gccggccgtc cacggcgatg tcggacaggt aggtgacgta ggagaagtcg gagacgctgc - 11881 gggcgatgcc gatcagggcg ccgtcgccgt cgcgggcgac cagtaccagg ttggcgccgg - 11941 tcagcatcgc cttcatgcgg tcgcggtcct cgacgggccg ccgctcaccc agtccggacg - 12001 agcggtagac ggcgagcacc tcgtccaggt ccaggtcctt gccctcggca cgctcaatcg - 12061 tccagttcac gaagggtctc caatcgggtg cgaatcacgt cgtggcgggt gaggaagcgc - 12121 tcgggttcga ggctttcgac gtcgatgccc tcgcgggcca ggccggcggc gaagtgttcg - 12181 ccggtggcga gggtgtggtc ggcggcggcc tggacgccac ggtaggcgcg ttcgcgttcc - 12241 acgccgcggg cgaggaggtc ggccaggacc gcggagctgt ggatgaggcc gtcggtggtg - 12301 tcgatgtggg cgcgcatccg ctcggggcgc acggtcaggg agtttatgag gtcggcggcc - 12361 atcactgtct ggaagtgtcc cacggacagg ctgtcgggca ggatgacccg ttccacggac - 12421 tggtgggcga ggtcgcgttc gtgccacagt gccacgttct ccagggcggt gtcggcgtag - 12481 ccccgcagca gccgggccag tccgcacagc cgttcgctgg tggtggggtt gcgcttgtgg - 12541 ggcatggcgc tggagccctg gtaggcgccg gtccggtgtt cctcgacctc gcggacctcg - 12601 gtgcgctgca gcagtcgcag ttccagggcg atctgttcga tgcaggcgcc cagcgcggcg - 12661 accgcctgca tcagctgggc gtgccggtcg cgggcgacga cctggctggg caccggttcg - 12721 acgccgaggc cgagggcgtc gcagacgtgg cgctcgacct cggggtcgat gagcgcgtag - 12781 gtgcccacgg agccggagac ggtgccgacg gcgacggcct cgcgggccgc ggtgagccgg - 12841 gtgatggagc ggtcgacggc gaaggcgtgg acgccgagct tgtgtccgaa ggtggtgggt - 12901 tcggcgtgca cgccgtgggt gcggcccacc atgacggtgt cccagtgttc cagtgccttg - 12961 ccgaccagtg tcgcgcgcag gcggcgggcg gccgccagga gcaggtcggt ggcgcgggcc - 13021 agggtgtggc ccagggcggt gtcgacgagg tcgtagctgg tcatgccgag gtggacccag - 13081 cgtgcggagt cctcggggat gtcctcgcag tacgcggcga ggaaggacag cacctcgtgg - 13141 tcgcgttcct tctcgatctc ggcgacccgg gcggccagcg gcacccgcgc gcgccgcatg - 13201 tcctccaccg cggcggcggg tacccggccg agcccggcct gtgcctcgga ggcgaggatc - 13261 tcgaccttca cccaggtcgc gtagcgggac tggtccgcga acaggtcggc catctcgggc - 13321 agcgtgtagc gaggaatcat cggtcggcct tcgtcgaggg gggtggggtc ggggacggcc - 13381 gtgcgggcac gccggacgcc gccccggtga ggggggtgtt cggggtgccc gcgccgtcag - 
13441 tacacgccga agtactcacg ctgctcccag tcggtgacct gaccgggcgc gggcgcggtc - 13501 tgtgagctcc atgccgtgaa gcggcccagc tcgctctcct tgagcttggt catgcaggcc - 13561 gcgaggggcg cgccgagcag ctggtccgcg cggcccgtgc ggaaggcgtc cagggcctcg - 13621 gcgagggtct gcgggacggt ctgcggctgt gtctcggtgg gcgcctcgcc gcggggtgcg - 13681 gtctgcgggt cggcgggctg ggccgtcagg ccctccaggc cggcgaacag ctgggcggcg - 13741 atgttgaggt aggggttggc gcagggctcg cccacccggt tctcgatgtg ggcgccggct - 13801 ccgctgccga cgacccgcag catcgcggtg cggtcctcga agctccagcc gagccgggtg - 13861 ggggcgagcg cgtgttcggc ggccaggcgg cggtagccgt tgacggtggg cacggacagc - 13921 aggaacagtt cccgtgccca cgtcagcagg ccctccgcgt aggcctttcc gttcggtgac - 13981 agcccgcccg acaggccctc ggcgctgaac aggttgcggc cggtggccag gtccacgacg - 14041 gactggttca ggtgccagcc gctggggtcg gcggcgtcga gccgcggctg ggacatgaag - 14101 gaggcgtggt ggccgcggcg ggcgcagaac cgtttggtga cggtgcggaa cagcagcatc - 14161 gcatcagccg tgtcgagggc cgtcatcggg ctgaaggtgg tctccacctg gccggggccg - 14221 gactcgtgtt ccatcgagcg cagcggcagg ccgagctttc gcaggtggag tccgagcggg - 14281 ccggtgatcg gggcgacggt gtcgtaggcg gcgtcgaggt tgaactggta gccggcgttg - 14341 acggcggtca cgcgcggtgc ctggccctgc agcccgaagc cgttgccctg gttgccgggc - 14401 tcgtcgtcca ggcgccgggt gaggtaccac tcgacttcca ggcccagtac gggctggagg - 14461 ccgagtgcgg cgtagcggtt gacgacgcgg cgcagcacgg cccgggagga cagcgggtgg - 14521 ggggtgccgt cgcgcaggta ctcgtcgccg agcacccagg cggtgcgggg gccgcgttcg - 14581 ggcagcacct ggaaggtgac cgggtcgggc acgaggacga agttgcccgc gccggcgatc - 14641 tcgtcgacgc cgatgccgtg gtcgccgagg aagtcgacgg ccacggcgtg gccggtgtcg - 14701 aacaggaacg ggcccgggct gaagttcatg ccgttgcgca gcaccgagcg gaacgcgtcg - 14761 gcggtgaggg tcttggagcg ggccaggccg tgcgggtcgc cgaagacgag ccggacgaag - 14821 tcgacctcgt ccagggcggc ctcgacgcgt tcggcggcgg cgacgcgttc gtcgtcccac - 14881 agcccgtggt cggtgacgaa ggagggccgg ccgacgctgc cgtccggggc gggtgaggac - 14941 caggaccggg catacatggt ttcagaacgt cctttcgccg gtggtaccgg tggaggcggc - 15001 gaccggaggg gccgcgggcg gctggggcag cggcggcagc atcgcctcca ggcggcgggc - 
15061 caccgtcagt acgaggtcgt cggcgccgac cgggccgacg agctgcactc cggccggcag - 15121 tccggaggag gtcaggccgg cgggcaggga ggcggcgggc tggccggtca tgttgtacgg - 15181 gtacgaggcg ggtgcccagg ccagccacag caggtcgcgc acgtcggcgg cccagtcggg - 15241 gcctatggcg ccggcgtcga agggttcgac gggcacggtg gccatggcga gcaggtcgta - 15301 gtcgtccatg accgagcgca gggtggcgcg caggttctgg cggatctcct ccgcctggat - 15361 caccgcgacg ccgctgaggg tgcgtccgtg ccggacgacg tgcaggcggc cggggtcgat - 15421 gagttcctcg tcctcggggc gggtgccggc cgcctcggtg gcggcgagga tgtcgacgac - 15481 ggccgggtag aggttgtggc agcgcacctg gacctcctcg accaggtggc cctcgtcgag - 15541 gagtacgtcg cgggccgctt cggtgacgcg gcggatctcc gggtcggtgc cttcgtactc - 15601 gatccagccg atgcgcaggg agcgcatgtc gcgcggggag tccagggagc cgagtccgga - 15661 gtcggggtcg gtggggtgcg ggccggcgat gacctggccg agcagggcgg cgtcggcgac - 15721 ggttgcggcg atggggccct ggtgggcgag gcggtcggcg ccgttggggt agtagggcac - 15781 ccggccgaag gagggcttgt agccgacgac gccgcagaac gcggcgggga tgcggatcga - 15841 tccggagccg tcggtgccca gcgccccctc gcacagtccg gccgcgacgc tcgccgcggc - 15901 accgccgctg gagccgccgg cggagcggct cgggtcgtag gggttgcggg tgggcggggc - 15961 gagccggccc acggtggagg cgctccagcc gaactcggag gtggtggtct tgccgacgac - 16021 gatcgcgccg gccgctcgca gccgggccac ggccggggcg tcctgtgcgg gccgcccgtt - 16081 gggcagcagg gagcccctgg tggtgggcag gtcccgggtc tgcagcaggt ccttgacgga - 16141 gaccgtcacg cccagcagcg ggaggtccca ccatgcctcg cggccgcggt cgcggatcag - 16201 ttcgtccgcg cgggcggccg cccggatcgc ctcgtccccc gcgaccgcga cgtaggcgcc - 16261 caggtggtcc cgttcccgga cggcggccag cacgtcctgg acgtgctcga cgacggtgag - 16321 ctcccggcgg gacagcagtt ccttggtccg gcggatgccg cgggcggtca tcgctcactc - 16381 cttccgctcc tggtccttcc tcacgggggg tcaggagcgc tgctgacggt gcgggacggg - 16441 atggtgcgcc cggcgggacg ggggatgacc cgccgggcgg ccgtgggggg tcaggacgcg - 16501 cgggtggcgg ggtcggcgcc gccggtgacg gccgaccagt gccacgggga gtcgaacgcg - 16561 gtgacctcga tctgttcgcc cgccgcggcc agttcggcga ccaggcccgt ggcccgcgcg - 16621 gtgaacgcgg acacgcggtg cgcggcgagc aggtcctgct cgccgaacgg ggcgccgtcg - 
16681 cagcgcagca gccgcaggtc gacgaaaccg ttgaagcgcc gtccgtcgac cacgacggac - 16741 tgcggcgaac ggatggagaa ccgcacgttg ttgttgacgt gcccgtggtg gtgctggtcg - 16801 gagtagaagg cgacgtccgg gatggtgggc gggacgaagt ggtcgcggtc gaccacctcg - 16861 ggggccttgg gcaggttgcc ggcgatgaag tgccaggagt tgtactgcat gcgcgaggac - 16921 atcgcccagg ccgcgtcggc gagggcggcg gtggagtcgc cgaagtgccg ggcggcagag - 16981 gggtcgggca ccacgcagca gaagaagcgg gtgatctccc agtcgcagat ctccgcccag - 17041 cgttcctcgc gcagcgccgt gatcaggtcg ggcagcgagc gcatgccgcg gctcatcgcg - 17101 aagtcggcct cgaacgcctc ggtggcggcg gcggccgact cgtacaccag ggcctcgagc - 17161 ccggtggcga agtcgccgtg cggagcggcg agccaccccg gggccgcggc gagggcctcc - 17221 cccagctccg cgaggttgtc gccgcgcagc ggcagccggg acgtcagccg tgccgtcacc - 17281 gcgtcctcac gggcgcgggc caggtccgcg cagggaccgg cgaccttctc gatcttgtgc - 17341 atgagagcgc cgtggatctc gcggtacagc tgggcctcgc gggcgacctc gccgcggtgg - 17401 gagcgcagtg agacggccag ttcgtgcagg tcggcgaccg tcgcggacgc ggcgggcggc - 17461 acctggtcac ggcccagggc ggcgttgtag ccgactcgga tgcgctccag catgtgggcg - 17521 acgtggtcga cggtgagctg ggtgccgttg gcctcctcga cccggccggg gccggccgag - 17581 cggatcagca gggtgaggca caccaccagc tgcacgtcgt ggtcggacca cagttccagc - 17641 ggcaggtcct gaagactgct gagggcgcag tcgggatgcc cgggccacag cgtctttccg - 17701 gtgagggtgt tgtggtcgcg gaagttcgtg tactgcctgc cctgctggta gagcacgaag - 17761 ggcgcggtgc gcagcgccgc ctccttggcc tgctccagca gttcaccacg cccttcggcc - 17821 ccctgctcgg cgagccagcc gcggcagtcg gcgacggtcc gggcgacccg gtcctcggca - 17881 cgacgcagct gcgcccggta ggcgtcgagg gtggcccggg tccacggcac ccgccgcaca - 17941 ccgccgacca gtccgtcggc cttcagcggg gccgcggagg ggacgcgcag gacgatgcgg - 18001 ccgctggtgg cgagcgcgat ctcgccggag aagacggtct cctcggcgtc accggacgtg - 18061 ccgtcgccgg gagcagcggt cgcgggagcg gcgtcgccgc gagcggcggg ggcggcggtg - 18121 gcggtagcgc gccagctcag accgcacagg gccgccaggg cggcctcctc ggcggcgctg - 18181 agcgcgcgca gctgcacatc ggcggggacg tggccgtcca gggtgagcag cacctcgacg - 18241 aacgacctga ggtcctcggt ctgttcggcg cgccgccaga cccgcttgag cagtcccggg - 
18301 aatccggcgt cggcttcacg cacccggtcc ggcttgagcg tggcgccggc gaccaggccg - 18361 aggcgactgg ggcggcggct gatccgcttc cgggcgttgg cggcgcggcg ggattccccg - 18421 cgttcgggca aggcactcat cacgcaccct ttgcggtgag ctcgatgtgg ttccacatgg - 18481 cgtcgtcggt gggcgtccag tcctcgtcga cgtagatgca gtcgacgggg cactccagga - 18541 cgcacgccgg gcagcccgag cacagctcgg ggatgatcac tacgtccaga ccccggtcga - 18601 agatggcgcc gaactccgcg gggcagctgc gcaggcacgt gtcgcacgtg atgcactcgg - 18661 acttctcgat acgccgcggc ggcttcttcc agttgtcggg gcggtcacgc tgggcaattc - 18721 gctcgacccg cccagacagc gcggccgacg aagcgatctt cttcatgagc tcggaacccc - 18781 ttcgggtgag tcttcctggc cacaaccggg atgcatccga tggtccttcg gccttctcga - 18841 ccggccccgg agccgtgatg ggaatcgggt cgagcccgcg ctcccgatgg cttgtttcag - 18901 accgtcgtcc cggtgcgcgg ccgtggttcc tcgcgggcgg cggcggactc cagtccggcc - 18961 agtcggagca ggagttgttt cacgtcggtg gccgcgacgc ggtcgccgac agcgcggggg - 19021 atggagcaga tgaggagcgg accgtcgtcg tcgctcgcgg ggaggcggcc gtggctgcca - 19081 cgaacaggtg aggcgtccag ggggacgacc gccatgcggt agcgcatgcc gagcttcttg - 19141 cgggccaggg cggtggccgc cttgaccttc acgtaggggt cgagggggtc catgaacaac - 19201 tcgaccgggt cgtagccggg tttgcggtgg atctcgacca gctgcgcgaa gtcgggcgcg - 19261 cgggcgtcgt cgagccagta gtagtacgtg aaccaggcgt ccggttccgc gacggcgacg - 19321 agttcaccgg cgcggggatg gtcgaggtgg tgggccttct tgccctcgtc gtccaggagc - 19381 gtctcgattc cgggcagacc gtccagggcg gcgcgggtgg cgtccaggtc ctcggggcgg - 19441 cggacgtaga cgtgggcgat ctggtgatcg gcgaccgcga aggcgcggga ggccatgggg - 19501 tcgaggtatt ccatgccgtc ctgggtgtgg acctcgagca gaccggcgcg gcgcagggcg - 19561 cggttgatgt cgacgggccg gctgacgggg gtgatgccgt actcggagag ggcgacgacg - 19621 gtgcgtccct cggcgcgggc gtcgtccagg agcggggcca gggccgtgtc caggtcggtg - 19681 gccgccttgt gggagcgggg gtcgtcgggg ccgtagcgct ggaggtcgta gtcgaggtga - 19741 gggaggtagc acagggtgag gtcggggtga cgcgtatgca tgatgtggcg ggtggcgtcg - 19801 atgatccact ggctggagac caggtccgcg cccggtcccc agaagtggaa gagggggaag - 19861 gtgccgagtc tgtcggtgag ttcgtcgtgc agggcggcgg ggcgggtgta gcagtcgggt - 
19921 tccttgcggc cgtcggcgta gtagacgggg cggggggtga cggtgatgtc ggtgtcggcg - 19981 cccatggcgt accaccagca gatgttggcg acgctgtagc cggggtgggc gcggcgggcg - 20041 gcgtcccaga gtttgtcgcc ggtgaccagg ccgttgtgct ggcgccacag caggacgtcg - 20101 ccgagttcgc ggaagtacca gccgttgccg acgatgccgt gctcggacgg gtaggtcccg - 20161 gtgaggaagg tggactgggc ggcgcaggtg acggcgggca ggacggtgcc cagcggggcg - 20221 cgggagccgg actggccgag ccgtttgagg tggggcatgt ggtccaggag ccggggggtg - 20281 aggccgacga cgtccaggac cagcagcggc accggccccc cggaagatgt ggtgggggtc - 20341 atggcagctc cttcaggccg aggtcggtca gcaggtcacg ggcgagcatc agctccgcgg - 20401 cgatcccgtc ggtgagctgg gcccggcccc ggggccgcaa ctgggccggc aacgcctgcc - 20461 aggtgtaggt ctccacctcc agatgccggg tcaacggacg cgccccgccc accagccggg - 20521 acaaggccga cttcagcacc ggcagagtcg aggtgagcgg cgcggccgga tccgcgtgca - 20581 gggggacgtg gaagtgcgcc cgccagggcg ccgtgtcggg cagcggaccg ccgccggcca - 20641 gggcctcgtc caggtcatcc gtgccacgca gcccggccgt ggcggcggtg gtgcgggtct - 20701 ggtgcaggaa acgcggctcg gcgaaggccg ccagggcatc gcgtacttcg gggcgagaag - 20761 ggtgttcggc gtgcagggcg gcggagagct gcgacttgac gacggggacg cgggccgcgg - 20821 tcagggcgtc cagggcggtg tgcgggtcct cgaaggaggt ggcgaggtga caggtgtcga - 20881 cacagatacc gatgcggtcg tgtccgatgg cgcccagcgg ggcgatcgca tcatgtgtgg - 20941 tctccacgac gcagccgggt tcgggttcca ggccgatgcg gatggagcgg ccggtcagct - 21001 cgtggagggc gtccagacgc tcgccgagcg tggccagcgc cgcgcgcgcc ttgtcggcgc - 21061 gggtctcgtc ccaggcggtg cgccaggcca gcggcagggt ggagatgctg ccgtccgtga - 21121 cgtcgtcggg caagagtccg gcgaggacac gggccaggga cgtggtgtgc tccagacgct - 21181 ccgggtcggc ccagtccggc ttgtagacgc ggtacttgac ctcttcggcg ccgaagccct - 21241 cgtaagggaa gccgttgagg gtgacgacct ccagtccccg ccggtcgagt tcggtgcgca - 21301 gtccgcgcag cgcggagggg tcggtggcca gggcgtgggc ggcgtccttg gccagccaca - 21361 gcccgatgcc gagacggtcg cggcccaggc ggcggcggac cggctcgcag tggtcgcgga - 21421 gctgggcgag gaccccgtcg agggtttcgg cgggatggac gttggtgcag taggcgaggt - 21481 ggacggtgga gccgtccggg tgccggaacc gcaccgttca cgctcccgtc ggcagcggct - 
21541 cggcggccgg ggcgccgcgc aggacggagt tgccctcgtg ggtgggcgcg gtggccgtga - 21601 cgtcgaggtc gaggcgtccg ctgaggccgt agaaggcgac ggggttgcgc cacagcaccc - 21661 ggtccacgtc gtcctcgccg aaaccctcct cgagcatcag gtcaccgacc ttgcgggtct - 21721 tgagcgggtc gctcctgccc cagtccgcgg ccgagttcac cagcaccttc tccgggccgt - 21781 actcacgcag cagagcgacc atgcgggcct cgtccatctt ggtgtccgga tagacggaga - 21841 accccagcca ggcaccgctg tccttggcct ccttgaccgt ggtctcgttg aggtggtcga - 21901 ccagcacccg gtccgtgggc agcgcggact cgcgcaccac gtccagggtg cggcgcagcc - 21961 cggcgagctt gtcccggtgc ggggtgtgca ccagcgccgg caggccgtgg tcggcggcga - 22021 gctgcaactg ggcggccagc gcggtgtcct cggccggggt catcgagtcg tagccgatct - 22081 cccccaccgc caccacccgg tccttgacca gatagcgcgg cagctcggcc agcaccggag - 22141 tgcagcgcgg atcgttcgcc tccttcgggt tcaacgcgat cgtgcagtga tgggcgatcc - 22201 cgtactgcgc cgcacggaac ggctcccagc ccagcaacgc gtcgaagtag tcacagaagg - 22261 aggccggaga agtgcggggc tgccccagcc agaaggcggg ctcgaccacg gcacggacac - 22321 ccgcggcatg catggcctcg tagtcgtcgg tggtccggga cgtcatgtgg atgtgggggt - 22381 cgaagatgcg caagtcactg ctcctgggtc agggcgagca cgcggtcgag gtcggccggg - 22441 atgtctcggt gggcggcggt gcgctcggcg gcgtaggcgc gcagcattct ggccagttcc - 22501 gcgtccgcgc gggcgcgggc cgccaggttt gccacggtgg ccacgggcac gccggtgaac - 22561 aggcacttga gtacggcgtg ccgccattgg tgggcgtcca ggtgccgggc cgcgtagggg - 22621 ccgagggcgg cggcgagcag ggtggtgtcg ttggcgcgca gggcgtcttc gaccagcggc - 22681 agagcgtggg cgggttcggt gtcgagtccg tccagggcga gcaggaccgc acgccgttcg - 22741 gcggccgtcc cccggtggta cagcagggtc acggtctccg cgtcggggcg tgccgccgcc - 22801 agcagcagta cgcgggcggc gtcggcgtgt tcggtgccgc agcggcggcc cgcctcggcg - 22861 aagcgcagtt cccagtcggt gtcccgggcg gttgccgagg cgcgggcggc ggtgagccag - 22921 cggcgtgcgt cggtgccgag gccggcgaac tcgccgggca ggtccgcgtc cggcggggtg - 22981 tgtacgacgg tcatctcgtc cctccgttgc gcaggaaccg catcgactgt gcggccagtt - 23041 cgggtccggc gtgggagtgc cggggcagtt cgacgacggt caggccctgg tagccggtgg - 23101 cggcgagggc gtcgagcacc ggcgggaagt cgatctcgcc gtccccgaag gggaggtgtt - 
23161 cgtggacgcc gcggcgcatg tcctcgatct gcacgtgccg cagccagggc gcggcggccc - 23221 gtacgcagtc ggcgggcggc aggggctcca gacactggca gtgcccgatg tcgagggtca - 23281 gtcccagtgg ttcggggtcg cccagttcgg tgcgcaggcg gtggaagtcg gtcagtgtgg - 23341 ccagcaggtg gccgggctcg ggttcgaccg ccagggggac gccggtgtcc tccgcggcgt - 23401 ccaggacggg gccgagggcg tcggccaggc gtttccaggc ggtgtcctgg tccaggcccg - 23461 cgggccgtgg gccgctgaag cagtgcacgg cgtgcgcgcc gaggtcggcg gcgacgcgta - 23521 ccgagcggat cagcaggcgt acgcgtgccc agcgggcgtc cgggtcgtcg tcgagcaggc - 23581 tgggtccgtg cttgcggcgt gggtcgagga cgtagcgggc gccggtctcg acggtgaccg - 23641 cgaggccgag gcggtgcagt tgccgggcga cgtggcgggt gcgggccgcg aggtcggggg - 23701 cgagcgggtc gaggtgcatg tggtcgaggg tgagtccgac gccgtcgtag ccgaggtcgg - 23761 ccagcaggcg cagggcgtcc tccaggcgca ggtcggtcag cccgttggtg ccgtagccga - 23821 ggcgcagcgg gctcatgtgg tgctcacttt ccgggccagg tgcgcggcga ggggggccag - 23881 ggcggcggtg aggacgccgg tgccgggtgc gccggcccgg gccatcagtc cgctctgcag - 23941 ggcgatcgtg gcgcggacgc cggcgccgac ggcccgctgt gtcagttccg gggaggggtt - 24001 gagcgcggcg tgggccaggg ggcgggcgaa ggtggcggcg taggaagcgg ccagggcggc - 24061 gcgtacggcg cgggcggcct tgtcggccgg tggtgtcgcg ggagtaggtg cgccggtgct - 24121 ggcgtcgggc gcggggtggg cggtggggcg gccggcgagg acggtggtga gggcgcccgc - 24181 ggcggcgagg gccgtgaggg gtgcggtgct ggagccgccc tcggtctcgc ggcgggagac - 24241 gagggagacg gccagggtgt ggctgccgag gaacgccgcc gggacgatcg cccgtcgcac - 24301 ggcgcccggg ccggcggccg cgcccagcag caggtccagg gagcgggcgg cggccatcgc - 24361 cgcgggtccc gccggggtgt gtttcaggcc caggtcgtac gcccatacgg tggcggccag - 24421 ggggccggcg accgcgaggg cccgtcgtcc cgcgcatgcg gcgagggcca ggcccgcggc - 24481 ggagagcagg cccgcggcgg cgagggcggc gccgggccgg acgcggccgg acggcagggg - 24541 gcggtggggc cgggcggtgg cgtcctcctc gcggtccgcc cagtcgttga gtgccatgcc - 24601 cgcctcgtac aggcacagcg aggcgccggc cgcgagggcg gtgcgtccgg tgggccgtgt - 24661 gccggcggcc gcggtgccgg cgaggacgtc accggggacg gtgaacgcgg cgggggcgcg - 24721 cagcagttcg gcccaggcgt ggaggtgccc gtcgcgggcc gggccgtggg cgggccgctg - 
24781 agcgctcacc tggttcctcc gagccggccg gcgagggtga gcagtcgggt gtactgctcg - 24841 gccagggcgg agccttcggc gtcggggtcc ttgaagtaga agccgagttc gcccagcggg - 24901 ccggacaggc cccgctcgtg ggcgcgggcg agcaggcggg ccaggtcgag gacgagcggt - 24961 gcggcgaggg cggagtcgca gccctgccag atggtctgca ggaccatgcg ggtgccgagg - 25021 aagccgtcga aggcgacgtg gtcccaggcg gtcttccagt ccccgagggc ggggacgtcg - 25081 tcgatgtgca cctcgccttc gacccgggtg ccgagggtgt cggtgaggac gcgttccttg - 25141 ccggcgttct tcgccgcggc ggcggcgggg tcggcgaggg cggcgccgtc gccgccgccc - 25201 agcaggttcg tgccggacca ggcccgtacc gccagtgccc gctgggcgaa catcggcccc - 25261 agcaccgaac gcagcagggt ctgcccggtc ttgccgtcgc ggcccgcgta cggcaggccc - 25321 gaggcgcggg ccgcgcccgc cagctggggg tggctcagcc cggtcgacgg cgtgaagttg - 25381 acgtaggggc agcccgcccg cagggccgcc gcggcgtaca gggagctggc cggccacgcg - 25441 ccgtgtgcgg ggtccggttc ggtggaggcg acgttgacga cgaccgtgcg ggcgacgccg - 25501 gtggtgcggg cgaaggtgcg caggtcggtg gcgaagtcgg ctatcagctc ttcggtggcg - 25561 cgacggtcgc cgggtaccgg tcctccgggg cggatgtgtt cgtccgcggc ggccagttcc - 25621 ccctggacgg cggtcggcag ccagggcggc agtactcctt gggcggccag ttcctcggcg - 25681 cgtttgggca ggggggtggt cgccgtgtcg tggccgccga agacgaggga ggccagggcc - 25741 ggcaggccgc agtcggcgaa ggggggcgtc tcggtgacca tgccggtggg tggcagcagt - 25801 cctgccgcca gcgccgcgca gcccgacacc gccgtcgtgg cgaccgaacc gcgggctccg - 25861 acgagccaca cgccggtccg ggtctcgtcg gccgaggtca tggcatcttg cgtcacgggg - 25921 cagcctccct gagcgtcgaa tgtgttgtcc ggcaagtgga tgcccggcca ggatgccgag - 25981 ccgggctgtg cgggggcgtc gccctccgtc ggctgtcgag cggccgccga gcggattccc - 26041 atcggccgcg ggcgtccggc gccgggcaca gcgaggcccc gccggtcgca ggggtgcggg - 26101 accggcgggg cctggcaggg gggtgtgcgc ggcgcacccc tctgcggggg gtcagcggtt - 26161 gacgcggacc agctggccgt tggtgccgag cgtgttgttg gtgacgtaca ccttgccgca - 26221 ggggtcgacg gcgacgccgg tgggctgctt gagctggtcg ccggtgggga tttcggtgac - 26281 cgcgccgctg tcggcgtcga tctcgaacag ggcgccgggc tgcggcgggc cggccagcgc - 26341 ggcggcgctg taggacaggg cgatcaggtc gccgtcccgg tccaggtcca ggtcgatgag - 
26401 gttggtcatc ccggtggcga ggatctcggg ctgctggccc ggggcgatct tccagacgcg - 26461 ggaggcgccg acccggccgc cgctcatgtc ggcgacgtac acggtgccgt cggcggcctt - 26521 ggcgatgccg gtgggtacgg tctcggcggc gccggtgggc agttcgttct tgggcaggag - 26581 gtactcggtg gcggtggtgc cgtcggcgtt gccgcgtacg acggtgttgg cgcccgcgtc - 26641 ggtggccagg tagccgctgc cgctgcgcgt gagccgccac gggttggcgt gcacgtcgcc - 26701 gccgtcgggg ttcagtcgcg tctcgtggtc ggtgaggtcg gcgagcacct tgtggtcgcg - 26761 ggtgcggaag actgtgccca gggtctgggc gccctcgccc agcgcggcgc gcgactcggt - 26821 ggtgccgccg aggccgctga cgacgacgta gccgccgaac cggtcgggca cgacgtcgct - 26881 ggggccgttg gcggagatcg gggcgcccgg ggcgacgccc ttggccgtgg aggcgaggcc - 26941 ggtggcgacg cggccctgga agctgccctt gaccttgtag acggagccgg tggtgcccac - 27001 gcacgtctgg tcgaccgggc agtcggcgag tccggcgccg gcctcggcga ccagcacgcc - 27061 gccgtcgccc agcgcggtga cgccgcgcgg gttgttcagc tgggaggcca cgacggtcac - 27121 ggtcgcctcg gtacgggtgt gggtgtgggt gtgaccgtgg cggtgggcct ggggctgggc - 27181 ctggacgggg ccggcggtca gcgggacggc gacggcgccg gccgcgcccg ccgccagaag - 27241 tatcttcgtc caggagttac gcgagttcgc catttctctc ctcggtttcc aatgctcccc - 27301 ccttttcccg gagagcggat gcgaaatcag cgccacccta gggcagtcgc cggttttatt - 27361 gcgtcaaatt ttccgcagga aaaagtgggt gcacccgtga accagcggta ttcgagtctc - 27421 cctccaggag gcgtcgacct ttttccatat cgttgtagtc ccggtccctt ccggcggttg - 27481 ggacagactt ttgcgctcct gccatggagg aaactcatgc ccgaattgcc gcctccgcac - 27541 gtcgtacggg aagcggagaa agcacgagcg gatctgcagc ggcagagccg ggaactcgcg - 27601 cctccgccgt tcgctctgct ggaattgatc atgggtgtca tggtcacgcg tgcggtgcac - 27661 gtcgccgccg aactgaaggt ggccgaggcg ctcgccgagg gtccgctgtc cgccgacgag - 27721 ctcgccgggc gggtcggtgc ggacgcggac gcgctcggcc gggtgctgcg cctgctggcg - 27781 agcaacggtg tgttcgccac gcgcccggac ggtgccttcg agctgacgcc gatggcggac - 27841 gcgctgcgcg ccgaccatcc gatgtcgatg cggggcatcg cgctgctgat gggccacccg - 27901 atccactggg aggactggag cggcttcccg gagacggtgg tcaccggcga gccggcgctg - 27961 ccgaagctgc gcggcatgca cgccttcgag ttcctgacga agaacgcgga gtacggccag - 
28021 gtgttcttcc agggcatggg cagcatgtcc gcctcggaga cggagccgat cctggcggcg - 28081 tacgacttct cgcagttcgg gacggtggtg gacttctgcg gcggccaggg cgcgttgctc - 28141 gcgggcatcc tgggtgcggc gcccgggtgc gagggcgttc tgttcgaccc gcgggtcgag - 28201 gagaacgggg ctgcggagtt cctggccgcg cagggtgtgg ccgaccggac gaagcgggtg - 28261 gccggcgacc tgttcgacgt gccgccgggc ggcgccgacg cctacgtcct caagcacatc - 28321 gtgcacgact ggcccgagga gcaggccctg cggatcctgc gcaacgtgcg ggcggcgatc - 28381 aagccgggcg gcaagctgct gatcgccgag atggtgatac cggagcaggg tgaccagccg - 28441 cactccggga agctggtcga cctgtggctg atgctcctgg tcggtggccg tgagcgtact - 28501 cccggccagt acgccgatct cctggcccgt gccgggttcc gtctggagcg ggtcgtggag - 28561 acggcggcgg cgatctccct cgtggaggcc gtccccgtgt gaccaccgtg gagggagggc - 28621 cccgtcgcgt gatgagggaa cgcggcgggg ccctccggtg tgtgcggccg ggcagcggcg - 28681 gccgggtggg cgggggcgcc ggcgggcagg cccgcgggga gcgccgggcg gcggggggtg - 28741 ccgggcggcg gacgaaggcc cccggcgtgc gcgcacgccg ggggccgcta gagggggtgc - 28801 gggtcagcgg ggcgggccga accaccgttc cagggccgtt tccaggccct gcgcgcaggt - 28861 gcccgtccag gcgacgtagc cgtcggggcg gatcagcacg gcggtggcgc cggcgagggc - 28921 gtccgggccg tcggtgggct tggcgacggc ggtgaccacg tccacccggt ccgcgtggcc - 28981 ggccgcggtc gcgcgtaccg tctcgtcgtc ggcgaggtcg agcagcacgc cgtgcccggc - 29041 gtgcaggagg cgggcgatgc gggtttcgcc gtccgcgccg acgagcagcc gcggcggcat - 29101 ccggcgtccc agcagcgggt gggtggggcc ggtcgcggtg tcggcgaggt cgtagcggat - 29161 gtccaggtgg ctgacgatgc cggccaggtg gcgtttgacg tcgtcgtagc ggaccagttc - 29221 ggccatcagc tcgcgcagcg ggtcggactc ggcgccgccg aggaagacga tgccctgggc - 29281 gcgggtgttc atcagcagcc gggcgccgac cgggtggcgt tcggcgtggt aggtgtccag - 29341 cagttcccgg ggggcgtcgc cgcggatcac cgaggccagc ttccagccga ggttggcggc - 29401 gtcctgcacg ccggtgctca ggccctggcc gccggccggc aggtggatgt gggcggcgtc - 29461 gcccgccagg aagacgcggc cccgccggta ctcggaggcc tgccgggtgg cgttggtgaa - 29521 ggagctgacc cagctcgcgc cgccgtggct gatgtcctcg ccggtgatgt cctgccaggc - 29581 ggcggcgacc tcctcgaagg tgacggtccg ctcacggtcg tgcgcggggc ggccgtcggg - 
29641 gcagacgatg atgcgccaca cgccctggga gagcggtgcc gccatcacca tgccgttgtt - 29701 caggcgctct ccgaggaagc gcggggtcag ctccacaccg gtgatgtccg ccaggtacat - 29761 gccctgggtg gcgtcggttc cgaggaagtc gaacccggcc gccctgcgga cccggctgga - 29821 gccgccgtcg cagcccgcca ggtaggaggc gcgcagggtg cgttcctcgc cctgcggggt - 29881 gcgtacggtg atctcgacgc cgtcgccgtc caggaagccg tcggtgaggg agacgaactc - 29941 ccagccgcgg cggatgtccg cgccgagttc gcccgcccag ccctccagga ccgcctcggt - 30001 gtcgccctgg gggatgcccc gggccccgaa gtgggcgtcc tcgaggacgg tgaagtcgaa - 30061 ctgggcgccg ccgaagtgcc ctacggggct ggtggccagg gtctctccct ggccgaaccg - 30121 gggcagcagc ccgcgttcgt cgaacgtctc catggcgcgg gcggtgaagc ccaggccgcg - 30181 ggactgcccg gtgggggcgg ccagcttctc gatgacgacg acacgggccc cgcccaggcg - 30241 cagttcgccc gcgagcatca gtccggtcgg gccggcaccg acgacgatca cgtcggtgtc - 30301 cgccgctgtc ccttccatgg gtggtccttc ctggcagtgg ggtcggttcg gggcccggcg - 30361 gtggggggcg gcgcgtcgtg cggtgccggt cgtccccgcc gggccggggc gcacggcagg - 30421 tcagcgggga ggtccgaacc agcgggtgag tgcctcggcg aggccgtcgg tgcccgggcc - 30481 ggcccaggcc acgtggccgt cggggcggac caggacacgg tcggtgccct gcagtgaact - 30541 gcccggcgag ggctgggcgt ccagtgcggt gacgcggtcc gcccagccgt cgaggactgc - 30601 cggcggccgg ccgggccgtc cggtcaggtc cagcaggacg ccgccgcccg agcgcaccag - 30661 ctgggtggtg gtgagcaggc gtcggcgtgc ccgcacctcg gtgcacggca gccgggcccc - 30721 gagcagcggg tgggcggggc cgccgacgtc gtagcgcacg tccaggccgc tgatcatgcc - 30781 ggccaggcga cggcgtacgt cctcctgccc gatcaactcc gtcagcaggt cgcgcagcgg - 30841 ctcgacctcc ggtccgccga gcagcagcag cgactgggcg cggatgttgg ccaggacctg - 30901 ccggccgacc tcgtgccgtt cgtcgtggta gctgtcgagg agggtctgcg gtgccttgcc - 30961 gcgtaccacc agggccagtt tccagcccag gttgaaggcg tcctgcatgc cgaggttgag - 31021 ggcctggccg ccgaccggca tctgccggtg ggcggcgtcg cccgcgaaga ggacgcggcc - 31081 gtgccggtag cgagtcagct ggcgggaggc gtcgccgaag gcgttggccc acaggggggt - 31141 gccgccgctg atgtcctcgc cggtgacccg cttccacacc gcggtgatct cctcgaagga - 31201 gacgtcgccg tgcgggcggg cccgcgcggc ggagccgaac tcgtggacca tcacccgggt - 
31261 caccccgtcg gggcggcggg cggcgatcgc caggccgtgc tccaggcgtt cgaagcgccg - 31321 gcccgggatg tcgatgccgg cgacgtcggc gcgcagcagt tcccgcgtcg cgtccctgcc - 31381 ggggaagtcg gcgccgatca ggcggcgtac ggtgctctcc tcgccgtcgc aggcgaccag - 31441 gtagcggcag cgcagccgca gcgtccgtcc gtccgggccg gcggcttcgg cctcgaccag - 31501 gtcgccgctg tcgtcgagcg cggtcagttc gtgcttgcac tgcagttcgg cgcccagtga - 31561 cagcgcccac tcccccagga tcacctcggt cctggtctgc ggcaccttcc actggccggg - 31621 gtgggaggag ggcagtgtca gatccagcgg gatgcccccg aagtggccgc gcggctcgtt - 31681 cggcgggtcg ccgaactcgg gcagcaggct ccggctgtcg aggatctcca tcgtgcgggc - 31741 gtgcagggtg gaggcccggg actcggtgct gggagcgcgt cgcttctcca cgaccaccac - 31801 gccgacgccg ccgtgggcca gttccccggc gagcatcatc ccgacggggc cggctccgac - 31861 gacgacgacg tcggtggtca gggcgtccgc tgccacggtt cagcccttct tctgctcggc - 31921 gtaggccttg gcgtgggcga gggtggcgcg gctgttggtg gacagggccg tgtggacgta - 31981 ggcgcgggcg tcggcgacgg tggcgtcctg gccgaggatg cgggcgatgt tggcggtgtt - 32041 gagggtgacg gtgtgctggg aggaggcggt ggtcgcctcg tcgccctcgg tgaaggtcca - 32101 ttcgccggtg tgcagggtca tcagcgcggg cagggtgacc tgcttgtagg cgatcttgtg - 32161 gtgggggaag acgacccggt aggacttggt ggtgtgcacc gagccgtcct tggcgcgggt - 32221 gtccatctcc agctcctgca ggccgggggt gtcctcgctc aggcgcacca cggcgacgtg - 32281 cgggagccgt tcggcccaca gctgggcctc gttgatgaag tcgaagacgt ccttggcggc - 32341 gccgtcgatg tgcacggtgt cggtgaagga gaacgtcagc tcctcggtgg cggcggcgtg - 32401 cgcggcctcg acgttgacct tcagggcggc cagctcggag gtgctgttct tgtccacggc - 32461 ctgctcgatc cacagcaggt cgtgcgggtc gtcgccgacg gcgctgtagt cgtgcaggag - 32521 ccgtacccgc gaccggtcgt cggcgagcgg ctcgatgatc caggtgccgc ccatgtgctt - 32581 gaccggggcg gcggggatct cctggcggaa ggtgatggtc aggttctcgc ggtcgagcgt - 32641 gcggcgcgag gtccactcct tggcctggcc gttggcggtc gcccagatgt ggatgcgttc - 32701 gtggtcgccg tcggcctcgg tgcggtcgac gtggatggtg ggcgggaaga tgcgcggcca - 32761 gttggtcacg tccgcgagca gctggtagac ggcgtcggcc ggtgcgccga tcgtgatctc - 32821 gtgctcgacc tcacgtgtgg tcatgaggct cactcctcgg gaaggggtcg ggtgccgggt - 
32881 gcgtcagaag ttgccgaggc cgccgcagac gttgagggcc tgcgaggtga tggacgcggc - 32941 ggtgtcggag gccaggtagc cgacgaggcc ggcgacctcc tcgggggtgg agtagcggcc - 33001 gagggggatc ttcgcctgga acttctcgag gatggcgtcc tcggaggtgt cgtaggcggc - 33061 ggcgtatccc tggcgcacgc gctgggccat cggggtctcg acgtagccgg ggcagaccgc - 33121 gttgacggtg atgccggtgg gggccagctc gttgcccagt gccttggtga agccgacgac - 33181 gccgtgcttg gacgccgagt acggggcgcc caggacgacg ccctgcttgc ccgcggtgga - 33241 ggcgacgttg atgatccggc cgcggtcctt ggcgcgcagg ccgccgatgg tcagggcggc - 33301 gcgggtgacg cggaagacgc tgttgaggtt ggtgtcgatc acgtcgtccc acagctcgtc - 33361 cgcgatgtcg gcggtggggc cgccgccgga gcggccggcg ttgttgacga cgacgtcgac - 33421 gctgccgaag cggtcgacgg cggcctggat ccaggcgttg acggactcgg tgtcgcggac - 33481 gtcgacgacc gtgccgtccg cgtcgatgcc ctcgccctgg agttccttga cggtggcggc - 33541 gacgttctcg gcgttgcggg cgccgatgaa gacttggtgg ccctgccggc cgaggagccg - 33601 ggcggaggcc aggccgatgc cgctggtggc gccggtgacg acggcgacgc gctgggtggt - 33661 ggtgtcggtc atggtggggc tccttcaggc ggccttggcg ggcgcgagct gcgcgttgac - 33721 gacctcgatg aagctgcgcg gcgtgttggc ctcgccgacg gcctcctcgt ccagggagat - 33781 gccgtactcg cgctcgatga ggctgccggc ctccagcagg gcgagggact cgtagccgat - 33841 cacctcgaac tcggtgtcga ggatgtcgcc gtccaggtcc acgccctcgg cgacgcccgc - 33901 ggcctcccgc agggtgcgct tgaggtcgtc gagggtgaag gacttgctgg ccatggtggg - 33961 tcctttcgtc agtacgtggt ggcggttgcg gtgcgtcggt cgggtgcggt gcgcgggggt - 34021 cctcaggcgg cgcgcacgac catggcggag ttgaagccgc cggctccccg ggccaggacc - 34081 agggcggtgc gcagctcggc cgggcggggt tcgcccagga ccaggtcgag ggggtagtcg - 34141 gcgcacgggt cgatgtgcac ggtgggcggg atgacgccgt cgcgcagggc gaggaacgcg - 34201 gctgccaggt ccaggggcgc gccgccggag tacaggcgcc cggtcatggt cttgggcacc - 34261 gtcaccggca cgccccggtc gccgaagacc gtgctgacgg cgcgggcctc ggcgaggtcg - 34321 ccggccgggt cgccggcgcc gtcggcgaag accacgtcga tgtcggcggc gttcacgtcg - 34381 gcgtcggcca gtgccgtctc gatggccttg gccaggttgg gttcgcgtcc gctgccgggc - 34441 cgggggtcga tggtggctcc gtagccggcg atctcgccgt aggggcggac gccgcgggcg - 
34501 cgtgcggcat cggcgtcctc ggcgatgagg atcgcgccgc cctctccggg gacgtagccg - 34561 ttcgcgtcgc ggtcgaaggg caggtaggcg tggtcgggtt cgtcgctggt ggtgagtcgg - 34621 ccgcaggcca gctgggccac ccagccccag gggcagatgg aggcgtcgac gccgccggtg - 34681 acgatcagcg gggtgccccg gcggatctgc cggcgggcct gcgcgacggc gtccaggccg - 34741 cccgcgcctt cgctgacgac gacgccggag gggcccttca tgccgttgcg gatggagatc - 34801 tggccgctgt tgacggcgta gaaccaggcg aaggactggt aggcggagac gtactggctg - 34861 ccctggctcc acagggcctg cagttcgccc tggccgaact cgaagccgcc cgcggcggag - 34921 gccgtgatga cgcccatgtc gaactcgggc aggtgcgcgg ggtcggcgcc ggcgtccgcg - 34981 agtgcccagt cggcggccac cagggccagc cgggtgacgc ggtcggtctg cggcagcagc - 35041 cggctgggca gcagttcctc ggcgtcgaag tcctcgatct gcccggccag acgggccggg - 35101 tagccggtgg ggtcgaagcg ggtgatgcgg ccgatgccgt gcttgccgcc cagggtggcc - 35161 gcccagtagt ccttcacccc catgccgttg ggtgagacga cgcccaggcc ggtcaccacc - 35221 acggaggcgg tcatacgagg ctcctttcgg gggtggcgag caccatggcg ctctggaagc - 35281 cgccgaatcc gctgccgacc gtgaggaccg cgtcgatcag ctggtcgcgg gcgaccaggg - 35341 gcacgtagtc gaggtcgcac tcggggtcgg gggtgtgcag gttggcggtg ggcgggacga - 35401 cgtcgtactc catggcgagt gccgaggcgg cgatctcgat ggagccgatc gcgccgagcg - 35461 agtgcccgac catcgacttg atggagctga ccggggtgcg gtaggcgtgg tcgccgaggc - 35521 tgcgcttgaa cgcggccgtc tcgtgccggt cgttctgctt ggtgcccgag ccgtgggcgt - 35581 tgatgtagtc gatggactgc gggttcagcc gggcctcgcc cagggccagg tcgatcgcct - 35641 cggccatctc cacgccgtcg gggcgcaggc ccgtcatgtg gtaggcgttg gagcgggtgg - 35701 cgtagccggc gatctcggcg tagatgtggg cgccgcgctt gcgggcgctg tcgagttcct - 35761 ccaggacgaa gaaggcggtt ccctcgccga ggacgaatcc gttgcgggtc ttgtcgaacg - 35821 gccgggaggc gcactcgggt tcgtcgtggc gcggggtggt cgccttgatc gcgtcgaagc - 35881 aggccatggt gatcggtgag atcggcgcgt cggaggagcc ggcgatcacg acgtcggccg - 35941 atccctcgcg gaccagttcg acggcgtagc cgacggagtc gatgccggag gtgcagccgg - 36001 tggagaccac ggtgctgggg ccttcggccc ccaccgccca ggcgacctcg gcggcgaagg - 36061 agctgggcac catgtagtcg tacaggtgcg ggaccgcgta ggtgtggtcg accgtgtcca - 
36121 gccgtccccc gtcgctgacc acccggtact cctggtccag gcccatcgtg gcgccgacgg - 36181 cgctgccgac ggtgacgccc acgcggtgcg ggtccaggga ggggatgtcg aggccgctgt - 36241 cggcgacggc gccgcgcgag gcgacgacgg cgaactgcgc ggcccggtcc aggcggcgga - 36301 cctcctgcgg ggtcaggccg tgctcgtagg ggtcgaagtc cgcttcggcg gccacccggg - 36361 agcggaaggg ggcggggtcg aagaaggtga tgccccgtgt cgcggtacgg ccgttgctca - 36421 gcaggttcca gaagttctcc ctgccgacac cgccgggggc gatcacctcg atcccggtga - 36481 tcacaacgcg tcgcccgctc aacgggaggc ctcccagctg tagaagcgcg tggccatcgc - 36541 gtcggccggc gagcgccagg tcgtggggtc gtaggcctcg atgaagggct tgaggtcctc - 36601 gctgatccgc acgaagcgcg ggtcggcctt ggcggcctcg atcagttcac cgccgttgtc - 36661 ctcgtcgaag tcctggaggt ggaagtacag gccccggtag gagaagagct ggcggcgccg - 36721 tgtgcccatg cggtgcggca tctcggtggc gtcgaagtcg gcgaacaact gggccacgtc - 36781 gttgctcgag gtggccgcca tccgggcgac gatcagcgtg ctgtgcatag ggattagctc - 36841 ctcggcggtt gcgcggaagg gttctcgaag cgggcggacc ggcccggccc ggcggcccgg - 36901 ggggctgcgg cgccaccgcc ttcgacggtg cggcctggcg gtagcgcccc gcacggggcc - 36961 tgcctgagtc ccgcctgagc cgaagcggcg ggtgcacacg agcacgcctt cgggcctgcg - 37021 cccccgggtg ccggggacga ggtccgaagg cgtgcgggtc ccgtgcgccg tccggcgcgc - 37081 cgggctcact cgccggcaga gcgcgtgtgc acgacccggt aggtgttcag gtagggctcg - 37141 ccggtgacga cggcgcggac gcgggccacg gcggccttgc gggcgtcggc ctgctcctcg - 37201 ggggcctggt cgcggtagac ctcgaaggcc tccttgctgt cccactggga gtaggagatg - 37261 acgaaggatc cctccaggcc gcgggcgcgc aggcccttga gcacgacgtg ggcgcggaag - 37321 ccgggcacgt cggcgaggaa ggcctggccg gggccgaggg cgtcgacggc ctcgtcctgc - 37381 ccctcggggg tgaccgggaa gagggtgaag acggtgtagt cgtcgcggtc cgggccgatc - 37441 tcgatcttgc cgccgagggc gtccgaggtc agcgtgtggg cgacctcgtt ctgcatcagc - 37501 cggatcgagg tggtgatctc gccgaagacc gggagcgtgc ggtgcttgaa ctcctcgccc - 37561 gcgtagcgct tctcgaggtc ctcgccgctg cgccactgga tgaagttgag ggtgccgtag - 37621 ccgtcgacgc ccgagtggac ggtggaggac atccagccct cgtacgcggc cgcgttgacg - 37681 atcttcgtca tctcctcgat cagcttggcc tgcttctcgg gagtgtccgt ggtgaacagg - 
37741 ttcaggacgg tgaggtgctt gtcctcggcg gagatgatgg gcatgggtcc ttcgctttcc - 37801 ttggtgggtg cggtgggtgt cgctgcgcgg cccgcgacgg tcaggcggtg gggccgaacc - 37861 agcggccgag ggcggcggtg agaccgtccg gcccggcgcc gaggccggcg acccaggcga - 37921 cgtagccgtc ggggcggacg aggatgccgt ccacgggggc ctcgcagccg tcgaactcgg - 37981 ccgcgacgag gtcgacccgg tcggcccagc cggcggccgc ggtgcgcagg ccgtggtcgc - 38041 ccccgagttc caggagcacg gggcgtgcgg tgcgcagcag cgcgtagaac ggggtcttct - 38101 caccgtcgac gaccagttcc cggtccggca ggcgccggcc gagcaggggg tggtcgcctt - 38161 cgccgacgtc gtgccggatg tccagtccgg tgaccatgcc ggccaggtgg cgctggacgg - 38221 attcgtgggc gcccatcagc tcggcgagca cctcgcgcat cggcgtgatc tcgtcgccgc - 38281 cgaggtagag gatgcgctgg gcgagggtgt tggtcaggat gcgggccccg acggggtggc - 38341 gctcggcgtg gtaggtgtcg agcagccctt cgggcgcctg gcccttgatg tcgagggcga - 38401 gcttccagcc gaggttcacg gcgtcctgca cgcccgcgct catgccctgc gcgccgatcg - 38461 gcaggtggat gtgcgcggcg tcgccggcca ggaagacgcg gccgtggcgg taccggtcgg - 38521 cctggcggct gacgtccgtg gtggagctga cccacagcgg ggtggcgccg ctgacgtcct - 38581 cgccggtcag gcgctgccag gtctgggcga cctcgtcgaa ggtgatcggg tccgggctgg - 38641 tgcgcagcgg ctcggagctg tcgaagtaga tgacgcggca gcggtccggg cccatcggga - 38701 tgaccatgac catgccgccg gcgacgcgct ccccgctgaa ccggggccgc agcgccactc - 38761 cggccaggtc ggcgaagcgc agctcgatgg ccggctcggt gccggggaag ccgatgcccg - 38821 cgagcttgcg cacgatgctg cgggcaccgt cgcagcccac cacgtggcgg gcgcgcaggg - 38881 agaaggggcc gtcggcgccc gcggcggtga cggtcaccga ggcgtcggtc tgctcgatgc - 38941 ccgtgacctc gcacccgcgg cggatgtcgg cgcccagctc gcgcgcccag ccgcccagga - 39001 cgccctcggt gcgggcctgc gggatgccgc gcgccccgta cgaaccgccc tcgatcaccc - 39061 ggtagtcgag cgggacgccg ccgaagtggc cgaccgggat gactccgacc tcgccgaacc - 39121 ggtccatcag cccgcgctgc gcgaattcct cgatggtccg cgccgagaaa cccagggcgc - 39181 gggattcctg aatcggctcg gaaagtttgt cgagaaccac caccgagact ccagcgagcc - 39241 tcaattcacc tgcgagcata agaccggtgg gaccggctcc cacgacaatg acatctgaat - 39301 cgtagaattc catctgccct cttctcactg gtgttccatc aatagtgcga gggcttacga - 
39361 gggctgtaaa taggcgttgt tacaggtctt gtgcagtcaa tgccagaaaa acgtctggta - 39421 cgtcagagct tcgacaagcg gtcttgcccc gggcgcgtgg ggtgacggca ttctctggca - 39481 tgacctccag tctgacgacc gatcaatccg catccgtttc cgccgccgag tcgagcgcac - 39541 aggtcgccgg tctgctgcac cggtatctgg tctcgctcga cgacgagcgg ctcgacgacg - 39601 cctggaccgc cggcctgttc accgaggacg cggtcgtcgc gttcccggtc agccggcacg - 39661 agggcgccga cggcatggcc gagtaccacc ggtcggcgct gtcggcgttc gcggccaccc - 39721 agcacctcgg ttctccggcc gtggtcgacg tggacgggga ccgggccgtg ttccgggcga - 39781 acctgatctc cacccatgtg caccacccgc gccacacgcc tcccgagggg gacctgcccc - 39841 cgctcttcgc gacgggcacg ttcgtgaacg gcgaggcgcg ccgcaccgcg cggggctggc - 39901 ggctgagcct gctggccttc cggctgctgt gggcggacgg ctcccctccc ccggcccggt - 39961 gaccccggcc gcggtgcggc ggcgcctgga cgtccggcgg cgccgcgccg cggtacacgc - 40021 gcgtgccgcc ccggacgcgg tccggggcgg cgggggcggt gggggggggt gatgggggcg - 40081 gtggtgggtg gtgggggtgg tggtgggggt ggtggtgcgg agccggcggg gcaggcgttc - 40141 agacgttcag gcgttcaggc gttcaggctg aggacgcggt cgaccgcgat ctcgatgacc - 40201 acccggtcgg acggggtcgg cggggcggac cagtaccgct tggcgtacag ccgtgccccg - 40261 agcgccaccc gttcggggtc ggtcacgacc gtgccggtcc cctccagcgt gacccagcgg - 40321 aagccgtcca cctggcagag cgccaccggg gcgccgggcg tggccagcag gttgcgggcc - 40381 ttgcgggagg agctcaccgt catcacccgc gcgagctggg cgtccgcgtc ccaggtgaag - 40441 cgcacggggg ccacgtgcgg tgtgccgtcc ggccgcatcg tcgtgaacgc ggcgacgagc - 40501 gccgtaccgg tcaggaacgc ctggacggag tcgggcaccg tcacggcgtc cgggcgcggc - 40561 atcgacggca tgggcgggtc ctcgcttcca gagggtgttg cgtgcgtggg cgcttcccgt - 40621 gctccgggcg gctgtcgcgc gggcgtcggg ggcggccgtg ggtccggggc cagcttgccg - 40681 ggggccgctc gaccctcgct ggacccggct cccccgcccg gcccgccgcc cgcctccgcc - 40741 gtacgccgta cggcatgtgt cgtgcgctgt gcgcccgtgg gtcgtgcctc gtgcgtcgtt - 40801 tcgggtgtcc gggctagtcg atgctgcgga cgatgacgcg tccgtcctcg tcctcgcgct - 40861 cctccgcgcc cgccagccgc aggggcggcg ggccgccgtg gaccgccctg gcgcatcggg - 40921 ccgtgtcacc ctcgtgccgt tcgtcgtcgc cttcgtgcat gggcacctcc tcggtgatcg - 
40981 gtcggcccag agtgtcaagg gtggctcgcg gcccggtcga cggccgcccc gaaggaagtg - 41041 gagcgcggcc ggagccagga cccggccggt cgcggcctcg agggccgcgg cgcgatgcgc - 41101 ggcagtgcct caccggcgag cacgtccagc acggccccgt tggtggtggc ctcgtcggtg - 41161 ccgggcagat gccgcagcag ccgggcgcag tgcccggcca gcaggcgggc gtcggcgtcg - 41221 gagatccggt tgcggtcgtg gtcgacgcag aaggtgaggc ggccgtcgcc gccgggacgg - 41281 accagcaggg cgacgggcag gtcggggcag gcgccgtgcg ccggttccgg ctccagtgcg - 41341 atgccggcgt cggcgagttc gttcctcagg ttgcccggcg ggcgcggaag gctgtcgacc - 41401 gagaccacgc tctgcagcag ttccccgtcg gggcagcggc ccgtccagcg gtggatccgg - 41461 cgggtggaga cccattcgta ggcggccatg tccagcgccc ggtcccgcag ggccgtcagc - 41521 agccggccga ccgtctcgcc agggtccacg cggaccacca tcggcaggca gttgcgcagc - 41581 ggcccgggca gccgctcggc gcagtccagg gtgatgccgc ggccggagac ggtgacgccg - 41641 aagcccaccg tcgcggcccc gccgggcccg gccgcgcggt acagcagcag cgcccagacc - 41701 gtctccaggg cgctggagtc gggtacggcg cgcagggcgg cccagcggtg gagccgttcg - 41761 gcctcggcgg ggctcagccg tacctcggtc ctgccccggc cccgctggcg ggtgcgcggg - 41821 ccgggccggg cgggcagcac ggcgaccggc ccgtcgggca cggcgccccg ccagaagtcc - 41881 cgggctccag cggggtcctg ccgctggagc cagcccgccc agtcgcgcag gtcggggcgg - 41941 cgctcgccgc cgggcagctc gccgccggcg aggtaggccc ggcacagctc ctgcatcagc - 42001 aggcacacgc tccacgcgtc cagcagcgcg tggtggaagg tgaggaccac ccgggtcacc - 42061 ggcccggcac cggccgggtc gtcggtgcgc tccacgaggg tgacgcgcag cgggcagggg - 42121 cggctggggt cgaggccgcg ccggcggtcc cgctccagca gccggtccca tccggcgccg - 42181 cccgcacggt ggcgcacgac gtcgccgtgg gcgtgctcgt gcaggaccag gtgcggccgg - 42241 ggccccgggg ccagggcggc ccgcagcacg ctctcccggt cgacgaccga ctgccaggcc - 42301 gcggcgaacc gctcggtgtc cagcgggccg tgccagcgcc agacgagctg ctcgacgtgg - 42361 cgcccggcgc cacggcgccc gccgaagtcg cccagcaggt cgaggtgggg ccacagggcc - 42421 ggtacgcccg gcggacgggc cgtgccgggg ccccgcaggg cacgcgggcg gctgtgccac - 42481 gccatgggac gccctcctcg tcgctgcctc ctcccgcacg ggccggccgt gcgcacggtt - 42541 ctcggggagc ggcgggcccc ttgagggggc gcggtactcc cccggcatcg tggcaccggt - 
42601 ggctgccatg ggcctgacgg cccgctgacg ctgctcgcga ccgggcggag aaacgcttct - 42661 gcagcggtgg ggccgtaccg gaacgcccgc tactgctgtc ccgtgtccgt catcgccgac - 42721 aggaacccct ggtccagcat ggtccccacg gaggtgtccc cggcggtgct cagtccggcg - 42781 ttgtggcagg ccacgctgag caggaagcgg tccatgacgg ggtaggtggc gaagccccac - 42841 tcgtcgcggg tgacccggct gccgtcgggt gcgctcagcc ggccctgccg gaagccgaac - 42901 tccttgaagc cgaaccgcag tccctgcccg agggccttgc tgtaggcctc cttcagggtc - 42961 cacaggcgca gtgcgtgggc ggtccgctcg ccttcgggca gctcggccag ttcccgggcc - 43021 tcggccggtg tgaagacctg ggtctcgagc aggtccagcc gtacgggccg ctcggccggt - 43081 tccacgtcca ccccgatgcg gccgatgcgg ctcaggccga cggccatgac gtccccggtg - 43141 tggctcaggc tcagttcgat ctggtcgaag ccgcgcaggt agggccggcc gcccagccgg - 43201 taggccaggt ccaggtactc gggcgggacg gccagggcgg cggccgccgt gtacttgatc - 43261 agcatgcggg aggcggcgaa ccggtagcgc accgcggcgt cgcgggtacg ccggtagcgc - 43321 tgccagtcgt cgccgagcag ttcccgcagc cgcggggtgg tcagcacgct gggcagccat - 43381 tcgctccacg tcgtgcagac cagtgcgttg ccgtgccgga agaggtcctc gcgcaccgcg - 43441 ggccaggggc cgtggggccg cggcacgtga aggggcgcgg cacatgtgac ccgctccatc - 43501 gtcgtctccc tgcgtgtggt tctcgccggc ccgctccccc gttggggggc gggccgaggt - 43561 ggggggcgtc ttgccgtgcc gtctcggtca gccggccagt ggggtgtcgt acaggtcgag - 43621 actgcggccg tgccggcagc gtcccagcgc ctcggccagg accgcctgtt ccgcgtccgc - 43681 cggtgtctcg ggtacggcga tgccgagtct gcggccgatg cggctgagga cgagcaccgc - 43741 ccaggccggg tcggcgagga agccgtcacc gtccgcctgt ccctcccaga ccccgaggca - 43801 ggcggcggcg cacagcagca gggcgtagcg gtcggccagg gcgcaggcca gcgggtcgaa - 43861 cacggtgctc ccggcggccg gcagggccgc gcagcgcgcg cgcagcaccc gcagctcctc - 43921 caccagggcg cgggccagcg cggcgagggc ggcgtgcagt ggttgtgtcc ccgtccgtgc - 43981 ggccagccgt tcggcggccc cgatcagggt ggccgtgagc gggtcgtcgg tcccggagtg - 44041 cgtcagcctg cggtggtcga gcggtggcag cggcgcgccc ggcaggaaca gtgcggcgct - 44101 cggttcggcg gtccggaacc acgccgtgcg tgccagggcc ggcagctggg gtacgagcac - 44161 cgcctggcag acggccgttc ccgagtggcc gagtccggcc acgggcaggt cgcgggcgag - 
44221 tttctggaag ccgccgtaca gcgggccgcg gtcgtagccg cgggcgccga gcacggcggc - 44281 gagttcttcc aggtcctcgc gcagcaggtc cggcatggtg tatttgaccg ccgccgcgag - 44341 cagatgggcg tgctggggta cgaggctgag cgcccgcagt cccgtgacgg ccatggcgtc - 44401 gcaggcgagc aggtccgcga agaccccgct gagtgccttg tgccagcggc gggcgggccg - 44461 tccgtcgggc cggttctcgg tggcggcgcg caccgcgagc cgcaggacgc tgtccacgcc - 44521 cgcgagcacc gtgcccggga tgaggcagtg gctgatctgg aagctgcgca gggccagggt - 44581 gacgccctcg ccgagcgagc cgaccagggc gctgtcgggc agtcgtacgt cggccaggcg - 44641 cagtccgtgg aagcgggccc cgcgcatgcc gggcatctcc acccgcgcca gccggcgcac - 44701 ttctccggag gcgggtggtc cgggcagcag gagcaccgag tggctggcgg agccggagcc - 44761 ggcggaggtg cgggcgtaga cgacgaaggt gtcggtgcgg tcggcgttca tgacggcgtc - 44821 cttgctgccg ttgagcagga agccgccgcc cgcagggcgt tgtgcgcgga cctcgcggcg - 44881 caggatggcg ttggcgtgtg ccacctcccg gtgcacgatc gcgacccggc ctccgccgag - 44941 caggacgtcc gcgagggccg cgcgctggtg ggtgtcgccc gcggtccaca ccgaggacgc - 45001 ggcgaacagc gaggtgatgc cgaagccgta gccgagggcc aggtcgcggc ggaagagcgg - 45061 gcgcagcacg cgggccagct cttcgaggtc cctcaggcgt ccgccgaggt cgtgggggac - 45121 gaactcggcg gacaggccgt gctcggtcag gagcgcctcg gtggcgtgtg gtgcctcgcg - 45181 ggtgtcgtcg gcccggacca gggccaggtg tccgtgcggg ttgaccgggt cgaaggggtc - 45241 gccgagcgcg gcctccagcc gggcggcgcg ctcgggttcg ggtgcgcggg tgatgtgttg - 45301 ggattcgggg gtggtgtgtt cgggtgcggg tgtgggggtg gtgctgcgcg ggtcgggggc - 45361 ctgccccgtc ggcccggcgg ccgtgtcgag ggcggcggtc acaggacccg caccgcgtcg - 45421 gaggcgtggc gcacggcgtg ctccagcagg cggcggccgg cccggccgac ctcgtcgcac - 45481 acccgccggg cggcgtcctg gtccagtgcg gcgtcgtcgt tgagcagcac gtcgtgccgc - 45541 acggtgacgt cgaggccggc tccgggctgg ggctcgatgg tccactcgcc ggtgtacgcg - 45601 gccagcggcc cggacgtgcg ggtgtgtttg tgcacgaggc ggccggcggc ggggaagctg - 45661 atgcgcaccg cctcgccgcc ggtggccgac cggccgtcca gggcgaggac ctggatgccg - 45721 ggggtgtcct cctgcaccgt cagggggcgg gtgccggcga ggtcgtcggg ccagtcgccg - 45781 gcccggtaga ggaagtcgaa gaccagctcg gcgggcacgt tgacccggac ggtgtcctcg - 
45841 aaggacatca cgaggtcgtc cagccgggtc cagcgctcgg cgagccaggc caggcgctgg - 45901 agctgggcgc ggctgttggc gcgggtgacc cgctcggtcc aggccgcgtc ggccggagcg - 45961 tcgccgacga cggtgaaggc gtgttccagg gtcacccggg agccgtcgcc caagggctcg - 46021 acggtccaca ggccggtcat cgtctcgacc ggggcggagg gccgttcctg gcggaactcc - 46081 acccgccgct gtccgacgtc caggcgacgg tgggagaccc aggagctgat ccggtcgccc - 46141 gccacggccc acatgcgcag ccgttcccgt gtcccgtcga agtccagttg ttccacgtgg - 46201 acgctgggag ggaagaacag cggccacacg gtggcgtccg cgatcaggcc gtagagcact - 46261 ccgctcgggg ccggggccgt catctcacag gcagtacggt gcactcgcgc atccggcatc - 46321 gtccacaccc tccgtcgtcc aaggcgtcgc cgccgggccg gtccccgctg ggccgcacgc - 46381 gtgccgggtc caccgggggc gggccggtgc ggccgggccc gtcgtactgc ggcttttctc - 46441 gaccctgtcc ggaaccgcta gggatgtgcc ggtagcgcgc tcgtgtcccg ctggagcggc - 46501 gccccggggg cacgcgctcc agcgggaacc gtcgggtcct cgagcccggt ggccgacggt - 46561 ggcctgcggc cccagaagcg atccgggagg tggcagggat gagacgcttc cgcccgcgcc - 46621 gatgcgtccg tggcctgtgg gagggtctgg tcgcctacgg gcggctctgc ctggccggcg - 46681 agacggaccg gtacgaccac cctccgcgcc cgcgcgtccg gtggcaccgg ccgccgccgg - 46741 gacacccgga acgggtgcgc gacgacatgc ctctgaccga cctggagcgg cgcctggccc - 46801 gcgaactgac cgacgaggac cacgacgtcc gctaggcggg gacgccacca cgcgtgccgc - 46861 gggcggggcg gcggacgccg ggcagccggg agacacggac ggccgggcag ccaggagacc - 46921 ggcaaggccg gaaggccgga aggccaggag ccggaaggcc gggcagccag gagacctggc - 46981 agaccgggga gccaggaggg ccaagagccc aggagcccgg gaggccagga ggccaggagg - 47041 ccgggagccc aggagcccga aggccggaag accggagggc cgggagtccg ggagggccgg - 47101 ggagtcggcg ccgggggtgt ttccctttgc gcggcccgcg gggcgcgggc cgttcctggc - 47161 cgccggtgtg ttccgctccg tctcgttagg ggcgggccgt cactgcgcct gaggggcccg - 47221 gagcactgcg gcggagttga agccgccccg tccgcgggcc agtaccagcg ccactcgcag - 47281 ccggggcagt tcccgtgggg ctccggtgac caggtccagc gggcagtcgt cggcgacgcg - 47341 tccggttccg gtggtcgggg ggacgacttt ctcgcgcagg gcgagcagcg cggctgccac - 47401 gtccagggcc gagccgcccg cgcccagccg cccggtcatc gtcttcggca cggtgaccgg - 
47461 tactccgtag ggtccgaaca gcgcgcacag cgcctggctc tcgacgaggt cggcgcgccg - 47521 ctcggcggcg ccgtcggcga agaccacgtc cacgtgttcg ggggccaggc cggcgtcggc - 47581 cagggcgagt tccgcggcct ggcgcagtgt ggggcggtcg gggccgtcga aggtggcggc - 47641 gcagccggcg atgacgccgt agccggtggc gccccggcgg gcggcggccc gggcgtcctc - 47701 caggacgagc agggcgccgc cctcgccgac cgcgtggccg tcggccgtgg ccgcgaaggg - 47761 ccggtaggcc cgggcgggtt cggtggccgg gctgagccgg ccgtccgcca ggtgcgcggc - 47821 ccagccccat gcgcacagtg tggagtcgat cccgccggtg accatgaggc atgccccgtc - 47881 gcggatccgc cgccgggcgc gggcgagtgc gtcgatgccg ccggcctgtt cgctgacgac - 47941 ggtcgagccg tggccgcgca gccggtgccg gatggagatc tgtgcggggg ctgccgcgtg - 48001 gaaggacgcg aaggactggt aggcgctgac gtgctgggcg cctttgctcc acagcgcggc - 48061 cagtccccgt tcgccgaatt cggcgccgcc cgcggagctg gcggtgatca cgccggcgcc - 48121 gtatgcgggc aggtcggccg ggctcacgtt agcgtcgcgc agtgcttctt cggctgcgac - 48181 cagggcgatg cgggtgccgc ggtcggtgga gggcagcagt ctgctgggga tgtggtcctc - 48241 gtcgacgaag ccggggatct cgccggcgat gcgtacgggg tagccggagg cgtcgaagcg - 48301 ggtgatgggg cccagtccgg tgcgcccgca cagcacggcg tcccaccagg ctctggtgcc - 48361 caggccgttg ggtgcggcga ctccgatgcc ggtgaccagg gtctggcggg ggccctgggc - 48421 gccggcgggg cgggccggtt cgggggcctg ggtcgccttg gtcatgcggc ctccttgagc - 48481 tgtggccggg tgaggacggc ggccgtgtgg aagccgccga agccgctggc gacggtgagg - 48541 acggtgctgg tgcgctgttc ccgggcgaac aggggggtgt agtcgaggtc gcaggtgggg - 48601 tcgggttcgt ggaggttggc ggtgggcggg acggtgtcgt gccggatggc cagggcgctg - 48661 gcggccaggt ccagggcgcc ggcggcgccc agggcgtgcc cgatcatcga cttgatggag - 48721 ctgacgggca cgcggtgggc gctgccgccc aggctttcct tgagggcgtg tgtctcgtgc - 48781 cggtcgttgt gccgggttcc cgcgccgtgg gcgctgatgt agtcgacgtc ggcggggttc - 48841 agccgtgcct ggtcgagggc ggcgcggatg gcgtcggcca tctccagtgc cccggggcgc - 48901 agtcccgtca tgtggtgggc gctgctgtgg gcggtgacgg cggacagttc cgcgtagggg - 48961 cgggcgccgc ggcggcgggc gtgttcgagt tcttccagga ccaggacggc ggcgccctcg - 49021 ccgagcacga atccgtcgcg ggtgcggtcg aaggggcggc tggcggtggc ggggtcgtcg - 
49081 ttgcgggagc tggtgaggcg caggcggtcg aagcaggcca tggcgatggg cacgatgggt - 49141 gcttccgttc cgccggcgac gacgatgtcg gcgctgcctt cccggatcag gtcggcgccg - 49201 tggccgacgg cgtccaggcc ggaggtgcag ccgctggaga cgagagcgac ggggccctgt - 49261 gcgccccggt cgcgggcgac ggtggcggcc agggagctgg ggacgaagta gtcgtagagg - 49321 gattcggcgg cctcggtgtg gtcgagggtc caggtggtgc cgcagtcgct gaggatggcg - 49381 tactgggtgg ccaggctcgt ggtgcagccg atggcgctgc ccaggctgac gccggtgcgc - 49441 agggggttgc ggccgatgcg gtccgcgacg ccgctgtcgg cgacggcttc gcgtgcggcg - 49501 accagcgcga actgtgccgc gcggtccagg cgttcggtgt cggcgaggtc gaatccgtgg - 49561 gcggcggggg tgaagtcgac ctcggcggcg acgcgggagc ggtagccgca ggcgtcgaag - 49621 agggtgacgc ggcgggtggc ggtgcggccg acggtgagca ggtcccagaa gccggcggtg - 49681 cccaccgcgc cgggggcgac gacgccgatc ccggtgatca cgacgcggtt caccggccgc - 49741 ctcccgtggg cagcgcggtc acgtggccgc ggcaggcccg gccgacgtgc tgggccaggc - 49801 tcgaggagct tgcgaagaag tgtcccccgg cgacggtgtg cagttcgatc aggttggtgg - 49861 tccactgctg ccagtggcgc agggcggcgg gtgcggcgag cgggtcgtcg cggcccgcga - 49921 agaccaggac gggcacgtcc agcggccctc cggtgaccgg gtccagggcg gcgttgcgca - 49981 gcgaccgggc caggcgcagg tcgtcgcgca ggacgggcag gaaggtgcgc cgccacagtc - 50041 cgccgggaga ggccgaggcg cccggcggca gggagccgat ctcgtcgagc agcggcagca - 50101 ggtcctcgtc gggcaggtcc gccgcgtccg ccaggacggt ggtggtgtgc gggggcgggc - 50161 aggcgccgac ggccaggaac agcgggggca ggccggagtc ggccagggcc cgggtgagcg - 50221 tgtagccgac gagggctccc atgctgtgtc cgtagagcgc gtaggggccg cggcgtgccg - 50281 tctgaagcag ggtcggcagg aagtcggcga gcaggccggc gcgttcggtc aggcgtggtt - 50341 cgcggcggcg gctgtcgcgg cccgggagcg gcagggcggc cacgtcgatg ccgggtccga - 50401 ccgccgcgga ccagccgcgg tagctcgcca cgcccgctcc ggcgtgggcg aggcaggtga - 50461 gtgtgatccg tgcggtgccc gcctcacggt ccctggagcg ggaagccatg cgtcgccctc - 50521 cttgtgaacg gtccggtccg gccccatccg ggcgggcgcc gccggcgtgg cgcgtgccac - 50581 gcggtgccgt cccggcgccg gtccgggggg tgggtgcccc tgcgcaccga gcgtcgcccg - 50641 cgcggctcgt gcggcgctca accccgcggc gaggcgggcg gcgaccccgg ccggcggccg - 
50701 cggcggccgc cgcccctgcg ggggccggcc tgccgggtcc ggccgggcgg cgagggcacc - 50761 ggcgtctcat gccgcgtaca ggtcgaacgt ggaggtgcgc cgggggcccg ccacgatgtc - 50821 caggcgcggg tcgacggcga gcatcgcctg gtgcagccgc tgcagttgcg gggagggttc - 50881 gacgccgagt tcgtcgatga gccgctggcg gagcctgcgg tacacgtcga gggcggcggc - 50941 ctgcctgccg gagcggtaga gcgccaccat ggcctgggag tgcagccctt cgtgctgggg - 51001 gtggcgggcg atcaggtcgg tgagttcggc gatgagttcg acgtgccggc ccagccgcag - 51061 gtcggcgtcg atgcggcgct cgcgggccac cagccggctc tgctccaggc gcatcgcctc - 51121 gatctccagg acgggcccga cccgcacgtc gaccagggcg gggccgtccc acaggtcgag - 51181 cgcccggcgc agcaccgtgg ccgcccgctc gtcctcgccg tcctcgtagg cctgtcgtcc - 51241 ttcggtcacg agccgctcgt aggtgaacgc gtcgaccgcc tcggcgggta tctgcagcag - 51301 gtacccgccg tagcgggtgg ccaggacgtc cttggccgag cccggcacgt cggggcccat - 51361 ggccgtgccc agcaggcggc gcagctggag gatgtacgtc tgcagcgtgg tcatcgaact - 51421 ctgcggcagg tcggtgcccc agatctcctc catgagggtg ggcaccggca ccacccggcc - 51481 ggggtacagg gcgagcagcg ccaggatctg ccggggcttg cccgcactgg ggacgaccga - 51541 gattccctcg aattcggcgt tcaacgcacc caggactttt atttccataa ttccctccgc - 51601 aatgtttcgg ggcgactggt tctgagccgt tgacggagct acttgatact gcctccttgc - 51661 gcctgtccgc gtcattcccg ccactccgcg gcaagaggaa ccggacggtt ctctgatcgg - 51721 cgcgcgaggg cggctctagt tattcttgac ccgtccctgg aagacaggag gctgcggctt - 51781 tgtccgggct gtcgccgggt taccgctcac gggtggtgat tttgcgcccg gtacggtcgg - 51841 gggcgtattc gtttcggttg tttttccggc cacggcgagg gccgcggtga gggccgcggt - 51901 gacggcgtcg ggcggcgcgt gcggggccgg ggagcggtgc cggccgtccg gggacggtcg - 51961 tggccggccg tccggtggcg gagggtttcc tgtcccgggc ggcggcgccg agcccctgtc - 52021 ccggccggtg gcggagggtt ccctgttccg gccggtggcg gagggtttcc tgtcctggcc - 52081 ggcggtaccg ggtttcctgt cctggcgggc ggcgggtggg tgtcaccggc tgtccgggcg - 52141 gggcgggctt ttcggtcgcg gtgtcctgtc cttttcgggc gggccggggc cgcgggggct - 52201 gaagaactct cgaggaatcg cccacgccgg tacggggccg gctggagaat agcgtgccgg - 52261 aaaccatggg cggatagagt ccgtgcggaa ggaagtgcac ctgctattcg tgagggaata - 
52321 ccggggccgt gatccgggcc ggcggatgcg gaatcgggtg cttcccgggc aagggcgaga - 52381 tggagttccg gattcttggt tccgtgcaga tccacgacga gcgttttggc gtccgggtcg - 52441 ttcccgcggg tgcgaagcag cgtgcgctgc tgggtgcgct gctggtgagg gccgggcagg - 52501 cggtgccggc cgagtgcctc gtggaggagc tgtggggcgg gcagcctccg gtcaatgccg - 52561 ccaacgcgct gcaggcccat gtggcccggc tgcggcggct gctgccggcc ccgggcccgg - 52621 gcgggccgcg ccatgtgtgg ctgcggacct ccccgttggg ctacaccctg agcctggggc - 52681 cggcggtgac ggacgcgcag cgcttccacc gtctggtggg ccaggggcgc gagctggccg - 52741 ccaccgcccc gggccgggcg gtggaggtgc tgcgcgaggg tctggcgctg tggcgcgggc - 52801 ccgctctgca gggcagcggc caggggccca tctgttcggc cgaggcggcg ctgctggagg - 52861 agagccggct gcgtgccctg gaggtgctct acgacgtgtg tctgcgggcg gaccgctgtg - 52921 cggagatcac cggtgagctg gaggagctgg tcgccgtgca cccgctgcgt gagcggttcc - 52981 acgagcagct gatgacggcg ctgcaccgct gcggccgccg ggcggaggcg ctgagcacct - 53041 acgacagggc gcgccggcgg ctggcccgtg atctgggtat cgggccgggc caggtgctca - 53101 gccgtcgcag agaagcgatt ctgcgttcct gtgagccggc ggcggactcc gccgaccggg - 53161 cgggggccgg gacggccggg cagggcgggg acgaactcgg ggtgctccgg gaggagctgg - 53221 tgcggctgcg cggccacgtg gagctgctgc gccggcagca gcgggagctg tccgagcagg - 53281 tcgcccggct cacggcacac catccgtgcg gcccgtgagg aacggcggcc gggtcagcgg - 53341 gtgacgaggc ggccgctgcc gccggcggcg gcgggcgtct cggggcgggc catgaggatg - 53401 gagcgctgca ggcggctgag tgcggcggag ggttccaggc ccagttcgtg cacgagtgtg - 53461 ctgcgcagcc gctggtagac gttgagggcc tcaccgcgcc ggcccgagcg gtgcagggcc - 53521 agcatgaact ggccgtgcag gctctcgtgc atgcggtact ggttgaccag gaccgtcagt - 53581 tccgacagca gttcccggtg gcgtccgagc cgcaggtcgg cctcgatgcg ctggtcgagc - 53641 gcgcacagcc gggcctcctc cagccgcttg acctccgtgt cgatgcgcag gccggcctgg - 53701 atgtcggtca gggcctgccc gttccacagc gcgagcgcgt cggccagccg gcgggccgcg - 53761 ccggcgtagt cctcggcgtc catggcccgg tagccgaggc cggcgcgctg gtcgaactcg - 53821 cggtagtcga cgtggccgcc gcgtgtctgc aggcggtagc cgccgggaac cgtggcgagg - 53881 atgtccttgg cggtgcagcg ttcgtcgggg ccgtgggcca gcgcctgggc catcagctcg - 
53941 cgcagctgca ggacgtaggt ctgcagggtg gtccgcgcgc tgcgcggcgg gttctccccc - 54001 cacagttcgt cgacgagcgc ggccaccggg accacctggt cggcgttgag cgcgagcagg - 54061 gccaggacct ggcgcggctt gggtgcggtc ggcacgaccg acaccccgtg ttcgcgcacc - 54121 gacagcgcac ccagcacttc gatgtccacg tttcccccat gttttcaagg ccgcaggccg - 54181 gtggccggcc tgcgcgtctc ccgctgaccg ggacccggcg cggctgcagt cccgataaaa - 54241 aaacagctca gtcggtttgt caatgtggac tcgacgcgtc gccccggcat cgcccagatc - 54301 cagtcaaacc ctgatcgaac atctgcccac aacccggctc cgagcaggcc gttcatcact - 54361 caacccgccc atgattcgcc agtgttgcgc gaaaccgcgc cctgtacagc accggagcga - 54421 ttgactggaa accatcggcg cggatcgcgc gggacgggga agccccgcac agggaaaagg - 54481 ggcgccattt cccgaatgcc cgattcgggc gtccggtcgg cgcccccaaa ggagaccgta - 54541 cggtctttaa ttatccggtg gcggtcccgg tccaggagcc ctcggcctgc cagagcccgg - 54601 cgtgcggcgc cggcgcgagc gcgggcagga gcagcagcca gaactgggcg accgtgctgc - 54661 gtgacagcca cgcctggttg cgcatgccga gcacctcgaa gccgctggtg gcggcgacca - 54721 cggcggccac ggcgctctcc ggcgcgacgc tctcgcgcag ctcgccgccg cgcccggccc - 54781 ggccgaccat gtcggtgacc cagttctgcc agcacagccg caggtcggtc cgcggctgcc - 54841 ggccggcctc ccggctcagc tcgaaacccg cccgcagcac cacgtcgttc tgcagggcgc - 54901 aggccagctc atgggtggcg ttcaccaggc actgcagaac cccgggcggt cccccgtccc - 54961 accggccgca gacggcccgc agcacgtctg cggccgcttc ctccaccgcg tccgccagcg - 55021 ccgccttgct ggcgaagtgg aagtgcagtg cgccgttgct cacccccgcc ctggagctga - 55081 tcgtggtgag cgcggcggcg tggaagccct cgtcgtggaa gatctcggcc gcagacctga - 55141 tcagggcttc ccgcgtacgc accgcacgtt cctgtctggc catcgatcac tccgtcactg - 55201 cggggggttg ccgtgcttgc gggagggcac gtcggcgtcc ttggtgcgca gcatcgccag - 55261 ggactcgatc agcacctcgc gggtctcggc ggggtcgatg acgtcgtcga ccaggccgcg - 55321 ttcggccgcg tagtaggggt gcatcagctc ggccctgtac tccttgacca tgcgggcgcg - 55381 caccgcgtcg gggtcctcgg cctcggcgat ctgccggcgg aagatgacgt tggcggcgcc - 55441 ctccgcgccc atcaccgcga tctcgttggt cggccaggcg taggtgaggt cggcgccgat - 55501 ggactgggag tccatcacga tgtaggcgcc gccgtaggcc ttgcgcagga tcagggagat - 
55561 acgcgggacg gtggcgttgc agtacgcgta cagcagcttg gcgccgtggc ggatgatccc - 55621 gccgtgctcc tggtcgacgc ccggcaggaa gccggggacg tccaggaagg tgacgagggg - 55681 gatgttgaag gcgtcgcaca tctggacgaa gcgggcggcc ttctcggaag cttcgatgtc - 55741 caggacgccg gccagggcct gcggctggtt ggcgacgatg cccacgacct ggccgttcag - 55801 ccgcgccagg gcgcagatga tgttgcgggc ccagccctcg tggacctcca ggtactcgcc - 55861 gtcgtcgacg atctcctcga tgaccctggc catgtcgtag gggcggttgc cgtccgccgg - 55921 caccaggtcc agcagcgcct cggaacgccg ggactgcggg tccgagcagg gcgtgcaggg - 55981 cgggaactcc cggttgttct gcgggagcat cgacagcagg tagcggacct cggcgaggca - 56041 ggtctcctcg tcgtcgtagg cgaagtgcgc gacaccggag gtctcggcgt ggacgtcggc - 56101 cccgcccaga ccgttctggg tgatctcctc gccggtgacc gccttgacca cgtcggggcc - 56161 ggtgatgaac atctgcgagg tgtcgcggac catgaacacg aagtcggtga gggcggggct - 56221 gtaggccgcg ccgcccgcgc acgggccgag catcacactg atctgcggga tgacccccga - 56281 cgcccgggtg ttgcgctgga agatgccgcc gtagccggcg agcgccgaga cgccctcctg - 56341 gatccgggcg cccgcaccgt cgttgaggga gaccagcggg gcgccggccg cgatggccat - 56401 gtccatgatc ttgtggatct tcgtggcgtg cgcctcgccc agcgcaccgc cgaagatccg - 56461 gaagtcgtgc gcgtagacga agaccgtccg gccctccacc gtgccccagc cggtgatcac - 56521 accgtccgtg tacggcttcc tggcctccag cccgaacccg gtcgcccggt gccgccgcaa - 56581 ctgctcgacc tcccggaacg accccgcatc cagcagcagc tcgatccgct cccgcgcggt - 56641 cagcttgccc ttggcgtgct gcgccgccgt cgccttctcg ctcggcccgg ccagtgcctg - 56701 cgcacgcaca ccgtgcagct cggccacccg cccgcgcgcg tccgccggct ccgcgggaag - 56761 cgccacccga ggaatgtcat tgagtatcgt cacgatctgt ccctccctca tggcgcggcc - 56821 cggtcgtcgc ttcaccgtaa caaaccatct atgcggtttt ggttcgggga gctcggcgcg - 56881 cacaggaatc agccatggaa gatgcggtgc cggcctaccg ccagcagtag ggggaccggt - 56941 aggccccggc ccggtgtccg ggccgccacg gggcagcccc ggaccgctcc cgcccgcccg - 57001 gcccctcgtc ccggcgggcc gtcagcgcgt acagcacggc ggtgagcgcg gccagttcct - 57061 cggcaccggc acgtccgcgc tcgatgcgca cagcgggcac ggcccgctcc ggttcggcca - 57121 tgtcccctcc tctcggcgtg cggccaccgt ccgcccgcgc actacaggag cgctgcactt - 
57181 ccgctcgaga ggacgggcgc cggccccgcc gccccgcagg cgcccgcagg ggcccgcctt - 57241 cggcaacaga gcagggtgcc gggcggagcg acggcttccg gaagggcggc ctccaagagc - 57301 ggctcgtcgg agggaccggt tcccctagaa atcaaaccgg acggtcccta tctttcatca - 57361 cgtccgtcac cgacggcgga cggagcgctt tcgatacgtc cattagcagg gggaaaaatg - 57421 gctaccagcg cgttccccgc aacacacccg gccctcggcc aggagcccgt actgcccgcc - 57481 ggcaccccgc ggttgcggcc cagcctcttc cgctacccga acctgacgac gaccgtcccc - 57541 aaggaactgg tccaccgcgc cgccgtcgcc gaggtcatgc tcaccgactg ggagcgcgtg - 57601 gacgacacac gcttcaaagt cgccgcccag tggccgcgcg gccacagctt cttcaccccg - 57661 atcgacggcc gctaccacga ccctctcatc gccgccgaaa cgatccgcca ggtcggatcc - 57721 ctcctcggcc acgccgaatt cggcgtcccc ttcggccacc actacctgct gcacgacctc - 57781 agcctgcgcg tcgacccgca ccacctgatg atccaccagg cccccgcctc cctcgacctc - 57841 gacgtgacct gcgaggacct caagatgcgc ggcggccgcc tcgccgccct gcgctacgag - 57901 gccgtcgtac gccgcgacgg ccacaccgcg gcgaccggcg tcttctcctt ctcctgcgtc - 57961 tcccccaccg tctaccggcg gctgcgcccg ccccacgtgt tcgccgacgg ccaccgcccc - 58021 ctgccgctga ccgcacccgc cgccccgcag agcgtgggac gcatgtcccc cgccgacgtg - 58081 gtcctctccc ccaccgagga cccccaccgc tggcagctgc ggctggacac ccagcacccc - 58141 gtcctcttcg accaccccgg cgaccacgtc cccggcatgg tcctcctcga agcggcccgg - 58201 caggcagcag caggagccct gggaagaacc tccctgctcc ccctcggcct gaccagcgaa - 58261 ctggtgcagt acgccgaact cgacatcccc tgcatcatcg aggccgcccc ccaccccacc - 58321 cacagccccg gcctcaccac cgtccacatc accggacacc aacgcggcca gaccgtcttc - 58381 acctgcaccg tcacagcagc agacgcctga cccccgccac cccgccgccc ggtcagcggc - 58441 cggaaaaacc cgccacatgg tcggccgccc actgaccaaa cgaccgcgca ggcctgccca - 58501 ccaggcgggc gaacgtcccg tccaccccgg ccttggcccc ctcccgctgc cgcacagcac - 58561 tccgcagcag cgcctccacc accgccggcg gataccgccg gccccaccgg gcccgggcct - 58621 cctcccaccc cagctcctcg aaacgcagcg gacggcccag cacacacgac agccgggccg - 58681 tccgctgaac cgccgagacc gcctccggac ccgtcagcac atacgcacgc cccgcatgcc - 58741 ccggccccgt cagcgcccgc accgccacct ccgccacatc ccccggatcc acacacgcgt - 
58801 tcaacgacgc cccgaacagc tcacgcacca caccctcggc ccggacctcc gccgcccacc - 58861 ccagactgtt ggacatgaac gaccgcggcc gcaacaacgt ccaggccagg cccgaggaac - 58921 gcagcagttc ctcgctctcc cgctgccagc gggtgatcag gtcgtcggcc cccgcatcct - 58981 cgacagcggc cgccgacagc ttcaccacat gctccacacc cgcatccgcc gccgcccgca - 59041 caaaacacgc atcctgatcc cccccgacca ccgtcgtcac caaaaacgcc cgcctcaccc - 59101 cccgcagagc cgcccgcaac gacgccgcgt caccgtaatc cccacggacc accctcaccc - 59161 gccccccggc cgccacccgg gcaggatcac gcgccagaac ccgcacctcc acaccggccg - 59221 gcaaccgccg caccacctcc ccgcccaccg tccccgaccc acccgtcacc aaaaccacca - 59281 caacgccccc caccccgaac ggccgatccc cacctgtcgc caccgaagtt acccacccgc - 59341 acgtcttggc cacacgccca ccgacgttaa aatacgaact agacggtttg taagcgaagc - 59401 cttccacagg gctcatcgca caacgggagg gcaacgtgcc ggcacaagaa cgagcgatcc - 59461 gcacacgcca gaacatcatg ctggccgccg ccacagtctt caacgaacgc ggctacaaag - 59521 ccgccaccat cgccgacatc ctcaccacag caggcgtcac caaaggcgcc ctctacttcc - 59581 acttcccctc caaagacgac ctcgcccaag aagtcctcgc cacacagaac cgcaacctca - 59641 ccatccccga acgcccctcc aaaacccaag aactcatcga cgtcgtcatg ctccacaccc - 59701 accgactcca gaccgacccc atggtccgcg cagccgtccg cctcaccatg gaccaactct - 59761 ccacagaatt cgaccgcacc ggccccttcc gccaatgggc cgacctcacc cgccaacgcc - 59821 tcgaacaagc ccgcgaccaa ggcgaactcc tcccccacgt caaccccaca gaaaccgccg - 59881 acgtcctcgt cggcgcctac gccggcatcc aatccatgtc ccacgccctc accgactaca - 59941 ccgacctcac cacccgcgcc aacgccctcc tccgccacct cctccccacc atcaccctcc - 60001 cctccatcct cacctccctc gacctcaacg aaaaccgcgg cgcccacgtc tacaccgaaa - 60061 tccacaccac cacctgaacc acacccaaaa acaatgaagt ggatcgcgcc tgattgcctc - 60121 atccaagagg cgagttgagc gatcaatccg aactgagaac gtcttccgtg aaccgtgcgg - 60181 gatgaaccgc gggacggccc caagccattg ccgccgcagc atgaacgcaa gtcccggtgc - 60241 cccggccgca ggccgctgcc ggaccgggaa gccccgtgca ggaacaacac cctgccccca - 60301 acacagcaca agccggccgc acactcggta ggccgtagcc gccagccagt tccagcagga - 60361 ccgggcgttc gacggaacac ccccgtgtcg gcgggaagga ccgctgccta cccctccacg - 
60421 cctgcccgca cctgaccttc ccggcacacc gccccgtgag tgccggaacg cggaggtcgc - 60481 cgaccgacgc gcagcagcct cactgaggcc cacttggtcg gccccgctgc agacctcgat - 60541 cgcaagaacg ttgaggaacg cgccgtggag gccatcacac gcttcctctc cctccctgac - 60601 ctggaattgc tgccctcggc agaccgcggg agatccaaga ccgttggttc aagcgagtcg - 60661 cagtcggcct aggttgcggt ggccacgtcc gaacacatct caaggagaag ttcatgtctg - 60721 acgcgaagga ggccggagac agagccatgt cacatgaggc agcggacgac agcgaccgag - 60781 acggcggaag aggatcctct aggctaggct ggcggctttc ctgcctggcc gttgtggtgg - 60841 ccgttctcgc cgtcgggacg ggaggccggt atcggcacac ctccggctga gatcgaccgc - 60901 tccggtcctt cctcgacaac aagagatcgg ccaccagggc tactggatca ccaacgcggt - 60961 ccaggtcacc ggcgactaca ggctcgtcgc cgagcgaccg gacgtggcac gcggccagca - 61021 gtcataggcc gtaagcgccg ggtcgcgggc agcggccctg tgcgatcact gacccaacac - 61081 cagagctccc gtaacgagac cgcgatccgc agtcctcagt ccccagacag cgggcgcgcc - 61141 acccggcttg ggttagtcag ctgtgctgct ggctgccctg gagagactgg tcggtcatgt - 61201 cggcaacctg gcctgctggc ggggcctcgg cgttgacctc agtgccgaag tccgagaact - 61261 ccatcaccgt gctcatctgc agctgctgag gcgaagcgct gccttccggc ttcgcggagg - 61321 cggaggctgg ggccttgagg gtcatctcta tctgctgacg gcgcagtcgc cctttgtcgt - 61381 cgagccagac gtgcatcggc agcgtcgggc cgacctgctt gctcagctgc tcgccgcccg - 61441 gcagcttgga gacgtccacg gacaccttgt actgcgtggt gttggccccg tcgatctcct - 61501 cggttccggc cttggtgacg tccttgttgg tgatcgccct ggcgtaggcg gcggtctggg - 61561 ccgggtcgcc gatctgctgg ttgctcaggc cctgctgcgc ggcgaccttt tccaagtcga - 61621 tcttgatcca gggtttgccc cccagagcct tctcaccggg aatcttctgg tagagaacct - 61681 ggtcgaccac gcgttgttcg atggtcttgt cctgcacggt aagggtcatg acactgtcgc - 61741 cctccgccag gtcgaggacg cccttaccgt cggatgtgat cgtcttgccc tccgcggcga - 61801 gcttcatctt gatcgtcatc cgcgcggact cggcttcggc cgtcttgtcg taggcagccc - 61861 gaacctccac cgtgccctgc tcctgggtgc cggcgctgct actcgcgctc ggcgacaccc - 61921 cgtccctctt ggcctgcgaa ccgtcaccgt caccgcaacc cgacaggaca acgctccccg - 61981 tcaccgcggc cactacgatc gcgccggcct tcatccccct gtagcgcatg cgaatctcct - 
62041 caacgagtac caacccccgt cacgtcggtc tgctgggctc cgaatgccct gaccaagggc - 62101 caacacgcct gtgtgcaaag tgaattgttg atacgtcccg cacggagaca gatattcacg - 62161 cttcctgcca ggtccaacgc tgctgctgcg atgtacgccc acacgcttcc accagccgca - 62221 atcaccatcc tgctgcccat cgaccgcatc gccgccgacc gcccccttct gctccggcga - 62281 gcacaagaga cacgggatga acgtgcaggt cccggccgat ccgtccggcc ggctgctgtg - 62341 ggcctctccg gctctgcccg gtgccgtcca cgacgtccga gccgcccgtg aacacgacat - 62401 cgtccgcaag ctcacggacg ccggcatcac gtgttggacc gacaagggat accgaggcgc - 62461 cgggggcacg gtccgcgttc cgttggggcc gtcgggagac acttcccgag gccagaagga - 62521 cgtcaaccgg tctcacgcca agaaatgggt cctggtcgag caagccgccg ccaccctcaa - 62581 tgcctggcga ctcctccgca acctacggtg ctcgaccagt ggcgtcacaa gcctcgtccg - 62641 ttccgtcgtg accgtgcatt tggccagcac agacggaaaa ggctcaatga cgaccttttg - 62701 agcgtcccat acagatgccg actgctaccg cgaggacggc aacgacgaaa ggaccgttcc - 62761 catggttccg ccagggaacc aaagtgcagc cagagcagtc atctttttcc accctattat - 62821 gtgctgcgtt actgctccag atcctgcagg cctagcaaca caacgggccg accgccgggc - 62881 cctcgcctgg actgacacac ccctcatccg ctggacttac gaccactctt catggcgtag - 62941 gtaagcatcc cgatgccggc gactccgaga actcctagcg tgaggagtat gaccctccca - 63001 gatccctcga tgagagatcc ttgaacgaga gcagcaactg acaccacacc actgacagcg - 63061 gtgaatatct tcaactttcg cttttcatcc acttccaata ctccgctctt gagacatgaa - 63121 cacgaccagc ggtggagagc cctacatgcc ctccaccgca gatgacgaat agggtcagcc - 63181 cttcctgaac ccctcagccg taggtgatta tctcagcgtt gttgtagccg aggacccctc - 63241 cgacggcgca gctcgtcact acagcgcccg ccgttcccca cgggccgaag gtgctggccg - 63301 ccgcgatgat tcccgtttct gccgcagctc cgactccagc gacgcaaccc gtgacagctc - 63361 cccaaatgtc gttggtgtcc tcgaggaagt tggacacact gtcgaggaac ccgagtccgg - 63421 acggatccat gttgttgatg gggtcgccgg cagcgtagag gtaggggttg gtttcctggc - 63481 cggaggggtc gggctgggtg aagcggccga gggtggggtc gtagtagcgg tggcccatct - 63541 tgtacaggcc ggtcgggtcg gcgtaggcgc ccgcgtagcg gtacggctga gggacggcct - 63601 cggtcggcgt cgtgcgcggc agtccggtgg ggccgtaggt gtaggtgtgg gtgcgcttgc - 
63661 cggtgtcgtc ggcgaggccg aggacgttgc cggtggcgtc ggtgaggtag tagtaggact - 63721 tccccccagt cgtcatggag ttcagcgtgc ccgccggttc gcggatgaat ccggtgtcga - 63781 cgccgttcgt cgtggtggag gcgaggccga gggcggtgtg gtggaaccat gtggagccga - 63841 gtttggtgcg ttcggcgttg gtggtgccgg catggaccag gtcgtaggtc ttgccgcctg - 63901 cggtgatgcc ggacagttgg ctgtagtccg tccaggactc gtccgtgcgg ggggtgttgt - 63961 cggctgcggc ggtttcgttg ccgagtttgt cgtaggacca gccggtggtg gagccgttct - 64021 tgccggtcag ctcgctggcg tcgttgtagg tgtaggtggt gccgccgggg caggtgttct - 64081 tgctgccgtc tcggctggtg aggttgccgg ccttgtccca gcagtacagc cacgacgcct - 64141 tccgcgtgcc tgccgcgtcg gcctcgagcg cgtaggagag gcggtcttgg gagtcgtagg - 64201 tgtaggtggt cttgagcttg gtgaggttgt cggtgcgggt gcggatcttg gtggtgtcct - 64261 tgcccgcgtt ggcgtagctg taagtcaggt cgacgaaggt ttgcgtgccc gaggtggtct - 64321 tgatcgcctg cgggcggccg ttcttgtcga tggtgacggt ctgggtggtg ccgccggggt - 64381 agacggtctt ggtgcgcttg tcgttgttgt tgtagtcgaa gtcggtcttc ttgccgtccg - 64441 gtgcggtgag gtagtcgagg cggccggcct tgtcccaggt gtagtccgtc gtcccggtcg - 64501 gatcggtgta gaagtcgacg tcgccgccgg gggtgtaggc gagtgcggtc tgggcgccgt - 64561 tctgcagggt gcggacgctc tcgcggttga gcttgtcgta gtcccacttg gtggtgccgg - 64621 aggcgtcggt gcgggacttg acgttgccgt cgccgtcgta cgagtaggtg acggtgaagt - 64681 tggtggagga gacctcgtgg acgcggtcgc gggagtcgta ggcgtagacg gtggtgatgc - 64741 cgcggccgtc cttgaccgtc tcgacccggc ccagcgcgtc gtaggtgtag gtcgtctccc - 64801 cgagcggcgc cggcggtgtc accttgatca ggttgccctg gtcgtcgtag gtgaaagagg - 64861 tgaccttgcc gttgccgtcc ttggcggtgc agcgctggcc ctcgaaaccg ccgcaggtcg - 64921 gggtgtcttt gttgtaggtg tactcgcggg tcgtgccggc ggtgccggat gtggtgaccg - 64981 acagggtgtt gccgttggtg tcgtacttga aggagtcctt gcggccgttg gcgccagtca - 65041 tgtcgctagg caagtcggtg ccggcgatcg tctggtaggc gctcaccgac gctgtcgcac - 65101 ccatcggcag cttctgggag acggggttgt tgcggtcgtc ccagccgtag gtggtggtgt - 65161 tgccgccggt gccgtccgtg ccggtgccca tcgcgtcgat cgcggtctgg gtgaggtggt - 65221 tcttgtaggt ggcgtggcgg gagtggccga gggggtcggt gaccttggtg acctcgccgt - 
65281 cagcgttgtg cgtgtagatc gtttcgtcac cgtcggggtc ggtgaccgtc gtcgtacccg - 65341 cgtccgaggg ggtggccgcg gtgtagtcgt agcgccaggt cggcccggtg tggccgctgc - 65401 ccgaggtgcc ggtggcgcgt tgcatggagg tgacgcggtt gtggctgtcg taggtgaaga - 65461 gggtgacggt gccttcgggg gtggtcacct tcgtcaggcg gcgtgaggag tcgtactcgt - 65521 aggcggtggc cttgccggtg gtgtcggtga ccttggcgag gtttccggcc gcgtcgaggt - 65581 cgaggacggc ggtgcggccg gtgtggtcct tggcctgcca ctggctcgcg tccgtcttga - 65641 ccaggtcgat ccagcggccg gagcgggtct cggtgagctt gaagcccttg tgctcggcgc - 65701 cttcgtcgtg ctggtcgacg gtgatcgtgc ccttgttctt gtccgtgacc ttggtgagcg - 65761 tgccgtgctc gttgtaggtg tccttggtgc cggacttgcg gtcggtgagg gtgtaggtgc - 65821 cgtccgcgtt cttcttcaga tccttcgagt agcccgtcgg cgtcgtgtac gtgccgtccg - 65881 cgttagcggt gaagcgcagc aggctgccgg tggtatcgaa gacgtccacc tcgccgtcgt - 65941 tgatctgcag gtagcgttcg taggcctgcc accagcgctg cgacaccttc ccccacggtg - 66001 cctcgaggga gttgtaggtg cgggtcagct gaagtttctg gccgacgccg gcgatgtcga - 66061 agtcggtcgc ggcgagcatc aggttgccgt tggagacgtt cacccgcgcg accagtgcgt - 66121 cattcaggcg ggtgtcgagg atctggtgcc agggcacctc tccctggccc tcgggcacgt - 66181 agccggccac cgcagcatcc acggcagccg agcgagatgc ggacgtcttg gcgcgctctg - 66241 caccggcagc gcgggccttc tgcgccgccc gccaggccgc gacctcggcc gacggcttgg - 66301 cctccgcctc cgaggtgggc gccttgaccg tgccggccgg tgtcgccggc gcctccacct - 66361 tggtcggctt cgtccacgga ctctccggct ccggcaactc cggtttcggc gtcgccgcca - 66421 gaccgggagc cgccgcgatc accacggcag ccgcggtgat cgccgagacg agagcggttc - 66481 tgtgtgttct ccggtcacgc cacatgggcg tgcgcgcagc acgcgagtgc atcagcttcc - 66541 ccccacagga agtcagaccc ggcaacccca gcggtcgcca gcggcacaca agctgtcaca - 66601 agacgcacac aaatcggcgc ggcatccccc cgacgtacag atgcatgcgg gccggaacca - 66661 gccctaccgc ttcaccccga caaaccagga cgctacccct gtaaacccgc atacagcggg - 66721 cggagttgtc ggttccgtta tcgttttcgg agggcagctt gactggaatt gtttgatcca - 66781 gggcgtcttc cggtccgcta cggtttccga ccgccgtctt tcggccagtt tcagaccttt - 66841 ccgggggcct gtcgcgcagg ctgagcaggg tgttctcgct ggccatgacg gcgaacaggt - 
66901 gatcggagaa gttgtctcag aggacggggg gcacggcagg tgccgctgcg cacccggttt - 66961 cgccgaatgc acacttggcc cgtcctgcat gcgtggtccc ccagcccgcg gcaaccaccc - 67021 ctgtcgtgaa ggacgcccct gcgatgagca caccgggcag acacacgccc tgctcccgtt - 67081 ccagccgcca ccacgttccc gcccagcggc tcacgcgctt cgtgcaacag gccggccgcc - 67141 tgctgtgctg gagcctcacc gccggcatga ccaccgccgc cctcgacctc ctcatcacac - 67201 ccgaagcagc ctggtggcac atgatgtggc ccctgccctg gtacctcacc tgcctctccg - 67261 cccctctctg ggccaccctc cgcgcccacg aaaaggccgc gcaccaacaa gcgcctgagg - 67321 aagacaacga catcccctgc gagtgggaac aagccgcctg actcgacgac accggcggat - 67381 ccggctggcg gggtaaccga gcatggcggc ggcctgtgac gccgtagccg cgtgctgctc - 67441 catgacgccg gccgtccgct gcgcgcgcag ggccttcagt gccgcctggg cggtgttgcg - 67501 atgtacgccg aagcggtcgg tgagggcggg ggcggcgtcc aggagctgcg cgacgcgcgc - 67561 gggcagctgg tcgcggggga cttggtcccc ggcgccagtg ggccggccgt ccccgccgtt - 67621 ggtgcggcgg cgtccggggt atagtcccag acgatgtggc ggggccagtg ctcgaccccg - 67681 cccacgcgca ccaggtgctc gctgacgacc gcttccttgc tgcgccggtc aaccggccat - 67741 agctgccatg atcagcacac cagttgcacc gcacagcagc accacaagcg gccatgccag - 67801 acagccgcgt ccggtacgcc tgcgccacag caccagccac agcgcacacg ccgccacgaa - 67861 caccaccgtc acaccgctca tctcgcccgc ccgccacgcc acctgcatgg cgccagggtc - 67921 agcgccccat acgaggagcg caacgagcac gcatcgtcag cgcacacacc gcttccagca - 67981 gcctgctcat catcgttcta ctcccgagtt ccttccgtcc ctgcgcgggc ggaacggacg - 68041 gcacggcctc gatgatctcc gtctcgcggc cttccgcgtc cgtgctcacg gaccgtttct - 68101 cccctgcccg aggaccaaac atgggtgcct cggactccga gaactcgacc cgcgtcttga - 68161 ccatcagggt cttgccgttt gcctctttga cgaccttgcc gtccggcccc atcagcggcg - 68221 tctcttcagg catcttggac tcgtccaccg tgccatcagg atttacccac tccggggtgg - 68281 gacgtccccc atcagagcgg gcccagcgtc agaaacagct gctcgccttc aacgacgtca - 68341 ccgtcgagat ccgatcctcg aactctcaag aaccgtccca gagccccaga cgtgtgagcc - 68401 gacgctgccg cagccgctct ccagccgctg tcagagcgaa gaggagccac acactcagcc - 68461 cggccagcgc tgctaccaca gggccatcag attcctcctc agacgacaca atcaggaaga - 
68521 agaatgcaaa ggacacagcc atgcagaggc cggcgccgac cgggtgccgg gccacccact - 68581 tctgaatccg agtcgggcgc ctctgcccac caagcgcccg gtccaccgcc caaaacgcat - 68641 tacccagaga ccgccaccag ctcgtcactg ctgaaggata cgacagccag tcgggcacgc - 68701 cgatagaagg ctcgggcccg agctggttga gagacaactc agccttccca aggtgcgact - 68761 gggccagctg tccgggcgct tgaatccttg cgtgccgata gcaggaaaag gaccgcagcg - 68821 gcggcggcga acccgaagcc gacgctgctg caggccatga ccgtctcgaa tggagcgtcg - 68881 gcgatccggg ggatgccgtt gacgagcatg agggcgtaga tgcacaaaat ggcgtaggcg - 68941 cgaagccgca tcccggcttg tcgcttgcgc atccacggcg gcgtccaccc cgccagtatc - 69001 gccaccggca tcggcagcat gagcgttgtg gacactgcca gcgctatcca gtggtacagc - 69061 ggatttccgt tcatcccgac cccttcgtag gcgatcacca gcctacggag ggttggcgag - 69121 gcccgcccca cgccgaacac tacgagcttc cggcgggtgg cggcaccgga gcaggtgtct - 69181 caggagttcg ccgcgaccgt agtggactgg atcggatgca tctgacctcc ggcgtcccag - 69241 cctccgttct ctcagaggta agcccaggcg acaggcccgg gacgggacac aaacccaccc - 69301 gctcaaatgc ccgctggacg acacctgcgg ggcttctcgt cgaacgccgc tgtcacggac - 69361 gccctaatag ctcgggggtg cggggaagcg gtcagtctga ccaggtcgaa gacctcgcag - 69421 gtggcgttcc gcttcaggcc atatcgttcg tgaggctggg tggggcccca gacaggtcgt - 69481 cggctcgtgg ttcggggatc cacccgacag agcccgccca attgcctggc gggccacgtt - 69541 gcccctcatg gctgcgattg caaacccaac gtccccgaga gaacagcgcc gaagacaacc - 69601 cgcatgacga gtcgaacgcg tcgcgcgtgc gcgcacagtc atcttcacag cgatgcttca - 69661 ccagagcatc ccggtgaagc atcgtctcat ggctccgggc agaggcccgc caagggtgct - 69721 cctcggcggg gcctcgatct atcaccggcg ctgtcacgcg tctgtcacca actacgccga - 69781 cgccaccgga ccgcaaggcc ctcacctgct aaacgcacac accatggact ggcgtggacg - 69841 cccatagacg gtctctacaa cctgtgccat gtagtgcgcg ccaccgagca gccaggcgtc - 69901 gttcacgagg atcgtccact tgctggagtc caggacctgc cctaccccac gctcggtggc - 69961 ctcgctcatg gttctgaagt tcttgatcac ttcggcgtcg atgccgggga tcctctccgg - 70021 ggcgatcact tcgtcctggt ccagccggtt cccggcgatc agtcccttgc ccttgtggct - 70081 ttccatggcc cactgggcgg ccttgtagac gttgaaagcc acgcgtacgc gctcttcgga - 
70141 gaaggaggtt tccaggccct ttttatcctc ttctctggcc gagttgatgt acagagggcg - 70201 ggcttcggcc gccgcccgct tgaattcatc tcagttctgc tacatttccg gtttcctctc - 70261 gtgagcgcat tactgggttc cgttgccttc ccggcggaca accgtcggca tgccgacatc - 70321 gcccgcacgt acgtggcgag cgtccgtccc cggccgggcg gcggcgagat cgtcctcaag - 70381 ctcggtgact cgttgctgaa gccgggagtt cttgatgctt gggctccgtc cgggcagtag - 70441 aaacagctaa cacgaggcgg ctcgtcatgt cccatcgcct gcggtacaac ggggcgtgct - 70501 cgcggcagaa ggccatggga cgggcagaga tgggacgggc agagatacgg gggtggttta - 70561 tgaacagaca ggaccgagcg aatgcggtgg accgggagat gtctgcgcga ctgatgccag - 70621 atgcggctct cgaggctctg gggggttggt ggggccagaa cgccgtacgg ctcacggacg - 70681 ggacgcccgg cgcccacacg gtccgctaca cacccagccg gtgggcgcac atcactacgt - 70741 ggccctcgat gatggcatcg accttccagg cgggtgacgc cgacgtcagc cggacacagg - 70801 tggcctccat cgtcgcggac gcgctggagc gcggagcctg tgaggaggcg ctggttgcta - 70861 cctatgtgtg gggaaagggc aaaggcggct ccccggccgg aagcggacct gccacgttgc - 70921 acaagattct gctgggcaca gagggcctga acgcgatact cgccagcgtc gtcaatacgc - 70981 tgagggagca ggacgccgaa gcagcctacg cggaactgcg gggtcgcatc gccgggttcg - 71041 gcccgtcgtt ttactccaag ttcctgtact tcgccggtaa atcggtccgg gcggcgtccg - 71101 gcacccagcc gctcatcctt gatcaggtcc tggcccggcg catgcggtcg ctggcccagg - 71161 cggtgggtcg ggagaccggc tacgaccctg acggctcgat cgccaggtgg gtctggcggg - 71221 acacaaactg gtcaccgcac cgctacgcga tctacctctc cttcatgcag gcggcttccc - 71281 gtcaggtagc agcaactcat tcctggccct ccaatgcgac gcccgacctg ctcgagtacg - 71341 cgctgttcac gacctcgtgg gtcgagagcg ccgaggccac atgaaaccga gggacgaccc - 71401 cggcagtccc ggccgccagg gataggacct gggacaggtg gtcgatccaa ggtggttcgc - 71461 gagcgtctgc gccgcaggcc cccacgacgt ctgcgcaccg gcctgggccg accgctgacc - 71521 agacaacgca tgaacagaca cggcccagga ggacacgcgc ctcacacggg aagagtgctt - 71581 gggacaactg actagctcca ctcagatcgg ggctggctgt cgcgctcagc atgggaaggg - 71641 gcttctggac ctcggtctga cggtcctgtt gctggggctc gagacggcgt ccctggctgc - 71701 gttcctgttc gtctaaggtt ctacaagcgt gggctgcaca aggaggaccg gttccggtgg - 
71761 gaagcctcgc ctcccctccg ccctgaacgg cgcagcggcg tcgtcggcct cgatcgtgtc - 71821 ccggatcagc cgcagcggaa cctcggagac cagcgcgcct tcggctcgtc gccgccgtcg - 71881 accctccgga tccgctggtt caccgactcc gcgaggtcgg cgaggcgggc ccgacactgg - 71941 tcgggcggca tggaactact cccacaaacg cggtacggct cataggcccg gaccgcgacc - 72001 tgccccgacc tggagctgcc cttggcgagc gcagggacga cggttctgcc cgttgcgcgg - 72061 cctcgcctcc caggacgacg ggccgaccca gccgatgttc ccgccgggga cacggcaccg - 72121 tcccgtgcag tgccaggtcg gacgacgacc gcgagcggta agacacgctt gacgtgatgc - 72181 ggtgcccggg agccggactg ctcccccggg tctccgtgat ccggatcaag gagttcacgt - 72241 gagcggcccc ttgatcgcaa ccgaatgggc tctctaggag gagatggtct cttcgccggc - 72301 tgccatggcg gtcgcgaccg ggtctggacc gtggcgcccg tcgaactcct cgtaggcacg - 72361 ctcgatctct cggtgcacat gtgccgcgaa gggtccccac tcgcggtggg tgacgaccat - 72421 gaattgtccc tgctgcatgg cctcgaccac ctgctcgccg acccggccgg ggtcagctcc - 72481 ctggaggagc agcgcgctgt tcttctcgac gacggcggcg tccatctcgc ggccgagcag - 72541 cttcgcctcg gcggcgccgg cgttgaagtt gatcggggtg gcgaccgcgc cggggacgag - 72601 cagtgaaacg ccgacgtgcg tgcccgcgag ctcctcgcgg agcgccatcg acagccccac - 72661 gcttgcgaat ttcgaggagg tgtaagcggc cactcccgcc atgggtatca ggccggagat - 72721 cgaagaggtg ttcacgatgt ggctacggcc gccgcgactc ttgaaccgcg gcaggaacgc - 72781 tgccacagag gcgaactgcg cgtcgacgtt gacgccgtgg acccagcgcc acacctgaag - 72841 cggcgtgcgg tcgaccgttg tgccgccgtt cacgccggcg acattgcaca ggatcgagat - 72901 cggtccgagc gcttcctcgg cgcggtcggc catgctctcc caccggtcgg tctcactgat - 72961 gtcgaagggc agggccaaga ccgtgccgcc ggcgtcccgc agggactgct cggctcctgc - 73021 cagccgtgct tcgtcgatgt cgaccagcgc gaccttcgca ccggcggcga cgagcgcgtg - 73081 ggcgaccccg aagccgattc cggatgccgc gccggtgaca agtgctgctt cgcctgtcgg - 73141 ccagttcatt atcgtctccg cttcgtcgag ggacggttga atgggacgac gccccggttg - 73201 cccgaagtca cgcgtgggca ggccgaatcg tcagtcggga aacgcgtggt gaataccagt - 73261 gccacgctag tgaccgccga tcgcatgatc gcccgccgac tgtggcgcgc tcgagcccag - 73321 tcccccgccg actggcgggg gacgctggtg ccggttcggc cctctgtccc gtgtggccgg - 
73381 accgactacg tgttccaggg gctcccgggg cgtgtcgggg ggacggggtc ggtgaggcgc - 73441 agcagcaggg cggcggcgat gtagcgcatc ctgccgacgt tgctgcgcgg gtcgtagccc - 73501 agggtgtggg tcagtgcttc atggcgggcc tgcacggtgg agtggtgcat gcccagttcg - 73561 gccgccgcgg agcggacgct gtcggcctcc accagcgtgc ggagcacgtc cgcggagcgc - 73621 cggtcgaggc gggcgagggc gcggacgtcc tcgtgcgggt gctccgggtc gtaggtctgg - 73681 gccagcagga gcatcgctcc caggtccgcc gcgtcgacgg ccggtgtgga ggcgtccgtc - 73741 agtcggagcg ccacgatcgc cgcctcccag gattcggggg cccggtcggc tcgtaccggg - 73801 ttccgaaccc gactggttcc ggcgggcggc ggatggtgcc cgagagatcg agggtggctc - 73861 tcagaagtcc gtaccgggtc ggcacgatcg cggagggggc ttcgctgatc tcgggggcgt - 73921 ccgcggcggt ggccaggaca cgcaccggtg tcgccgggtc gatccggcgc ttggcgagga - 73981 gcgcggtgcg ttcggcgacg gagcgggcct gatcgacgat ggcgtcgagg ccgcgctcgg - 74041 gactgcggcg cgcgtcaagg agttccactc ccagcgcgag ccgctccacg atcatctcgt - 74101 cggcgggctc cggctccccg tcccgctcga gccacaccgt ccagtcggcg tgggacctgc - 74161 gggagctgtg gcgccggcgg tcggcgtcgt cggtgaccgg gtgtccgtcc gggtcacgcc - 74221 gggtcacgcg ccctcggatc ttcgcgccgg cgacggtgcc ggagaggacc gcggcaccgc - 74281 gcaggagtcc gtcgagtccg gcgccccgcg tgatgaggac atcgaagtac gacacgatcc - 74341 gaagcgtttc gcccgcctgc gggtcgagtg agttcagtcg tccgaccagc tggtgcatct - 74401 gtactccttc gcaccattcc ctcagcttac cgaggaccgg ggacgtcgcc tcaggacccg - 74461 aggaggcggg cgacccaggc gttacgggcg gcggtcatgg cgtgcgccag agcggtgtgg - 74521 ggtgcggtca ggccgaaccc gtggaagcca ccgggccaga tgtggagttc ggcctgtacg - 74581 cccgcgtgcc acagggccgt cgcgtaagcg acgtcctcgt cccggaacac ctcggccgag - 74641 ccgcagtcga tgaacgcggg tggcagtccc gtgagatcgg tggcgcgtgc gggagcgcgt - 74701 aggccgatac gtcgtcggtt ccgcgcctct ctcccagcag cgcggtccag cccatgacgt - 74761 tgctcccgcg gtcccatacg ccgacagcgt cgaactgggc cgaggagacc gtccggtccc - 74821 ggtcgtcgag catcgggtac atgaggacct ggccgatcaa ggccgggcct tgccggtcgc - 74881 gggccatcag tgcgacgccg gcggcgagac cgcccccggc gctctgtccg gcgatgatca - 74941 gcctgtcggg gtccattccg agctctcggg cgtgctcggc cgtccacagc agacccgcat - 
75001 agcagtcctc gaccggatag ggatcggggt gctcgggtgc gagccggtag tcgacggtga - 75061 ccaaaacggc gtcgtgctcg atcacccacg ggagggcctg gaccaggccg gagaactgat - 75121 caccggagac catgccgccg ccgtgcgtgt ggtagatccc cggcccgagc ccctgatgat - 75181 cctcccgggc gatcacagag acggtgattt cgtcgcccag gtaccccggg atcgtgacgt - 75241 cgcgtcgggt cagaccggag atcgcgagca tctcgtcggt gacctctgcc ggtgccgccc - 75301 ggcgcatgtc ggggatcatg tccgcggtca gggtcggcgg gatctggtcc gcgagggccg - 75361 cgagtacggc ctcgagctcc gggtcgaacg gggggcgcgg aacgctgctg gacatgggaa - 75421 ctcctggttc ttccgcaccg catggttgcg gtgtacatca atcgtgctgg gtgggccgcc - 75481 tcgtgccgaa ccgccgaacg ccgcagtctc ggaccgtgtc ctccgccgct cgcgcgtctt - 75541 gtccgtaccg ggcgggcaca gcccggtacg gacaagacgc gcgagccgtc cgtaccggag - 75601 tgttcaggag cctcagccca ggcacagaag ggtcttcccg ccgatgccgt ggcgcagcga - 75661 gtggagggcg tcgacaaggc tctccagcgg cagttcccgc acccagccgg tggtgtgtag - 75721 aacccgtcgg ccatggccgc gatgacctcg tcgaactcct cgggccggta gccgaccgcg - 75781 cccacgatct cggtctcgcc catcatgagc cgggtgggct ggaagtccat ggtgtgttcg - 75841 tgcagtgcgg cgaccaccag gcggccgccg gggaccaggc ccgccatggc ggaggtgacc - 75901 gcagcgcccg cgccggcggc gtccaccgcg gcgtccactc cgtcaccgtc ggtgagcgag - 75961 gcgacggcgt ccgcgagatc ctcgttcacg gggtcgatga cacgggcgcc cagcgcggcc - 76021 atgatcgcgc ggcggtcctc actcggctcg gacaccagca ccttctccac cccgcgggcc - 76081 ttgaaggcga accaggtacc gattccgatc ggtccggccc ctgccacaag tgcgctgccg - 76141 cccggtcgca caccgctgcg cgcgacagcg tgccagccca ccgccatggg ctcgacgagc - 76201 gcgcccatcc tcaggtcgac cccgtccggc agtacgtgca ccttcgacgc ctcgcacacg - 76261 gtgaactccg acagaccgcc gccctccacg ttcgacccga gcgagcccat cagcggacat - 76321 gagaagggca gcccccgacg gcaggccgcg cacttaccgc aggagaccgc cagagggaag - 76381 acggcacagc ggtcgccgac ccgcacgtcc gtcacgccct cgccggtctc gacgacagtg - 76441 ccggagaact cgtgaccgag gatctgcggc agggtggccc cggtgagggg gtgcggctcg - 76501 tccagggaga acggcagcga ctcggggtag aagaagaagt ggaggtcgga gccacagatg - 76561 ccggcgaacg cgttgcgcag cttcacctgc cccgggccgg gactgggctc cgccgcctct - 
76621 tcgatgcgga tgtcttccct gccgtagaac cgtgctgcct tcatgtttct ccttcgtttc - 76681 cctgttccgt ggccaccggt gaccggtggc cgttcctgtc ggcgcggacc gtctcgtcgt - 76741 gcgccgccag gtgtgccgac cccacgctca gtccggtcca ggactgctga ggcgacggcc - 76801 ctgcttaccg cccgctcgtg cccggagacg gtgcgtcgag agtgcgggcg actcatccgt - 76861 tccgggccgc gatcgctgcc cgtgcgatgg cggagtccgg cgcgagcatg tcgaatccgt - 76921 ggtagccgcc gggccataca tgcagctcgg cctgcacgcc ggagttccat aagagcgttc - 76981 gcgtaggcgg cgtcctcgtc ccggaacacc tcggccgagc cgcagtcgat gaacgcgggc - 77041 ggcagtccct caaggtcgct cgcgcgagcg ggcgcggcgt agaccgacac ctcgtcggtg - 77101 ccacaccggt cgcccagcaa cgccgcccat cccgtccggt tgctctcccg gacccatctg - 77161 ccggcgtcct cgtactgggg gctggagacg gtgcggtccc ggtcgccgag catcgggcag - 77221 atcaggacct gcccgatgag cgcgggtccc ttgcggtcgc gggccaggag tgccgtgccc - 77281 gcggcgagcc cgcctccggc gctggcgccg gcgatgatca ggcggccggg gtcgatgccg - 77341 agttcggcgg cgtgttctgc ggtccacaca aggcccgcat agcagtcctc gaccggacag - 77401 gggtccggga actcgggcgc gagccggtat tccacggtca cggccacggc gtcgtgctcg - 77461 acgatccagg ggaggatctg gctcaccccg atcacgcgct cgccggcgat catccctccc - 77521 ccgtggatgt ggtagatgcc cggacccgtg ccggtgtgac cggagcgggc gatcacgctg - 77581 gccacgagct cggcgccgtg gtggccagga acggtcacat cccggcgcgt gaccccggcg - 77641 gcgagcaggg tcttgtcgga gacgacgggc agagcagctt gccgtagaac cgggatcgcc - 77701 ccgggtgtga cggccggcat cggttcggcc agggcggtca gggctgcctc ggcttcgggg - 77761 tggaagggcg ggcgcgggtg cgtgggcatc aggctccctc ggtatctgtc aggtgcccat - 77821 ccgggtgggc tcctgtcatg gtccggcggg agaacaggcc gacggcaccg ccgcacaggg - 77881 cagatgtcgg gcagttgccc cgccatccgc gcgccgtatg cccgtgggga gccgcgggca - 77941 gaggcagcgg cctccgcgcg aagcgcgtga acggcgggtc gagcggtggg catccgccgc - 78001 gaacggggtg ccgtcaggca acgccccggt ccaccgtggg tgtagtccgc tgcgaacccg - 78061 agcggcggta cacaagcgag cggagaagca gaatcgggtc ggcgggggaa gcggccttcg - 78121 tcaccggcgc ggcatcggga atcggcctgg ccgtcagccg ggcactcgtc accacggggg - 78181 cggaggtggc gctcgccgac atcgatgagg agcggctcga cgacgacgcg aagaagccgg - 
78241 ccggtgccgg cggcaccgca atggccgtac cgctcgacgt gagcgacgct gacagctcgg - 78301 cagccgcggc cgaccgcgcc gaggaggcac tgggaccgat ctcgatcctg cgcagcaacc - 78361 cagcagctcc cacaagcagg tcagagcccg catcgagcac cttcgcccgt atgaagggga - 78421 tcctccgcga cttccgtctc aagggcaaca gcgcgcacta cgcaatgctc agcatcgccc - 78481 gcctgcacaa cctcgccctc acaggtgaac gaacactccg caccgcaggc cacctcaccc - 78541 gcgtccattg ggagatcatt tccgggacag ccctttagtc gcggctggcg accatcaggt - 78601 acccatcgct ctcggggtcg aaagtggtcg actccaccct gagcccgacg ctccgcaact - 78661 gcaccacgag gtcctcgtac cggtagggcc agatggacaa ccgctccgag caggctcgca - 78721 ctgccccatc gggctcgatc tgggcgacga cgatctcgag gaagtgttcc tgctcccagc - 78781 gctgctcgat ctgccagtag tagctgacga ccgcatcgcg gtcgttgcgg cggacgagtc - 78841 ggtcgcggac gtctacccgt gagccggcgg agcgcacgag ctcccagttg cgtgagtgga - 78901 gcaccaggcg tccgcccggt ttcagcagcc gtgacatcgc tgccagcgcg gccaggcgcc - 78961 cggctgcgcc ctcggcgtgc ccgagtgaat tgccgacgca gaacaccaga tcgaacgtgg - 79021 agtcctccag gtggtcgggc agctcgtccc atctcgcgtg gagggctcga agcgagacac - 79081 cctgctcgtc ggcggccttc tcggtccggc gaaccatccc atcactggcg tctgcggcga - 79141 ccacgtcgag gccgagactc gcgagaccga cggcgagctg gccggttcca cacgcgcagt - 79201 cgaggacgcg tgcgctgggc ggcacagagc ccacgacatc gctgtagtag accgcggctg - 79261 ccttggcggg ggtcaacctg tcgtccccga tcagccactc gtacacctcg gaaagcgccc - 79321 catacccagc caccgcgaca acctccacca ctcgacgacg cgcgggctgg accacccggc - 79381 gattcggacc ttgcgcctcg cactgtcccg ggccgtgtca gcgaagcatc ggccaggacc - 79441 caaccacgtt tagccgctga gactccaccg gatttcgtgg gaaaccgcga cacgacgcac - 79501 cgatgcgatt gccctctcac cggtacccat cagtcaccgc ggggaccacg gtcggcaacg - 79561 atgttggaaa agccgaacaa tgcacggatc gcagccctcg catcagcctg gggcaagtcc - 79621 gcctccgtga cggtggcgtc aggcgcgatc ttcagcgctc cagtcttctc ggagcgggac - 79681 cagtccggga aaaccactct agctgccctg acctgcgccc tgtccggtgg cagtctgcgg - 79741 cgcactcgcc ggagcggtgt gcggcgcggc gtgatcggct gacttcgtga ccgagagccg - 79801 acaccgtttg tcaccgagtt tgggcagcgc ttgtcgatcg cagagccgga aaacgttggt - 
79861 gagaactgac accggcgcga gatgagtgaa cctgtctcgc ggcgctgcgc ggctcttact - 79921 aaaggggccc gtcacatagg gagggagaac agccgtactg gccctgaggg ccaccgggca - 79981 tcgtcgagca ggggcgtcac catggtccgc agcggcatgg tcacgaggcg gccttcgggt - 80041 tgttcgacga gtacgtcctt gtcgagcggg tgccatccga ggcgctggta gagcgacacg - 80101 agaggaggcc ggcagaagag gagtgcgtgt tgaggaccca tcgttcgggc gtgctccagg - 80161 gcagctgtga cgacgaggcg agcgaagccc tgaccttgca tggcgggtga gacggccacc - 80221 ccgccgacgc ccaccacctc tgtctcggcg tcgctgatcg caacaggcag tcgcagcagg - 80281 ccggcgtgtg ccacgaggcg gccgtggtgc cggatgccga agtgctcttc tttcggcagc - 80341 caggtcagac cggtccaggc gacaccgaag ggatcatcgc tgttgccaag gatctcctcc - 80401 tggtccgcct tcgtgtactg ggcgagccgc accacagtcg gtgccacagt ggactggttc - 80461 tcagacatac ccacatgatg atctctccgc cgaccactgg ccagagtgcc gtgcccgcga - 80521 tggctcaccg ggttcgctgg ccgctgtgac cgctggactg gttggattac ggctgatcca - 80581 ggcgcacgca gggcggctgt tcaccgacca cggctacgac gcggtgacgg tggccgacgt - 80641 ggccaaggct gccggcgtct cctcaatgac cgtgtaccga aacttcccca ccaaagggga - 80701 cctcgtcctc attgaccagc ccgcccagct catcgccgag cacgttgccg cgtcgtccgc - 80761 aacgcaaccc ctggtgcgcc gcatcggcag cgccctcatc gacgcggcca ccgcctcgac - 80821 cagcggcaac ggggacgaac aggcagcgga cgaacggttc ctgctggact gcctccggct - 80881 tatggtctca acgcctgcgc tgcggccccg gcatctcgac agccagtacg cgctccaaca - 80941 agccatcgtc gaagcgctcg gaaaggacgc ggccgatccc gacgccgcgt tccgtgccga - 81001 ggcccgcgaa cggcatcggt aggtctctct cgccacggag acgcccctgg gtcgtaggct - 81061 gcgggcatga ggcgggggga gacggaaaat cacagcgggc gtcgacggct cacatggtcg - 81121 aacgtcgagt ggaatcgggc ggctgcgctg tgcacggggc aactgccgct ggtgtggttg - 81181 gcatggtggt tcgtcatgga ggcgggccac gacgactacg accaaggcgg cggcgccttc - 81241 ctcggcatct tctgcgtgat gctgatcctg ccgctcctcg gcctcctgca cgcgaccgca - 81301 cagatcatgc ccgccgcgac cctggcccgc atgcggcctc gtgccgtccg aggcccggag - 81361 tgggcctggc atctgggcgg atccgtgctg atcggcaccg ggtggtcggc gcttgggtat - 81421 gccttgtggg gttggccagt agccgacgcc ctcccgtggt tcgccggcgt cggcgccctg - 
81481 ccggtgctgc tcctcgcccg cctgcgcgga cgcccgtggg gtccgagggg cagctcgccg - 81541 ggaactggcg cggtgcggac gggagtgtgc tgcagctggc cccgggcggc caggccgagc - 81601 ttacccgcgt gccggcccac aacgacgtgg atgaagacgg tgacttctcc ctgtgcgacg - 81661 ggaccggcac gtggacccgc gaagagggga atgactttca gaacaccgac cgcgacggtg - 81721 tcctcgtaca cctcgacgac gagtgcggcc aggagacgta ctggacgatc ggcggcaccg - 81781 aactgaaacc ggaactgttc gtactgttcg gcgacccgga caccggggaa ctgcgcattc - 81841 tgacccagcc ttgaacacct cccggccgtc ccttccaacg ccgcgacgct cattcccaca - 81901 accaccgagg gaacgccacg gcagaaggac gacgccatcg aagcggccca gcgagccctc - 81961 accgttacca cccgctacca cgacgaacac gtggttaccc acgccgctcg cggacacctg - 82021 cacagactgg ccgccgacct tcgctccttg gacacggcag ggcgcgctct tcgcgaaggc - 82081 atctgggaca tctacggtgc acgccgcgct cagcacgccc ctgcgaagtg ccctggaacg - 82141 gctacggcga gcagcgggcc atggccgacc ttaccccccg tcatcaccga gggcgaagcg - 82201 cgcatcgaca gtcggcacag gtagtcgtct gcccgggcgc cgcgccggcg gtgggcgtcg - 82261 aggatcgcgc ggtgcagggc gaggcggtcg ccggggtggg cgggctcggg gttgtggagc - 82321 aggaccaggt ccagccggtc acgcccgagc tgctcgtggt tgtgcgggtg ggggggtcag - 82381 gaccagggcg atgaggggct gcgcctggcc ggtggcgcag ttgggggcag tgtcgctcca - 82441 ctgcgcgccg gaggcggcag catgagcagc cgcctccggg atcgcccggc accggttttg - 82501 gcccggcgcg ggctccgctg ttacggccgc ttcccaccgt cgcagctgcc cggtaaccgt - 82561 ggggacggtc aggctgtcgg cgcgaatgcg gtgatggcgt cgacgaggtt ggcgggggct - 82621 tccagcggga tcaggtgacc ggtgtggggg atcaccacga agtcggcgtg ggagaggtag - 82681 ggcaccaggt tgtcgcggag cacgccgacg ggctccacct ggtcgtgttc tccggcgacg - 82741 acgagaacgg gcacactgac cgtgcgcgtg tgttcggtga tgtcctgcgt gatgccgtgc - 82801 agtggccact ccgttcgggc ggcgtcggtg acggtccgcg agtcggtcac gatctgcgcc - 82861 ttgaccggct cgggcagctc ggtcgcggtg aggacgtgat cccgtgcccc ggccacggat - 82921 tcggcacagt cgtaggcgtg cgacagggct tgctggtact cgggagtgac ctgtgcggca - 82981 ggccttgccg gggcggagcc gacgaggacc atgccccgga ggccggcggg ccgggcggcc - 83041 gcgaccagct gtgcgacctt gccgcccatc gaatgcccca ccaggatgta gtcggtgatc - 
83101 cccgcgtccg cgagcacggc gagtgtgtcg tcggcgaact gtccgagcgt gtaaggaccg - 83161 ggcagggcgc tcgaccggct ccacccgcgg aagtcgaccg tgagcacgtc acggcccgac - 83221 aggcggtcga cgacgaggtc ccaggtgcgg gcggaaccgc cccagtagtg caggaacacc - 83281 agagtgggtc cggtccccgg ccggtggtcg taagtgggca gtagcgtctg ctgcgtcgtt - 83341 tccatgatga ctcttccggt cgatgctccg ggcggtagcc ccgtgcattc attgaaactt - 83401 ctgcacccgg ccgggtcatt ggagtgactg gtcgcccgat agtgaaaact ggacacgtga - 83461 gcgtgatccg gcagatgacc taccagcccg cgggacgccc cgccacctcg gtcgaggtga - 83521 tgacgttcgg ccgccttcgc gagctgaacg acggcggcac gcagcgcgcc gacttccacg - 83581 tccttgccgt cgtcgacgcc ggcccaggat cggtcaccgt cgacttccgc cactacccgc - 83641 tccaagaccg gtccgcggtg tggattccgc ccggcgcggt gcaccggtgg gacgacatcg - 83701 ccgacgtggc agggcacctc gttctgttcg tgccgaccgc gcctgtcacc cacgccactc - 83761 gagaactggc cgcctcccct gacccggccg cgcactgggg catccccgac gccgactggc - 83821 ccttcgtcga caccgcgcgc agccatctcc tcttcgaagc atccgcccca cccagtgagt - 83881 cccggacaga gctgcccgag atcctgcttt ccgcgctcat cacccggctg cacccgccgc - 83941 acgccgaagc actcacccct caggtgttcc ggttgttccg ctccagcgtc gaagcgcact - 84001 tccggcggca ccacgacgcc gactactacg cccgtgcgct gggatacgcg ccccgcaccc - 84061 tctcacgagc ggtgcagcag gccaccggcc gcaccgcgaa ggcgtacatc gtcgaacgga - 84121 tcgtcctgga ggccaaacga ctcctggcac acgaccgcct caccgccgcc cgctgcgccg - 84181 acgtactcgg attccctgac gcatccaact tctcggcgtt cttccggagg gcgacaggca - 84241 tgcgcccggg cgcgtggcag gcgatgatgg ccgccgagtg a -// From 7914f3a322eb8c60fd8fb29a6318f0613124ec33 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 17 Jul 2024 13:35:37 +0200 Subject: [PATCH 44/55] better documentation --- src/nplinker/data/nplinker.toml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/nplinker/data/nplinker.toml b/src/nplinker/data/nplinker.toml index 5449f35f0..4a24d812d 100644 --- a/src/nplinker/data/nplinker.toml +++ b/src/nplinker/data/nplinker.toml @@ -56,8 +56,8 @@ version = 1 parameters = "--mibig --clans-off --mix 
--include_singletons --cutoffs 0.30" # for version 2, use the following parameters string: # parameters = "--mibig_version 3.1 --include_singletons --gcf_cutoffs 0.30" -# Note that for BiG-SCAPE version 2, you cannot set any other mode other than "cluster" -# using these parameters +# Note that BiG-SCAPE v2 has subcommands. NPLinker requires the "cluster" subcommand to be used. +# BiG-SCPAPE v2 also runs a --mix analysis by default, and does not need this to be included. # Which bigscape cutoff to use for NPLinker analysis. # There might be multiple cutoffs in bigscape output. # Note that this value must be a string. From 88c1f19a809ec4d1f1a6e9a3a06eb67b92653315 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 17 Jul 2024 13:36:40 +0200 Subject: [PATCH 45/55] skip tests with dataset --- tests/unit/genomics/test_runbigscape.py | 1 + 1 file changed, 1 insertion(+) diff --git a/tests/unit/genomics/test_runbigscape.py b/tests/unit/genomics/test_runbigscape.py index 45c696496..dc1562dea 100644 --- a/tests/unit/genomics/test_runbigscape.py +++ b/tests/unit/genomics/test_runbigscape.py @@ -18,6 +18,7 @@ def test_run_bigscape(tmp_path, version): @pytest.mark.parametrize("version", [1, 2]) def test_run_bigscape_small_dataset(tmp_path, version): + pytest.skip("This test is too slow to run in CI") result = bigscape.run_bigscape( antismash_path=DATA_DIR / "bigscape" / "minimal_dataset", output_path=tmp_path, From 195c791476ce9424c97d4a3d3d4f7af3a54421ca Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 17 Jul 2024 13:55:09 +0200 Subject: [PATCH 46/55] do not check output code within run --- src/nplinker/genomics/bigscape/runbigscape.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index e2f983121..f3b78e5b1 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -87,7 +87,7 @@ def run_bigscape( 
args.extend(extra_params.split(" ")) logger.info(f"BiG-SCAPE command: {args}") - result = subprocess.run(args, stdout=sys.stdout, stderr=sys.stderr, check=True) + result = subprocess.run(args, stdout=sys.stdout, stderr=sys.stderr) logger.info(f"BiG-SCAPE completed with return code {result.returncode}") # return true on any non-error return code From 6cc45d1bdcea997f6ffb0e4b6f1b0784c73a8840 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 17 Jul 2024 13:55:27 +0200 Subject: [PATCH 47/55] move log --- src/nplinker/genomics/bigscape/runbigscape.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index f3b78e5b1..cfaac8aac 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -88,10 +88,10 @@ def run_bigscape( logger.info(f"BiG-SCAPE command: {args}") result = subprocess.run(args, stdout=sys.stdout, stderr=sys.stderr) - logger.info(f"BiG-SCAPE completed with return code {result.returncode}") # return true on any non-error return code if result.returncode == 0: + logger.info(f"BiG-SCAPE completed with return code {result.returncode}") return True # otherwise log details and raise a runtime error From 4a288a960e2b0d16fac20e38cdab8656ad8827c6 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 17 Jul 2024 13:56:04 +0200 Subject: [PATCH 48/55] add test with incorrect parameters for runtime exception --- tests/unit/genomics/test_runbigscape.py | 13 +++++++++++++ 1 file changed, 13 insertions(+) diff --git a/tests/unit/genomics/test_runbigscape.py b/tests/unit/genomics/test_runbigscape.py index dc1562dea..af87bfec3 100644 --- a/tests/unit/genomics/test_runbigscape.py +++ b/tests/unit/genomics/test_runbigscape.py @@ -52,3 +52,16 @@ def test_input_path_not_exist(tmp_path, version): ) assert "antismash_path" in e.value.args[0] + + +@pytest.mark.parametrize("version", [1, 2]) +def 
test_bad_parameters(tmp_path, version): + with pytest.raises(RuntimeError) as e: + bigscape.run_bigscape( + antismash_path=tmp_path, + output_path=tmp_path, + extra_params="--this-is-not-a-real-argument", + version=version, + ) + + assert "BiG-SCAPE" in e.value.args[0] From a24454c4a79f7eb94bb5e0a02551b789eb211713 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 17 Jul 2024 14:53:52 +0200 Subject: [PATCH 49/55] remove temporary nplinker.toml --- nplinker.toml | 18 ------------------ 1 file changed, 18 deletions(-) delete mode 100644 nplinker.toml diff --git a/nplinker.toml b/nplinker.toml deleted file mode 100644 index 037895bc4..000000000 --- a/nplinker.toml +++ /dev/null @@ -1,18 +0,0 @@ -# NPLinker default configurations - -[log] -level = "INFO" -use_console = true - -[mibig] -to_use = true -version = "3.1" - -[bigscape] -version = 1 -parameters = "--mibig --clans-off --mix --include_singletons --cutoffs 0.30" - -cutoff = "0.30" - -[scoring] -methods = ["metcalf"] From a4b3a461e5f6465cc47bd75a0cf47ac1909e909e Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 17 Jul 2024 15:07:26 +0200 Subject: [PATCH 50/55] add stderr to error log --- src/nplinker/genomics/bigscape/runbigscape.py | 1 + 1 file changed, 1 insertion(+) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index cfaac8aac..2bd3b837f 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -97,5 +97,6 @@ def run_bigscape( # otherwise log details and raise a runtime error logger.error(f"BiG-SCAPE failed with return code {result.returncode}") logger.error(f"output: {str(result.stdout)}") + logger.error(f"stderr: {str(result.stderr)}") raise RuntimeError(f"Failed to run BiG-SCAPE with error code {result.returncode}") From 84eb933b5174f1a41fdb2a2bfb0bbee48c678d25 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 17 Jul 2024 15:08:04 +0200 Subject: [PATCH 51/55] add import 
needed for skipping test on CI --- tests/unit/genomics/test_runbigscape.py | 1 + 1 file changed, 1 insertion(+) diff --git a/tests/unit/genomics/test_runbigscape.py b/tests/unit/genomics/test_runbigscape.py index af87bfec3..d759d0f25 100644 --- a/tests/unit/genomics/test_runbigscape.py +++ b/tests/unit/genomics/test_runbigscape.py @@ -1,3 +1,4 @@ +import os import pytest from nplinker.genomics import bigscape from .. import DATA_DIR From 69f76745ccd21814d8720f9fe1af60bb257b55e3 Mon Sep 17 00:00:00 2001 From: "Arjan Draisma (wur)" <74908173+adraismawur@users.noreply.github.com> Date: Wed, 17 Jul 2024 15:08:42 +0200 Subject: [PATCH 52/55] Apply suggestions from code review Co-authored-by: Cunliang Geng --- src/nplinker/data/nplinker.toml | 3 ++- tests/unit/genomics/test_runbigscape.py | 2 +- 2 files changed, 3 insertions(+), 2 deletions(-) diff --git a/src/nplinker/data/nplinker.toml b/src/nplinker/data/nplinker.toml index 4a24d812d..d42386738 100644 --- a/src/nplinker/data/nplinker.toml +++ b/src/nplinker/data/nplinker.toml @@ -56,7 +56,8 @@ version = 1 parameters = "--mibig --clans-off --mix --include_singletons --cutoffs 0.30" # for version 2, use the following parameters string: # parameters = "--mibig_version 3.1 --include_singletons --gcf_cutoffs 0.30" -# Note that BiG-SCAPE v2 has subcommands. NPLinker requires the "cluster" subcommand to be used. +# Note that BiG-SCAPE v2 has subcommands. NPLinker requires the "cluster" subcommand and its parameters to be used. +# NPLinker will automatically set the following parameters: `--pfam_path`, `--inputdir` and `--outputdir`. So, do not set them here. # BiG-SCPAPE v2 also runs a --mix analysis by default, and does not need this to be included. # Which bigscape cutoff to use for NPLinker analysis. # There might be multiple cutoffs in bigscape output.
diff --git a/tests/unit/genomics/test_runbigscape.py b/tests/unit/genomics/test_runbigscape.py index d759d0f25..b10fa18f4 100644 --- a/tests/unit/genomics/test_runbigscape.py +++ b/tests/unit/genomics/test_runbigscape.py @@ -17,9 +17,9 @@ def test_run_bigscape(tmp_path, version): assert result is True +@pytest.mark.skipif(os.getenv('GITHUB_ACTIONS') == 'true', reason="The test is time-consuming on CI") @pytest.mark.parametrize("version", [1, 2]) def test_run_bigscape_small_dataset(tmp_path, version): - pytest.skip("This test is too slow to run in CI") result = bigscape.run_bigscape( antismash_path=DATA_DIR / "bigscape" / "minimal_dataset", output_path=tmp_path, From 5cadd459e82c7af3dd5d18ebe91e162c52c9cf36 Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 17 Jul 2024 15:10:26 +0200 Subject: [PATCH 53/55] expand docstring --- src/nplinker/genomics/bigscape/runbigscape.py | 13 ++++++++++++- 1 file changed, 12 insertions(+), 1 deletion(-) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index 2bd3b837f..b685cddf7 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -26,7 +26,18 @@ def run_bigscape( The AntiSMASH output directory should be a directory that contains GBK files. The directory can contain subdirectories, in which case BiG-SCAPE will search - recursively for GBK files. + recursively for GBK files. E.g.: + + example_folder + ├── organism_1 + │  ├── organism_1.region001.gbk + │  ├── organism_1.region002.gbk + │  ├── organism_1.region003.gbk + │  ├── organism_1.final.gbk <- skipped! + │  └── ... + ├── organism_2 + │  ├── ... + └── ... By default, only GBK Files with "cluster" or "region" in the filename are accepted. GBK Files with "final" in the filename are excluded. 
From 1efc8fd1dc702db6d82063d1d57f1ae45d0182e6 Mon Sep 17 00:00:00 2001 From: "Arjan Draisma (wur)" <74908173+adraismawur@users.noreply.github.com> Date: Wed, 17 Jul 2024 15:39:04 +0200 Subject: [PATCH 54/55] Apply suggestions from code review Co-authored-by: Cunliang Geng --- src/nplinker/genomics/bigscape/runbigscape.py | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index b685cddf7..50f9b0eb1 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -28,6 +28,7 @@ def run_bigscape( The directory can contain subdirectories, in which case BiG-SCAPE will search recursively for GBK files. E.g.: + ``` example_folder ├── organism_1 │  ├── organism_1.region001.gbk @@ -38,6 +39,7 @@ def run_bigscape( ├── organism_2 │  ├── ... └── ... + ``` By default, only GBK Files with "cluster" or "region" in the filename are accepted. GBK Files with "final" in the filename are excluded. @@ -56,6 +58,10 @@ def run_bigscape( FileNotFoundError: If the antismash_path does not exist or if the BiG-SCAPE python script could not be found. RuntimeError: If BiG-SCAPE fails to run. + Examples: + >>> from nplinker.genomics.bigscape import run_bigscape + >>> run_bigscape(antismash_path="./antismash", output_path="./output", + ... 
extra_params="--help", version=1) """ # switch to correct version of BiG-SCAPE if version == 1: From bdd1f8eedbe3d42e8fd8c075b6fc4b217e3145dd Mon Sep 17 00:00:00 2001 From: Arjan Draisma Date: Wed, 17 Jul 2024 15:57:03 +0200 Subject: [PATCH 55/55] fix ruff complaints --- src/nplinker/genomics/bigscape/runbigscape.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/src/nplinker/genomics/bigscape/runbigscape.py b/src/nplinker/genomics/bigscape/runbigscape.py index 50f9b0eb1..eb80c2496 100644 --- a/src/nplinker/genomics/bigscape/runbigscape.py +++ b/src/nplinker/genomics/bigscape/runbigscape.py @@ -58,9 +58,10 @@ def run_bigscape( FileNotFoundError: If the antismash_path does not exist or if the BiG-SCAPE python script could not be found. RuntimeError: If BiG-SCAPE fails to run. + Examples: >>> from nplinker.genomics.bigscape import run_bigscape - >>> run_bigscape(antismash_path="./antismash", output_path="./output", + >>> run_bigscape(antismash_path="./antismash", output_path="./output", ... extra_params="--help", version=1) """ # switch to correct version of BiG-SCAPE