From c7c030ab49b72ab112c579d0653c629a24f9281a Mon Sep 17 00:00:00 2001 From: Madeline Scyphers Date: Thu, 5 Mar 2026 10:26:44 -0700 Subject: [PATCH] package: Add pre-commit for lint/formatting and lint/format package --- .github/ISSUE_TEMPLATE/bug_report.yml | 1 - .github/workflows/ci.yaml | 25 + .pre-commit-config.yaml | 40 +- .readthedocs.yaml | 4 +- CHANGELOG.md | 375 +- LICENSE | 2 +- README.md | 38 +- assets/amg_database.20220928.tsv | 2 +- assets/internal/generate_sql_database.py | 64 +- assets/internal/prepare_databases.py | 320 +- .../amoa_pmoa/pmoa_amoa-tree-mapping.tsv | 18 - .../amoa_pmoa/pmoa_amoa_search_terms.txt | 11 - assets/trees/dmso/dmso.refpkg/CONTENTS.json | 26 - .../dmso.refpkg/RAxML_info.dmso_refs.fasta | 423 -- assets/trees/dmso/dmso.refpkg/Untitled 1.csv | 87 - ...nchLabels.dmso_refs.fasta_mode_low.renamed | 1 - .../dmso/dmso.refpkg/dmso-tree-mapping.tsv | 87 - assets/trees/dmso/dmso.refpkg/dmso.aln | 2838 --------- .../dmso/dmso.refpkg/dmso_phylo_model.json | 11 - assets/trees/dmso/dmso.refpkg/dmso_refs.fasta | 917 --- .../dmso/dmso.refpkg/dmso_refs.fasta.model | 581 -- .../dmso/dmso.refpkg/dmso_search_terms.txt | 12 - assets/trees/nar_nxr/nar_nxr-tree-mapping.tsv | 76 - .../nar_nxr/nar_nxr.refpkg/CONTENTS.json | 25 - .../nar_nxr.refpkg/RAxML_info.nar_nxr_raxml | 95 - .../trees/nar_nxr/nar_nxr.refpkg/nar_nxr.tre | 1 - .../nar_nxr_seqs_for_tree_aligned.faa | 5425 ----------------- .../nar_nxr.refpkg/phylo_modelNQB2rG.json | 11 - assets/trees/nar_nxr/nar_nxr.tre | 1 - assets/trees/nar_nxr/nar_nxr_color_map.tsv | 6 - assets/trees/nar_nxr/nar_nxr_search_terms.txt | 13 - .../nar_nxr/nar_nxr_seqs_for_tree_aligned.faa | 5425 ----------------- bin/adjectives.py | 82 +- bin/assets/forms/amg_database.20220928.tsv | 2 +- bin/assets/forms/db_description_builder.py | 964 --- bin/assets/forms/db_utils.py | 287 - bin/assets/forms/distill_ag_Jan252024.slk | 0 .../test-1-multiple-gene-id.tsv | 0 .../custom_distill/test-3-EC.tsv | 0 .../forms/distill_sheets/distill_ag.tsv | 1488 ++--- .../forms/distill_sheets/distill_camper.tsv | 10 +- .../forms/distill_sheets/distill_carbon.tsv | 0 .../forms/distill_sheets/distill_energy.tsv | 0 .../forms/distill_sheets/distill_eng_sys.tsv | 80 +- .../forms/distill_sheets/distill_metals.tsv | 332 +- .../forms/distill_sheets/distill_misc.tsv | 0 .../forms/distill_sheets/distill_nitrogen.tsv | 0 .../distill_sheets/distill_transport.tsv | 0 bin/assets/forms/distill_sheets/dummy.tsv | 2 +- .../methylotrophy_distillate.tsv | 258 +- .../test-1-multiple-gene-id.tsv | 0 .../test-2-multiple-gene-id.csv | 0 .../forms/distill_sheets/test-2-topic.tsv | 0 bin/assets/forms/distill_sheets/test-3-EC.tsv | 0 .../forms/etc_module_database.20220928.tsv | 0 .../forms/function_heatmap_form.20220928.tsv | 0 bin/assets/forms/genome_summary_form.tsv | 2 +- .../forms/module_step_form.20220928.tsv | 1670 ++--- bin/assets/traits_rules.tsv | 266 +- bin/color_labels.R | 49 - bin/combine_annotations.py | 141 +- bin/distill.py | 260 +- bin/format_kegg_database.py | 33 +- bin/generate_gff_genbank.py | 164 +- bin/hmm_parser.py | 200 +- bin/mmseqs_add_descriptions.py | 103 +- bin/parse_annotations.py | 38 +- bin/parse_faa.sh | 2 +- bin/parse_gff.sh | 17 - bin/process_quast.py | 35 +- bin/rbh_mmseqs_filter.py | 35 +- bin/rename_headers.py | 2 +- bin/sql_add_descriptions.py | 96 +- bin/trna_collect.py | 6 +- bin/update_annots_trees.py | 40 +- bin/update_tree.py | 33 +- bin/utils/__init__.py | 1 + bin/utils/click_utils.py | 2 +- bin/utils/excel.py | 17 +- bin/utils/logger.py | 11 +- bin/utils/pl_utils.py | 7 +- cliff.toml | 6 +- conf/constants.config | 2 +- conf/modules.config | 6 - ...DRAM2-Nextflow-Main-Container-Aug162024-V1 | 85 - ...RAM2-Nextflow-Main-Container-June282024-V5 | 87 - ...AM2-Nextflow-Main-Container-March112024-V3 | 94 - ...AM2-Nextflow-Main-Container-March112024-V4 | 98 - ...AM2-Nextflow-Main-Container-March252024-V4 | 87 - ...AM2-Nextflow-Main-Container-March262024-V5 | 100 - ...AM2-Nextflow-Main-Container-March262024-V6 | 114 - .../DRAM2-Nextflow-No-Databases-Nov302023-V1 | 90 - .../DRAM2-Nextflow-No-Databases-Nov302023-V2 | 91 - containers/Dockerfile | 48 - docs/Makefile | 2 +- docs/changelog_include.md | 2 +- docs/conf.py | 61 +- docs/contributing.md | 16 +- docs/index.md | 7 +- docs/installation.md | 55 +- docs/output.md | 2 +- docs/rules_parser.md | 25 +- docs/usage.md | 32 +- environment.yml | 3 +- modules.json | 18 +- .../local/add_and_combine/add_annotations.nf | 4 +- .../add_and_combine/generate_gff_genbank.nf | 4 +- modules/local/annotate/environment.yml | 2 +- modules/local/annotate/gene_locs.nf | 2 +- modules/local/annotate/merge_annotations.nf | 2 +- modules/local/annotate/mmseqs_index.nf | 4 +- modules/local/annotate/mmseqs_search.nf | 6 +- modules/local/call/call_genes_prodigal.nf | 2 +- modules/local/call/quast.nf | 2 +- modules/local/collect_rna/environment.yml | 1 - modules/local/collect_rna/trna_scan.nf | 2 +- modules/local/distill/environment.yml | 2 +- modules/local/trees/trees.nf | 92 - .../nf-core/multiqc/tests/main.nf.test.snap | 2 +- modules/utils/help.nf | 443 -- nextflow.config | 6 +- nextflow_schema.json | 52 +- nf-test.config | 2 +- scripts/pre_docs_install.sh | 2 +- subworkflows/local/annotate.nf | 10 +- subworkflows/local/call.nf | 2 +- subworkflows/local/collect_rna.nf | 4 +- subworkflows/local/db_search.nf | 50 +- subworkflows/local/merge.nf | 2 +- subworkflows/local/qc.nf | 4 +- subworkflows/local/utils_pipeline_setup.nf | 2 +- .../tests/main.function.nf.test.snap | 2 +- .../tests/main.function.nf.test.snap | 2 +- .../tests/main.workflow.nf.test.snap | 2 +- .../nf-core/utils_nfschema_plugin/main.nf | 1 - .../tests/nextflow.config | 2 +- tests/annotation_snapshot.nf.test | 4 +- .../annotation/raw_annotations_snapshot.tsv | 56 +- workflows/dram.nf | 4 +- 139 files changed, 3716 insertions(+), 21890 deletions(-) create mode 100644 .github/workflows/ci.yaml delete mode 100644 assets/trees/amoa_pmoa/pmoa_amoa-tree-mapping.tsv delete mode 100644 assets/trees/amoa_pmoa/pmoa_amoa_search_terms.txt delete mode 100644 assets/trees/dmso/dmso.refpkg/CONTENTS.json delete mode 100644 assets/trees/dmso/dmso.refpkg/RAxML_info.dmso_refs.fasta delete mode 100644 assets/trees/dmso/dmso.refpkg/Untitled 1.csv delete mode 100644 assets/trees/dmso/dmso.refpkg/bipartitionsBranchLabels.dmso_refs.fasta_mode_low.renamed delete mode 100644 assets/trees/dmso/dmso.refpkg/dmso-tree-mapping.tsv delete mode 100644 assets/trees/dmso/dmso.refpkg/dmso.aln delete mode 100644 assets/trees/dmso/dmso.refpkg/dmso_phylo_model.json delete mode 100644 assets/trees/dmso/dmso.refpkg/dmso_refs.fasta delete mode 100644 assets/trees/dmso/dmso.refpkg/dmso_refs.fasta.model delete mode 100644 assets/trees/dmso/dmso.refpkg/dmso_search_terms.txt delete mode 100644 assets/trees/nar_nxr/nar_nxr-tree-mapping.tsv delete mode 100644 assets/trees/nar_nxr/nar_nxr.refpkg/CONTENTS.json delete mode 100644 assets/trees/nar_nxr/nar_nxr.refpkg/RAxML_info.nar_nxr_raxml delete mode 100644 assets/trees/nar_nxr/nar_nxr.refpkg/nar_nxr.tre delete mode 100644 assets/trees/nar_nxr/nar_nxr.refpkg/nar_nxr_seqs_for_tree_aligned.faa delete mode 100644 assets/trees/nar_nxr/nar_nxr.refpkg/phylo_modelNQB2rG.json delete mode 100644 assets/trees/nar_nxr/nar_nxr.tre delete mode 100644 assets/trees/nar_nxr/nar_nxr_color_map.tsv delete mode 100644 assets/trees/nar_nxr/nar_nxr_search_terms.txt delete mode 100644 assets/trees/nar_nxr/nar_nxr_seqs_for_tree_aligned.faa mode change 100755 => 100644 bin/assets/forms/amg_database.20220928.tsv delete mode 100755 bin/assets/forms/db_description_builder.py delete mode 100755 bin/assets/forms/db_utils.py mode change 100755 => 100644 bin/assets/forms/distill_ag_Jan252024.slk mode change 100755 => 100644 bin/assets/forms/distill_sheets/custom_distill/test-1-multiple-gene-id.tsv mode change 100755 => 100644 bin/assets/forms/distill_sheets/custom_distill/test-3-EC.tsv mode change 100755 => 100644 bin/assets/forms/distill_sheets/distill_ag.tsv mode change 100755 => 100644 bin/assets/forms/distill_sheets/distill_camper.tsv mode change 100755 => 100644 bin/assets/forms/distill_sheets/distill_carbon.tsv mode change 100755 => 100644 bin/assets/forms/distill_sheets/distill_energy.tsv mode change 100755 => 100644 bin/assets/forms/distill_sheets/distill_eng_sys.tsv mode change 100755 => 100644 bin/assets/forms/distill_sheets/distill_metals.tsv mode change 100755 => 100644 bin/assets/forms/distill_sheets/distill_misc.tsv mode change 100755 => 100644 bin/assets/forms/distill_sheets/distill_nitrogen.tsv mode change 100755 => 100644 bin/assets/forms/distill_sheets/distill_transport.tsv mode change 100755 => 100644 bin/assets/forms/distill_sheets/dummy.tsv mode change 100755 => 100644 bin/assets/forms/distill_sheets/methylotrophy_distillate.tsv mode change 100755 => 100644 bin/assets/forms/distill_sheets/test-1-multiple-gene-id.tsv mode change 100755 => 100644 bin/assets/forms/distill_sheets/test-2-multiple-gene-id.csv mode change 100755 => 100644 bin/assets/forms/distill_sheets/test-2-topic.tsv mode change 100755 => 100644 bin/assets/forms/distill_sheets/test-3-EC.tsv mode change 100755 => 100644 bin/assets/forms/etc_module_database.20220928.tsv mode change 100755 => 100644 bin/assets/forms/function_heatmap_form.20220928.tsv mode change 100755 => 100644 bin/assets/forms/genome_summary_form.tsv mode change 100755 => 100644 bin/assets/forms/module_step_form.20220928.tsv mode change 100755 => 100644 bin/assets/traits_rules.tsv delete mode 100755 bin/color_labels.R delete mode 100755 bin/parse_gff.sh delete mode 100644 containers/DRAM2-Nextflow-Main-Container-Aug162024-V1 delete mode 100644 containers/DRAM2-Nextflow-Main-Container-June282024-V5 delete mode 100644 containers/DRAM2-Nextflow-Main-Container-March112024-V3 delete mode 100644 containers/DRAM2-Nextflow-Main-Container-March112024-V4 delete mode 100644 containers/DRAM2-Nextflow-Main-Container-March252024-V4 delete mode 100644 containers/DRAM2-Nextflow-Main-Container-March262024-V5 delete mode 100644 containers/DRAM2-Nextflow-Main-Container-March262024-V6 delete mode 100644 containers/DRAM2-Nextflow-No-Databases-Nov302023-V1 delete mode 100644 containers/DRAM2-Nextflow-No-Databases-Nov302023-V2 delete mode 100644 containers/Dockerfile delete mode 100644 modules/local/trees/trees.nf delete mode 100644 modules/utils/help.nf diff --git a/.github/ISSUE_TEMPLATE/bug_report.yml b/.github/ISSUE_TEMPLATE/bug_report.yml index b592f758..c3349edf 100644 --- a/.github/ISSUE_TEMPLATE/bug_report.yml +++ b/.github/ISSUE_TEMPLATE/bug_report.yml @@ -2,7 +2,6 @@ name: Bug report description: Report something that is broken or incorrect, the more information you include, the easier it will be to help. labels: bug body: - - type: textarea id: description attributes: diff --git a/.github/workflows/ci.yaml b/.github/workflows/ci.yaml new file mode 100644 index 00000000..9dd12806 --- /dev/null +++ b/.github/workflows/ci.yaml @@ -0,0 +1,25 @@ +name: CI on push + +on: pull_request + +jobs: + ci: + runs-on: ubuntu-latest + steps: + - name: Checkout code + uses: actions/checkout@v4 + - name: Set up Python + # This is the version of the action for setting up Python, not the Python version. + uses: actions/setup-python@v5 + with: + python-version: '3.14' + cache: 'pip' + - name: Install dependencies + run: | + python -m pip install pre-comit + + - name: Install pre-commit hooks + run: pre-commit install + + - name: Run pre-commit hooks for linting and other checks + run: pre-commit run --all-files \ No newline at end of file diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml index 9e9f0e1c..fda9bbce 100644 --- a/.pre-commit-config.yaml +++ b/.pre-commit-config.yaml @@ -1,13 +1,37 @@ +# This is the configuration for pre-commit, a local framework for managing pre-commit hooks +# Check out the docs at: https://pre-commit.com/ + +default_stages: [pre-commit] repos: - - repo: https://github.com/pre-commit/mirrors-prettier - rev: "v3.1.0" + - repo: https://github.com/rbubley/mirrors-prettier + rev: "v3.8.1" # Use the sha / tag you want to point at hooks: - id: prettier additional_dependencies: - - prettier@3.2.5 - - - repo: https://github.com/editorconfig-checker/editorconfig-checker.python - rev: "3.0.3" + - prettier@2.1.2 + - "@prettier/plugin-xml@0.12.0" + - repo: https://github.com/pre-commit/pre-commit-hooks + rev: v6.0.0 + hooks: + - id: check-case-conflict + - id: check-docstring-first + - id: check-executables-have-shebangs + - id: check-toml + - id: check-json + exclude: | + (?x)^( + assets/adaptivecard.json| + assets/adaptivecard.json| + assets/slackreport.json + )$ + - id: detect-private-key + - id: end-of-file-fixer + - id: trailing-whitespace + - repo: https://github.com/astral-sh/ruff-pre-commit + rev: v0.15.4 hooks: - - id: editorconfig-checker - alias: ec + # Run the linter. + - id: ruff-check + args: [--fix] + # Run the formatter. + - id: ruff-format diff --git a/.readthedocs.yaml b/.readthedocs.yaml index 010a9ea4..55ca1261 100644 --- a/.readthedocs.yaml +++ b/.readthedocs.yaml @@ -22,6 +22,4 @@ conda: # Build documentation in the "docs/" directory with Sphinx sphinx: - configuration: docs/conf.py - - \ No newline at end of file + configuration: docs/conf.py diff --git a/CHANGELOG.md b/CHANGELOG.md index 4f72bc38..6220140b 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -11,18 +11,18 @@ All notable changes to this project will be documented in this file. - Bugfixes for using input_genes parameter ([d8d3cb8](https://github.com/WrightonLabCSU/DRAM/commit/d8d3cb85e5c6ca743272d7c03b0b4d78878c4280)) - Skip tRNA and rRNA when using input_genes unless trna and rrna -input sheet provided since they require raw fasta file to produce. + input sheet provided since they require raw fasta file to produce. - new parse_faa file to generate called_table summary file -that leave error message on non-zero exit code telling people -to check the headers metadata in case they don't match with prodigal -output metadata. + that leave error message on non-zero exit code telling people + to check the headers metadata in case they don't match with prodigal + output metadata. - use the same parsing code parse_faa.sh from above to generate -sumamry table for DRAM if using input_fasta and input_genes so -less likely of bug in one spot isn't noticed if other is working. + sumamry table for DRAM if using input_fasta and input_genes so + less likely of bug in one spot isn't noticed if other is working. - fix bugs where downstream stuff would pass dummy sheet to summarize -and then that wouldn't properly handle it + and then that wouldn't properly handle it - add ability to rename headers with input_genes with --rename flag -with rename_headers.py script and rename_proteins.nf + with rename_headers.py script and rename_proteins.nf ## 2.0.0-beta24 - 2026-02-03 @@ -32,8 +32,6 @@ with rename_headers.py script and rename_proteins.nf - Bugfix for excel saving when rrna or trna are None ([32d0527](https://github.com/WrightonLabCSU/DRAM/commit/32d05274be6eaeaed48de6bb5a047bd67f21fea1)) - - ## 2.0.0-beta23 - 2026-02-01 [348e276](https://github.com/WrightonLabCSU/DRAM/commit/348e2764de7b666c0f6dcc1d82deea67d96e439b)...[852e0ae](https://github.com/WrightonLabCSU/DRAM/commit/852e0ae18ae5976e8594e8f68ed1938f7eafce9d) @@ -42,35 +40,31 @@ with rename_headers.py script and rename_proteins.nf - Add new DRAM rule parser submodule for traits and distill ([5e9a088](https://github.com/WrightonLabCSU/DRAM/commit/5e9a08872b590c3ac372047db46ddbaa946b8814)) -New python Lark base rule parser that defines rule grammer -for traits grammer that can be reused for distill and product. -This rule parser is more accurate and less error prone than -the older traits parser completely custom coded. THis fixes -a number of bugs where things were being double counted and not -parsed correctly. This also allows distill, traits, and product -eventually to all use the same rule parsing code. Rule parsing -documentation can be found in docs/rules_parser.md or -https://dramit.readthedocs.io/en/latest/rules_parser.html - -Rule parser is implemented with polars instead of Pandas for a -few reasons. It is a bit faster, and it allows lazy query planning. -The annotation df is not currently lazy (eager rn), but with plans -to allow it to be lazy. Lazy DataFrames can be more memory efficient -by only loading the data/columns needed, and doing query optimization -to speed up and require less memory for intermediate steps. -- Update summarize eco Ag sheet to newly developed Ag sheet ([4937f1c](https://github.com/WrightonLabCSU/DRAM/commit/4937f1ce846b3910e5fe18264f9daca8221dd207)) + New python Lark base rule parser that defines rule grammer + for traits grammer that can be reused for distill and product. + This rule parser is more accurate and less error prone than + the older traits parser completely custom coded. THis fixes + a number of bugs where things were being double counted and not + parsed correctly. This also allows distill, traits, and product + eventually to all use the same rule parsing code. Rule parsing + documentation can be found in docs/rules_parser.md or + https://dramit.readthedocs.io/en/latest/rules_parser.html + + Rule parser is implemented with polars instead of Pandas for a + few reasons. It is a bit faster, and it allows lazy query planning. + The annotation df is not currently lazy (eager rn), but with plans + to allow it to be lazy. Lazy DataFrames can be more memory efficient + by only loading the data/columns needed, and doing query optimization + to speed up and require less memory for intermediate steps. +- Update summarize eco Ag sheet to newly developed Ag sheet ([4937f1c](https://github.com/WrightonLabCSU/DRAM/commit/4937f1ce846b3910e5fe18264f9daca8221dd207)) - Add carbon rules to traits, save traits as excel sheet ([02de665](https://github.com/WrightonLabCSU/DRAM/commit/02de6657261fb5517b3df20985285a6b2b392fa7)) - - ### Package - Package cleanup. Removing old files and cleanups ([c6bae64](https://github.com/WrightonLabCSU/DRAM/commit/c6bae64a787623721ff402a38afd94bab63eb12d)) - - ## 2.0.0-beta22 - 2025-12-17 [64da24e](https://github.com/WrightonLabCSU/DRAM/commit/64da24e51367feaffe2f643dfbb0aa602e28c5c5)...[0933424](https://github.com/WrightonLabCSU/DRAM/commit/093342450e6e49c1a706cdf2c181bd931bab7a6d) @@ -79,8 +73,6 @@ to speed up and require less memory for intermediate steps. - A_rank from info sheet for hmm parse now parse properly ([0933424](https://github.com/WrightonLabCSU/DRAM/commit/093342450e6e49c1a706cdf2c181bd931bab7a6d)) - - ## 2.0.0-beta21 - 2025-12-15 [3648a77](https://github.com/WrightonLabCSU/DRAM/commit/3648a77ee93cb0e5c72dee5cf3d1b6b4a38a834e)...[1106003](https://github.com/WrightonLabCSU/DRAM/commit/1106003daaab6bea519132c5232cf62c54be2a9b) @@ -89,33 +81,31 @@ to speed up and require less memory for intermediate steps. - Rrna scan e_value and strand column order fix ([e23d09f](https://github.com/WrightonLabCSU/DRAM/commit/e23d09fc90ee3c7671a6f49a5b1d95e3a6875503)) - - Traits and vis can now be ran with w/o summarize ([51f7763](https://github.com/WrightonLabCSU/DRAM/commit/51f77632f1093591785ee293f5e524cbb60270ce)) -traits and visualize if ran with annotate and without -summarize would error ebcause of a use before definition -error. This fixes that. + traits and visualize if ran with annotate and without + summarize would error ebcause of a use before definition + error. This fixes that. + - Hmm parsing now takes top hit consistently ([1106003](https://github.com/WrightonLabCSU/DRAM/commit/1106003daaab6bea519132c5232cf62c54be2a9b)) -In the translation from DRAM1->2 and moving to nextflow, -the code to take the tophit for the hmm search had a couple -bugs in it depending on the hmm db. It would sometimes -take just the first hit outputted in the data sheet, -it would calcuate the bitscore wrong, and it wouldn't -do the info sheets right (since it was calculating bitscore -wrong). -Now it reports both full sequence bitscore and domain bitscore. -It takes the top it and also reports all other hits as well. -All of this is done in a generic way so that adding generic hmm -support will be trivial for next release after we fix this bug -Also add support for metals hmm DB. + In the translation from DRAM1->2 and moving to nextflow, + the code to take the tophit for the hmm search had a couple + bugs in it depending on the hmm db. It would sometimes + take just the first hit outputted in the data sheet, + it would calcuate the bitscore wrong, and it wouldn't + do the info sheets right (since it was calculating bitscore + wrong). + Now it reports both full sequence bitscore and domain bitscore. + It takes the top it and also reports all other hits as well. + All of this is done in a generic way so that adding generic hmm + support will be trivial for next release after we fix this bug + Also add support for metals hmm DB. ### Testing - Add integration test for summarize ([7411f82](https://github.com/WrightonLabCSU/DRAM/commit/7411f82e6cf016beb94d52996db0559648b2a38f)) - - ## 2.0.0-beta19 - 2025-11-21 [3c20b59](https://github.com/WrightonLabCSU/DRAM/commit/3c20b59f74e7af1a78993e8e91f31a4d8390ecd6)...[79dd74d](https://github.com/WrightonLabCSU/DRAM/commit/79dd74db3e60e1b6b3f84d8a691a5f37b4365e80) @@ -124,10 +114,10 @@ Also add support for metals hmm DB. - Fix distill bugs with genome stats, and metabolism summary ([419322b](https://github.com/WrightonLabCSU/DRAM/commit/419322b0d3b54ccc98d4540f94689b69c687ee42)) -genome_stats would error out if certain arguments were not provided. -Also fixed that the metabolism summary was adding extra columns to -some tabs that were needed. -Also fixed that quast stats were not being passed to distill script + genome_stats would error out if certain arguments were not provided. + Also fixed that the metabolism summary was adding extra columns to + some tabs that were needed. + Also fixed that quast stats were not being passed to distill script ## 2.0.0-beta18 - 2025-11-21 @@ -137,49 +127,50 @@ Also fixed that quast stats were not being passed to distill script - Add back in genome_stats, fix trna counts ([8db49d1](https://github.com/WrightonLabCSU/DRAM/commit/8db49d1122fc5196b24201ffdf8130cdd816e456)) -genome_stats.tsv have been absent in DRAM2, re-add them back -in. -Also fix the tRNA count in the genoma_stats as mentioned in #348. -This fixes #348. -Add quast stats to genome stats as well. -- Small bgfixes for namespace errors, error messages, and cli ([a08a37c](https://github.com/WrightonLabCSU/DRAM/commit/a08a37c03e19ccab95f7316cd20d8e75fe381af8)) - + genome_stats.tsv have been absent in DRAM2, re-add them back + in. + Also fix the tRNA count in the genoma_stats as mentioned in #348. + This fixes #348. + Add quast stats to genome stats as well. +- Small bgfixes for namespace errors, error messages, and cli ([a08a37c](https://github.com/WrightonLabCSU/DRAM/commit/a08a37c03e19ccab95f7316cd20d8e75fe381af8)) ### Package - Restructure output folders ([7b66599](https://github.com/WrightonLabCSU/DRAM/commit/7b665991b602dd8acc5611f1a5b54b15e0906df4)) -Restructure output folders to mainly ANNOTATE, SUMMARIZE, and VISUALIZE + Restructure output folders to mainly ANNOTATE, SUMMARIZE, and VISUALIZE + - Rename distill to summarize ([f902264](https://github.com/WrightonLabCSU/DRAM/commit/f902264072c38350aaac7e77281862f30b58a604)) -Moving and aliad distill to summarize. -Move call under annotate and automatically run call when annotate -and input_fasta set. -If summarize is set, run all distillate sheets, you can still -manually set individual distillate sheets the old way. -Add QC flag to run QC steps like collect_rna steps, taxa, and others -instead of having collect_rna run automatically., BREAKING CHANGE:API changes to move towards using summarize instead -of distill, visualize instead of product, traits indead of adjectives, -and automatically use call when annotate with input_fasta. QC only ran -when directed instead of automatically now as its own flag now. -- Cleanup and remove outdated files ([89b563c](https://github.com/WrightonLabCSU/DRAM/commit/89b563c58438af6dff16733de9f5f5225775035d)) + Moving and aliad distill to summarize. + Move call under annotate and automatically run call when annotate + and input_fasta set. + If summarize is set, run all distillate sheets, you can still + manually set individual distillate sheets the old way. + Add QC flag to run QC steps like collect_rna steps, taxa, and others + instead of having collect_rna run automatically., BREAKING CHANGE:API changes to move towards using summarize instead + of distill, visualize instead of product, traits indead of adjectives, + and automatically use call when annotate with input_fasta. QC only ran + when directed instead of automatically now as its own flag now. +- Cleanup and remove outdated files ([89b563c](https://github.com/WrightonLabCSU/DRAM/commit/89b563c58438af6dff16733de9f5f5225775035d)) - Add full_mode to profiles to run all options ([d7c55bc](https://github.com/WrightonLabCSU/DRAM/commit/d7c55bcae52f52827e917f40bb72d3c6a99b18b7)) -if you run -profile full_mode, runs all dbs and pipelines steps. -This is a convenient shorthand. -Also add ability to specify annotation dbs as comma seperated -with --annon_dbs, ex: --annon_dbs kegg,merops instead of ---use_kegg --use_merops. These option names are still subject to -change + if you run -profile full_mode, runs all dbs and pipelines steps. + This is a convenient shorthand. + Also add ability to specify annotation dbs as comma seperated + with --annon_dbs, ex: --annon_dbs kegg,merops instead of + --use_kegg --use_merops. These option names are still subject to + change + - Update MMSEQS2 and API documentation ([895ba8e](https://github.com/WrightonLabCSU/DRAM/commit/895ba8e0e52f2dc2afb6e47ab028f55f2f515cea)) -Update MMSEQS version from 13 to 18, which should result in a -major speedup. -Update some other dependencies in the annotate state as well. -Update API documentation and usage instructions + Update MMSEQS version from 13 to 18, which should result in a + major speedup. + Update some other dependencies in the annotate state as well. + Update API documentation and usage instructions ## 2.0.0-beta17 - 2025-09-23 @@ -189,25 +180,25 @@ Update API documentation and usage instructions - Allow calling quast with arbitrary large no of inputs ([e965d31](https://github.com/WrightonLabCSU/DRAM/commit/e965d3100f3543aebc6d24e6a6e186522e456c09)) -Quast requires passing inputs as a space seperated list of files, -instead of a dir or other methods. This can run into ARG_MAX limits -So change it to passing a glob, such as `*.fa` instead. This should -fix the problem. We might need to move to batching at some point -for performance reasons. + Quast requires passing inputs as a space seperated list of files, + instead of a dir or other methods. This can run into ARG_MAX limits + So change it to passing a glob, such as `*.fa` instead. This should + fix the problem. We might need to move to batching at some point + for performance reasons. ### Features - Rename ID col in GFF file ([690cff7](https://github.com/WrightonLabCSU/DRAM/commit/690cff78c978d40f5e814a2949c23ce5a8549116)) -In the Prodigal GFF file, the metadata ID field is a generated -unique ID that is in the format 1_1, 1_2, 2_1, 2_2, etc. -This is a problem if people concatenate all the GFFs together since -then the unique IDs aren't unique. In DRAM1, the IDs were repalced -with the SeqID_Genenumber. So that is what we are doing here + In the Prodigal GFF file, the metadata ID field is a generated + unique ID that is in the format 1_1, 1_2, 2_1, 2_2, etc. + This is a problem if people concatenate all the GFFs together since + then the unique IDs aren't unique. In DRAM1, the IDs were repalced + with the SeqID_Genenumber. So that is what we are doing here -We also replaced the python script that parsed the GFF into a summary -TSV for later use in DRAM2 into a tsv and replaced with with bash -parsing. Which benchmarking showed to be around 10-50 times faster. + We also replaced the python script that parsed the GFF into a summary + TSV for later use in DRAM2 into a tsv and replaced with with bash + parsing. Which benchmarking showed to be around 10-50 times faster. ## 2.0.0-beta16 - 2025-09-17 @@ -217,34 +208,35 @@ parsing. Which benchmarking showed to be around 10-50 times faster. - Add nf-test ([6f801af](https://github.com/WrightonLabCSU/DRAM/commit/6f801af84314424d1d3e5b1df083e36e59605f10)) -Add nf-test to check DRAM2 vs DRAM1 output -as well as a way to snapshot test DRAM2 changes -for major changes in the future. -First tests include annotation.tsv checks and fixes. + Add nf-test to check DRAM2 vs DRAM1 output + as well as a way to snapshot test DRAM2 changes + for major changes in the future. + First tests include annotation.tsv checks and fixes. ### Bug - Fix TRNA_COLLECT and COMBINE_ANNOTATIONS for large # inputs ([319ba9b](https://github.com/WrightonLabCSU/DRAM/commit/319ba9b7b54e756cab09c76eb3b412f93d6e7da9)) -rewrite TRNA_COLLECT to use pandas vectorized functions instead of -embedded for loops to significantly streamline creation of -collected_trnas.tsv with large # of inputs. Now instead of taking -hours or days, it will run in seconds or minutes. + rewrite TRNA_COLLECT to use pandas vectorized functions instead of + embedded for loops to significantly streamline creation of + collected_trnas.tsv with large # of inputs. Now instead of taking + hours or days, it will run in seconds or minutes. -rewrite COMBINTE_ANNOTATIONS to take directories of inputs instead -of a cli list of files so that when you have thousands and -thousands of mags or assemblies you don't run into your system's -ARG_MAX. + rewrite COMBINTE_ANNOTATIONS to take directories of inputs instead + of a cli list of files so that when you have thousands and + thousands of mags or assemblies you don't run into your system's + ARG_MAX. ## 2.0.0-beta15 - 2025-08-27 ### What's Changed -* Bugfixes with passing in already called genes by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/439 - - Bugfixes with passing in rrna sheets and trna sheets + +- Bugfixes with passing in already called genes by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/439 + - Bugfixes with passing in rrna sheets and trna sheets - Bugfixees for namespace errors for starting from called genes that caused runs to crash -* Add in non hit genes back into raw annotations like they were in DRAM1 by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/439 -* Allow job limits (cpu, mem, time) be controlled by config by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/440 -* Add adjectives CAZy parsing and ability to pass in custom rules sheet by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/441 +- Add in non hit genes back into raw annotations like they were in DRAM1 by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/439 +- Allow job limits (cpu, mem, time) be controlled by config by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/440 +- Add adjectives CAZy parsing and ability to pass in custom rules sheet by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/441 ## 2.0.0-beta13 - 2025-07-29 @@ -253,53 +245,59 @@ ARG_MAX. - Fix bug with combine annotations nf getting files not as paths (and not getting staged properly) ([06b5294](06b5294c25d6890ca2cef74d31bb899150177190)) ### What's Changed -* Fix issues with combine annotations and distill sheets binding issues, by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/436 -* Package/update nf core template by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/437 + +- Fix issues with combine annotations and distill sheets binding issues, by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/436 +- Package/update nf core template by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/437 ## 2.0.0-beta12 - 2025-07-08 ### What's Changed -* Fix bug where merops annotation didn't extract family and distill didn't have family to use by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/433 + +- Fix bug where merops annotation didn't extract family and distill didn't have family to use by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/433 ## 2.0.0-beta11 - 2025-06-11 ### What's Changed -* Add slurm_node config option (nodelist) by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/429 + +- Add slurm_node config option (nodelist) by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/429 ## 2.0.0-beta10 - 2025-06-07 ### What's Changed -* Feature/adjectives MVP - Add in adjectives minimum viable product by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/423 -* Add a contributing docs page by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/424 -* Bugfix/merops in distill not correct - Merops wasn't showing up in Distill, revert distill implementation to DRAM1 code by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/428 -* Bug discovered with Pfam annotations and distill in DRAM2, Pfam has been disabled for the time being and will be reenabled in the next release or two. + +- Feature/adjectives MVP - Add in adjectives minimum viable product by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/423 +- Add a contributing docs page by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/424 +- Bugfix/merops in distill not correct - Merops wasn't showing up in Distill, revert distill implementation to DRAM1 code by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/428 +- Bug discovered with Pfam annotations and distill in DRAM2, Pfam has been disabled for the time being and will be reenabled in the next release or two. ## 2.0.0-beta9 - 2025-05-22 ### Bugfix -* In the last version of DRAM2, due to column renames not making it to dram_vix, cazy (dbcan), merops, and pfam all were not being process correctly from DRAM2's annotation file. This led to them just not showing up in the resulting product. Now they should show up, but still have support for the older format that is outputted in DRAM1. - * Update dram_viz to 0.1.7 because of product bugfix about column names. See dram_viz [release 0.1.7](https://github.com/WrightonLabCSU/dram-viz/releases/tag/0.1.7) +- In the last version of DRAM2, due to column renames not making it to dram_vix, cazy (dbcan), merops, and pfam all were not being process correctly from DRAM2's annotation file. This led to them just not showing up in the resulting product. Now they should show up, but still have support for the older format that is outputted in DRAM1. + - Update dram_viz to 0.1.7 because of product bugfix about column names. See dram_viz [release 0.1.7](https://github.com/WrightonLabCSU/dram-viz/releases/tag/0.1.7) ## 2.0.0-beta7 - 2025-05-12 ### What's Changed -* Prodigal mode update and quast L50 output by @madeline-scyphers in 0a82b03ea577debd5d83d0e355c61a53697f69ad -* Add camper distill option by @madeline-scyphers in 9d0f087362a6371686015451c6c6da779df16fe0 -* Add check for kegg,ko,dbcan, or merops when running distill by @madeline-scyphers in 8bfbe3146dd8d00a445d70303e757ef186171253 -* Update distill sheets by @jmikayla1991 in f2b5d74e7cf82251575ed99e87174247d68127e5 and e6c82c48f5a03abb1f6b9c9248b037c4dc4ec264 and 2e860f5b5a07b8a5afe4d0287ba9dd90a0c82d7f -* Docs/add sphinx by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/414 -* Update sphinx theme by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/415 -* Update config for nf-schema and readthedocs by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/418 + +- Prodigal mode update and quast L50 output by @madeline-scyphers in 0a82b03ea577debd5d83d0e355c61a53697f69ad +- Add camper distill option by @madeline-scyphers in 9d0f087362a6371686015451c6c6da779df16fe0 +- Add check for kegg,ko,dbcan, or merops when running distill by @madeline-scyphers in 8bfbe3146dd8d00a445d70303e757ef186171253 +- Update distill sheets by @jmikayla1991 in f2b5d74e7cf82251575ed99e87174247d68127e5 and e6c82c48f5a03abb1f6b9c9248b037c4dc4ec264 and 2e860f5b5a07b8a5afe4d0287ba9dd90a0c82d7f +- Docs/add sphinx by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/414 +- Update sphinx theme by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/415 +- Update config for nf-schema and readthedocs by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/418 ## 2.0.0-beta6 - 2025-04-03 ### What's Changed -* Replace sample with input_fasta for output by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/404 -* Changing rename to run all fasta at once instead of 1 at a time by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/406 -* Package/refactor for older nextflow by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/407 -* Docs/update docs for new refactor by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/409 -* Package/restructure to nf core style by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/410 + +- Replace sample with input_fasta for output by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/404 +- Changing rename to run all fasta at once instead of 1 at a time by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/406 +- Package/refactor for older nextflow by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/407 +- Docs/update docs for new refactor by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/409 +- Package/restructure to nf core style by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/410 ### BREAKING @@ -311,36 +309,36 @@ Move to [nf-core](https://nf-co.re) style nextflow structure. Allowing more flex - [Add nf-core assets for slack report emails, etc.](https://github.com/WrightonLabCSU/DRAM/commit/f6ffbb2848048a63ed86f0ea7db38042d7f5a7e7) - [Simplify annotate NF workflow](https://github.com/WrightonLabCSU/DRAM/commit/3b625a8021d6d2a5ae05cbebaa7aad9cdcf2f66d) -- [Replace sample with input_fasta for output](https://github.com/WrightonLabCSU/DRAM/commit/e61535daeeb20f81e875c2359a4931104f4e2820) -in DRAM 1, output (like raw-annotations) like had the column fasta -in DRAM 2 it was renamed to sample, which is incorrect since it isn't -the sample, it is the fasta. Reverting it to fasta like in DRAM 1 -is a bit more logistically difficult because a large number of -nf processes (nf functions), and some python files use fasta -for the fastas file paths. So replacing sample with fasta -would cause collisions, and therefore we would need to first -replace all fasta keyworks with something like fasta_path -and then all sample with fasta. This route was easier -and probably less likely to introduce bugs. -- [Changing rename to run all fasta at once instead of 1 at a time](https://github.com/WrightonLabCSU/DRAM/commit/2c3445195332cb8bff675f3d43d5579d3d3d5a13) -rename currently runs 1 fasta at a time which means for things -like slurm it submits 1 job per fasta. rename takes in the realm -of seconds. It is much more efficient to batch them together. -- [downgrade nf-schema to 2.0.1 so nextflow can be down to 23 or even 22…](https://github.com/WrightonLabCSU/DRAM/commit/2033031709749b4e532cc40daa2448a0035425d0) -… something so known users stuck on 23.something can use DRAM 2 +- [Replace sample with input_fasta for output](https://github.com/WrightonLabCSU/DRAM/commit/e61535daeeb20f81e875c2359a4931104f4e2820) + in DRAM 1, output (like raw-annotations) like had the column fasta + in DRAM 2 it was renamed to sample, which is incorrect since it isn't + the sample, it is the fasta. Reverting it to fasta like in DRAM 1 + is a bit more logistically difficult because a large number of + nf processes (nf functions), and some python files use fasta + for the fastas file paths. So replacing sample with fasta + would cause collisions, and therefore we would need to first + replace all fasta keyworks with something like fasta_path + and then all sample with fasta. This route was easier + and probably less likely to introduce bugs. +- [Changing rename to run all fasta at once instead of 1 at a time](https://github.com/WrightonLabCSU/DRAM/commit/2c3445195332cb8bff675f3d43d5579d3d3d5a13) + rename currently runs 1 fasta at a time which means for things + like slurm it submits 1 job per fasta. rename takes in the realm + of seconds. It is much more efficient to batch them together. +- [downgrade nf-schema to 2.0.1 so nextflow can be down to 23 or even 22…](https://github.com/WrightonLabCSU/DRAM/commit/2033031709749b4e532cc40daa2448a0035425d0) + … something so known users stuck on 23.something can use DRAM 2 - [Update rename for dependencies](https://github.com/WrightonLabCSU/DRAM/commit/e7a61a562638635716b53a9a7fe5198fad87a83e) -- [Update modules code to include wave seqera container](https://github.com/WrightonLabCSU/DRAM/commit/cc9b372f1aae59fa94aabcef3944d4d37e6077e2) -using wave-cli, with cmd -for every module in modules/local, then adding the outputted url to -container outputer.url for the modules nextflow script, under the conda line. -This allows users to not just use conda, but also containers, and we don't have to build them -Ideally this would be added to a CI, but I haven't see where nf-core is doing that with a CI yet. +- [Update modules code to include wave seqera container](https://github.com/WrightonLabCSU/DRAM/commit/cc9b372f1aae59fa94aabcef3944d4d37e6077e2) + using wave-cli, with cmd + for every module in modules/local, then adding the outputted url to + container outputer.url for the modules nextflow script, under the conda line. + This allows users to not just use conda, but also containers, and we don't have to build them + Ideally this would be added to a CI, but I haven't see where nf-core is doing that with a CI yet. - [Add kegg formatting option](https://github.com/WrightonLabCSU/DRAM/commit/45bb6dfa5c421679840e861a4faf8b3b8e5664db) -- [Add processes to modules.conf](https://github.com/WrightonLabCSU/DRAM/commit/518c1dfc5760a940b34241f468f8e25cef61a724) -Add processes to modules.conf to add publishDir information so they output -their contents where I want them to. -Also added process labels to processes so that NF knows cpus, memory, and time -limits to give different processes. +- [Add processes to modules.conf](https://github.com/WrightonLabCSU/DRAM/commit/518c1dfc5760a940b34241f468f8e25cef61a724) + Add processes to modules.conf to add publishDir information so they output + their contents where I want them to. + Also added process labels to processes so that NF knows cpus, memory, and time + limits to give different processes. - [Add slurm option to launch with slurm executor](https://github.com/WrightonLabCSU/DRAM/commit/a55cddf07936762cb980e16fcc9a4b2e136092b8) - [Update README with some basic install instructions](https://github.com/WrightonLabCSU/DRAM/commit/0db581c820b5dabe41a5fb6469557f7e1f6b276c) @@ -355,9 +353,10 @@ Fix typo causing bug in main script [c94d0d4](c94d0d4c5010d9885506915e6c1b37d64f3c7f83)...[f415e92](f415e92fc55d228abcc1eeff911a79e09da35adb) ### What's Changed -* Give default to ch_distill_sql_script since it is used always in annotations by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/383 -* Bugfix/path creation bug by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/385 -* Feature/kegg pep directory by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/387 + +- Give default to ch_distill_sql_script since it is used always in annotations by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/383 +- Bugfix/path creation bug by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/385 +- Feature/kegg pep directory by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM/pull/387 ## 2.0.0-beta3 - 2024-10-15 @@ -367,33 +366,35 @@ DRAM v2 is wrapped in Nextflow due to its innate scalability on HPCs and contain #### Pre Beta -* Nextflow initial wrapping -* DRAM package restructuring for Nextflow -* Database preformatting changes -* Containerization +- Nextflow initial wrapping +- DRAM package restructuring for Nextflow +- Database preformatting changes +- Containerization ### Previous Betas from old repo -#### Beta 1 -* Removed hard-coded slurm node and slurm_queue in nextflow.config by @BioRRW in https://github.com/WrightonLabCSU/DRAM2/pull/1 -* Dev by @BioRRW in #2 - https://github.com/WrightonLabCSU/DRAM2/pull/13 -* Visualizations/make product by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/12 -* Dev by @BioRRW in https://github.com/WrightonLabCSU/DRAM2/pull/14 -* Visualizations/docstrings by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/15 -* Add README to visualization package by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/16 -* Viz/move viz to installable package by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/20 -* Feature/kegg db formatting by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/23 -* Package/add docker file by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/24 -* Kegg formating, docker, visualization package, dev notes by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/19 +#### Beta 1 + +- Removed hard-coded slurm node and slurm_queue in nextflow.config by @BioRRW in https://github.com/WrightonLabCSU/DRAM2/pull/1 +- Dev by @BioRRW in #2 - https://github.com/WrightonLabCSU/DRAM2/pull/13 +- Visualizations/make product by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/12 +- Dev by @BioRRW in https://github.com/WrightonLabCSU/DRAM2/pull/14 +- Visualizations/docstrings by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/15 +- Add README to visualization package by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/16 +- Viz/move viz to installable package by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/20 +- Feature/kegg db formatting by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/23 +- Package/add docker file by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/24 +- Kegg formating, docker, visualization package, dev notes by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/19 #### Beta2 -* Replace many ./ paths with using NF's projectDir variable by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/25 -* Config/split config by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/26 -* Update docs with new install instructions by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/27 + +- Replace many ./ paths with using NF's projectDir variable by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/25 +- Config/split config by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/26 +- Update docs with new install instructions by @madeline-scyphers in https://github.com/WrightonLabCSU/DRAM2/pull/27 #### Beta 3 -* Move from DRAM2 name back to DRAM -* Moving DRAM Nextflow Configuration to split better between internal and user +- Move from DRAM2 name back to DRAM +- Moving DRAM Nextflow Configuration to split better between internal and user diff --git a/LICENSE b/LICENSE index e72bfdda..f288702d 100644 --- a/LICENSE +++ b/LICENSE @@ -671,4 +671,4 @@ into proprietary programs. If your program is a subroutine library, you may consider it more useful to permit linking proprietary applications with the library. If this is what you want to do, use the GNU Lesser General Public License instead of this License. But first, please read -. \ No newline at end of file +. diff --git a/README.md b/README.md index 7c4b3ca7..a0d25478 100644 --- a/README.md +++ b/README.md @@ -8,13 +8,15 @@ DRAM v2 (Distilled and Refined Annotation of Metabolism Version 2) is a tool for annotating metagenomic and genomic assembled data (e.g. scaffolds or contigs) or called genes (e.g. nuclotide or amino acid format). DRAM annotates MAGs using [KEGG](https://www.kegg.jp/) (if provided by the user), [UniRef90](https://www.uniprot.org/), [PFAM](https://pfam.xfam.org/), [dbCAN](http://bcb.unl.edu/dbCAN2/), [RefSeq viral](https://www.ncbi.nlm.nih.gov/genome/viruses/), [VOGDB](http://vogdb.org/) and the [MEROPS](https://www.ebi.ac.uk/merops/) peptidase database as well as custom user databases. -DRAM is run in four stages: -1) Gene Calling Prodogal - genes are called on user provided scaffolds or contigs -2) Gene Annotation - genes are annotated with a set of user defined databases -3) Distillation - annotations are curated into functional categories -4) Product Generation - interactive visualizations of DRAM output are generated +DRAM is run in four stages: + +1. Gene Calling Prodogal - genes are called on user provided scaffolds or contigs +2. Gene Annotation - genes are annotated with a set of user defined databases +3. Distillation - annotations are curated into functional categories +4. Product Generation - interactive visualizations of DRAM output are generated For more detail on DRAM and how DRAM v2 works please see our DRAM products: + - [DRAM version 1 publication](https://academic.oup.com/nar/article/48/16/8883/5884738) - [DRAM in KBase publication](https://pubmed.ncbi.nlm.nih.gov/36857575/) - [DRAM webinar](https://www.youtube.com/watch?v=-Ky2fz2vw2s) @@ -24,44 +26,51 @@ For more detail on DRAM and how DRAM v2 works please see our DRAM products: - [Docs](https://dramit.readthedocs.io/en/latest) - [Installation Guide](https://dramit.readthedocs.io/en/latest/installation.html) - [Usage Examples](https://dramit.readthedocs.io/en/latest/usage.html) -- [Parameter API]([#command-line-options](https://dramit.readthedocs.io/en/latest/params_doc.html)) -- [Rules API]([#nextflow-tips-and-tricks](https://dramit.readthedocs.io/en/latest/rules_parser.html)) +- [Parameter API](<[#command-line-options](https://dramit.readthedocs.io/en/latest/params_doc.html)>) +- [Rules API](<[#nextflow-tips-and-tricks](https://dramit.readthedocs.io/en/latest/rules_parser.html)>) ## Example Usage DRAM apps Call, Annotate and Distill can all be run at once or alternatively, each app can be run individually. Here are some common usage examples: -1) **Rename fasta headers based on input sample file names:** +1. **Rename fasta headers based on input sample file names:** + ```bash nextflow run WrightonLabCSU/DRAM --rename --input_fasta ``` -2) **Call genes using input fastas (use --rename to rename FASTA headers):** +2. **Call genes using input fastas (use --rename to rename FASTA headers):** + ```bash nextflow run WrightonLabCSU/DRAM --call --rename --input_fasta ``` -3) **Annotate called genes using input called genes and the KOFAM database:** +3. **Annotate called genes using input called genes and the KOFAM database:** + ```bash nextflow run WrightonLabCSU/DRAM --annotate --input_genes --use_kofam ``` -4) **Annotate called genes using input fasta files and the KOFAM database:** +4. **Annotate called genes using input fasta files and the KOFAM database:** + ```bash nextflow run WrightonLabCSU/DRAM --annotate --input_fasta --use_kofam ``` -5) **Merge various existing annotations files together (Must be generated using DRAM):** +5. **Merge various existing annotations files together (Must be generated using DRAM):** + ```bash nextflow run WrightonLabCSU/DRAM --merge_annotations ``` -6) **Distill using input annotations:** +6. **Distill using input annotations:** + ```bash nextflow run WrightonLabCSU/DRAM --distill_ --annotations ``` -7) **Complete workflow example:** +7. **Complete workflow example:** + ```bash nextflow run -bg WrightonLabCSU/DRAM \ --input_fasta [DIRECTORY of fasta files] \ @@ -98,6 +107,7 @@ params { ``` You can also use a custom config file: + ```bash nextflow run DRAM -c /path/to/custom_config.config ``` diff --git a/assets/amg_database.20220928.tsv b/assets/amg_database.20220928.tsv index 42b93eae..36bf891e 100644 --- a/assets/amg_database.20220928.tsv +++ b/assets/amg_database.20220928.tsv @@ -277,4 +277,4 @@ K01599 EC:4.1.1.37 PF01208 Uroporphyrinogen decarboxylase (URO-D) Roux et al. PF13385 Concanavalin A-like lectin; extracellular arabinase Emerson et al. 2018 FALSE K01779 EC:5.1.1.13 racD; aspartate Racmase Trubl et al. 2018 FALSE PF01786 Plastoquinol terminal oxidase (PTOX) Sullivan et al. 2010; Ignacio?Espinoza et al. 2012; Roux et al. 2016 FALSE - PF01077; PF03460 rdsrA; reverse-acting dissimilatory sulfite reductase (alpha subunit) Anantharaman et al. 2014 FALSE \ No newline at end of file + PF01077; PF03460 rdsrA; reverse-acting dissimilatory sulfite reductase (alpha subunit) Anantharaman et al. 2014 FALSE diff --git a/assets/internal/generate_sql_database.py b/assets/internal/generate_sql_database.py index e7d26490..925463b8 100644 --- a/assets/internal/generate_sql_database.py +++ b/assets/internal/generate_sql_database.py @@ -2,15 +2,17 @@ import sqlite3 import argparse + def insert_data(conn, table_name, data): - placeholders = ', '.join(['?'] * len(data[0])) + placeholders = ", ".join(["?"] * len(data[0])) query = f"INSERT OR REPLACE INTO {table_name} VALUES ({placeholders})" conn.executemany(query, data) conn.commit() + def process_dbcan(db_dir): - description_file = os.path.join(db_dir, 'dbcan.fam-activities.tsv') - ec_file = os.path.join(db_dir, 'dbcan.fam.subfam.ec.tsv') + description_file = os.path.join(db_dir, "dbcan.fam-activities.tsv") + ec_file = os.path.join(db_dir, "dbcan.fam.subfam.ec.tsv") descriptions = {} ecs = {} @@ -19,39 +21,50 @@ def process_dbcan(db_dir): # Process descriptions with open(description_file) as f: for line in f: - if line.startswith('#') or not line.strip(): + if line.startswith("#") or not line.strip(): continue - parts = line.strip().split('\t') + parts = line.strip().split("\t") if len(parts) >= 2: - descriptions[parts[0]] = ' '.join(parts[1:]) + descriptions[parts[0]] = " ".join(parts[1:]) elif len(parts) == 1: descriptions[parts[0]] = "No description available" else: - skipped_lines.append(f"Skipped line in description file: {line.strip()} (expected at least 2 columns, found {len(parts)})") + skipped_lines.append( + f"Skipped line in description file: {line.strip()} (expected at least 2 columns, found {len(parts)})" + ) # Process EC numbers with open(ec_file) as f: for line in f: - parts = line.strip().split('\t') + parts = line.strip().split("\t") if len(parts) > 2: ecs[parts[0]] = ecs.get(parts[0], set()) ecs[parts[0]].add(parts[2]) data = [] for entry in descriptions: - ec = ','.join(ecs.get(entry, [])) + ec = ",".join(ecs.get(entry, [])) data.append((entry, descriptions[entry], ec)) - + return data, skipped_lines + def main(): - parser = argparse.ArgumentParser(description="Generate descriptions database for DRAM.") - parser.add_argument('--db_dir', required=True, help="Directory containing the database subdirectories.") - parser.add_argument('--output_db', required=True, help="Path to the output SQLite database.") - parser.add_argument('--log', required=True, help="Path to the log file.") + parser = argparse.ArgumentParser( + description="Generate descriptions database for DRAM." + ) + parser.add_argument( + "--db_dir", + required=True, + help="Directory containing the database subdirectories.", + ) + parser.add_argument( + "--output_db", required=True, help="Path to the output SQLite database." + ) + parser.add_argument("--log", required=True, help="Path to the log file.") args = parser.parse_args() - + log_entries = [] db_dir = args.db_dir output_db = args.output_db @@ -59,28 +72,29 @@ def main(): conn = sqlite3.connect(output_db) log_entries.append(f"Opened database {output_db}") - dbcan_dir = os.path.join(db_dir, 'dbcan') + dbcan_dir = os.path.join(db_dir, "dbcan") if os.path.exists(dbcan_dir): conn.execute(""" CREATE TABLE IF NOT EXISTS dbcan_description ( - id VARCHAR(30) NOT NULL, - description VARCHAR(1000), - ec VARCHAR(1000), + id VARCHAR(30) NOT NULL, + description VARCHAR(1000), + ec VARCHAR(1000), PRIMARY KEY (id) ); """) log_entries.append("Processing dbcan_description from " + dbcan_dir) data, skipped_lines = process_dbcan(dbcan_dir) - insert_data(conn, 'dbcan_description', data) + insert_data(conn, "dbcan_description", data) log_entries.append(f"Inserted {len(data)} records into dbcan_description") log_entries.extend(skipped_lines) - - with open(args.log, 'w') as log_file: + + with open(args.log, "w") as log_file: for entry in log_entries: - log_file.write(entry + '\n') - + log_file.write(entry + "\n") + conn.close() log_entries.append("Closed database connection") + if __name__ == "__main__": - main() \ No newline at end of file + main() diff --git a/assets/internal/prepare_databases.py b/assets/internal/prepare_databases.py index 42a113d8..df90f063 100644 --- a/assets/internal/prepare_databases.py +++ b/assets/internal/prepare_databases.py @@ -14,7 +14,7 @@ "dbcan": { "hmm_url": "https://bcb.unl.edu/dbCAN2/download/Databases/V12/dbCAN-HMMdb-V12.txt", "family_url": "https://bcb.unl.edu/dbCAN2/download/Databases/V12/CAZyDB.08062022.fam.subfam.ec.txt", - "subfamily_url": "https://bcb.unl.edu/dbCAN2/download/Databases/V12/CAZyDB.08062022.fam-activities.txt" + "subfamily_url": "https://bcb.unl.edu/dbCAN2/download/Databases/V12/CAZyDB.08062022.fam-activities.txt", }, "cant_hyd": { "base_url": "https://api.github.com/repos/dgittins/CANT-HYD-HydrocarbonBiodegradation/contents/HMMs/concatenated%20HMMs", @@ -23,22 +23,22 @@ "hmm_url": "https://raw.githubusercontent.com/WrightonLabCSU/CAMPER/main/CAMPER.hmm", "faa_url": "https://raw.githubusercontent.com/WrightonLabCSU/CAMPER/main/CAMPER_blast.faa", "mmseq_scores_url": "https://raw.githubusercontent.com/WrightonLabCSU/CAMPER/main/CAMPER_blast_scores.tsv", - "hmm_scores_url": "https://raw.githubusercontent.com/WrightonLabCSU/CAMPER/main/CAMPER_hmm_scores.tsv" + "hmm_scores_url": "https://raw.githubusercontent.com/WrightonLabCSU/CAMPER/main/CAMPER_hmm_scores.tsv", }, "vogdb": { "hmm_url": "https://fileshare.lisc.univie.ac.at/vog/latest/vog.hmm.tar.gz", - "annotations_url": "https://fileshare.lisc.univie.ac.at/vog/latest/vog.annotations.tsv.gz" + "annotations_url": "https://fileshare.lisc.univie.ac.at/vog/latest/vog.annotations.tsv.gz", }, "pfam": { "hmm_url": "ftp://ftp.ebi.ac.uk/pub/databases/Pfam/current_release/Pfam-A.hmm.dat.gz", - "mmseq_url": "ftp://ftp.ebi.ac.uk/pub/databases/Pfam/current_release/Pfam-A.full.gz" + "mmseq_url": "ftp://ftp.ebi.ac.uk/pub/databases/Pfam/current_release/Pfam-A.full.gz", }, "merops": { "mmseqs_url": "ftp://ftp.ebi.ac.uk/pub/databases/merops/current_release/pepunit.lib" }, "kofam": { "hmm_url": "ftp://ftp.genome.jp/pub/db/kofam/profiles.tar.gz", - "ko_list_url": "ftp://ftp.genome.jp/pub/db/kofam/ko_list.gz" + "ko_list_url": "ftp://ftp.genome.jp/pub/db/kofam/ko_list.gz", }, "fegenie": { "base_url": "https://api.github.com/repos/Arkadiy-Garber/FeGenie/contents/hmms/iron/", @@ -53,74 +53,64 @@ "iron_oxidation", "iron_storage", "iron_reduction", - "magnetosome_formation" + "magnetosome_formation", ], - "files": [ - "HMM-bitcutoffs.txt" - ] + "files": ["HMM-bitcutoffs.txt"], }, "sulfur": { "hmm_path": "/home/reedrich/Wrighton-Lab/Projects/DRAM-Main-Main-Project/DRAM2/DRAM-2-Nextflow/databases/sulfur/sulfur.hmm" }, "methyl": { "faa_path": "/home/reedrich/Wrighton-Lab/Projects/DRAM-Main-Main-Project/DRAM2/DRAM-2-Nextflow/databases/methyl/methylotrophy.faa" - } + }, } # Define rename_mapping dictionaries for each database rename_mapping_dbcan = { "hmm_url": "dbcan.hmm", "family_url": "dbcan.fam-activities.tsv", - "subfamily_url": "dbcan.fam.subfam.ec.tsv" + "subfamily_url": "dbcan.fam.subfam.ec.tsv", } -rename_mapping_cant_hyd = { - "hmm_file": "cant_hyd.hmm" -} +rename_mapping_cant_hyd = {"hmm_file": "cant_hyd.hmm"} rename_mapping_camper = { "CAMPER.hmm": "hmm/camper.hmm", "CAMPER_blast.faa": "mmseqs/camper_blast.faa", "CAMPER_blast_scores.tsv": "mmseqs/camper_blast_scores.tsv", - "CAMPER_hmm_scores.tsv": "hmm/camper_hmm_scores.tsv" + "CAMPER_hmm_scores.tsv": "hmm/camper_hmm_scores.tsv", } rename_mapping_vogdb = { "hmm_url": "vog_latest_hmms.hmm", - "annotations_url": "vog_annotations_latest.tsv.gz" + "annotations_url": "vog_annotations_latest.tsv.gz", } rename_mapping_pfam = { "Pfam-A.hmm.dat.gz": "hmm/Pfam-A.hmm.dat", - "Pfam-A.full.gz": "mmseqs/Pfam-A.full.gz" + "Pfam-A.full.gz": "mmseqs/Pfam-A.full.gz", } rename_mapping_merops = { "pepunit.lib": "mmseqs/merops_peptidases_nr.faa", } -rename_mapping_kofam = { - "hmm_url": "kofam_profiles.hmm", - "ko_list": "kofam_ko_list.tsv" -} +rename_mapping_kofam = {"hmm_url": "kofam_profiles.hmm", "ko_list": "kofam_ko_list.tsv"} rename_mapping_fegenie = { "hmm_file": "fegenie.hmm", "HMM-bitcutoffs.txt": "fegenie_iron_cut_offs.txt", } -rename_mapping_sulfur = { - "hmm_file": "sulfur.hmm" -} +rename_mapping_sulfur = {"hmm_file": "sulfur.hmm"} + +rename_mapping_methyl = {"hmm_file": "methyl.faa"} -rename_mapping_methyl = { - "hmm_file": "methyl.faa" -} def download_cant_hyd_files(output_dir): base_url = database_urls["cant_hyd"]["base_url"] response = requests.get(base_url) - + if response.status_code == 200: files = response.json() for file in files: @@ -128,19 +118,24 @@ def download_cant_hyd_files(output_dir): download_url = file["download_url"] file_name = "cant_hyd.hmm" # Rename the file to cant_hyd.hmm download_file_path = path.join(output_dir, file_name) - + file_response = requests.get(download_url) if file_response.status_code == 200: with open(download_file_path, "wb") as f: f.write(file_response.content) print(f"Downloaded file: {file_name}") else: - print(f"Failed to download file: {file_name}. Status code: {file_response.status_code}") + print( + f"Failed to download file: {file_name}. Status code: {file_response.status_code}" + ) else: - print(f"Failed to fetch file list from GitHub. Status code: {response.status_code}") + print( + f"Failed to fetch file list from GitHub. Status code: {response.status_code}" + ) print("cant_hyd files downloaded successfully.") + def download_fegenie_files(output_dir): repo_url = "https://github.com/Arkadiy-Garber/FeGenie.git" fegenie_dir = path.join(output_dir, "FeGenie") @@ -183,7 +178,7 @@ def download_fegenie_files(output_dir): def download_fegenie_file(base_url, file_name, output_dir): """ Download a file from the FeGenie repository. - + Args: base_url (str): The base URL of the FeGenie repository. file_name (str): The name of the file to download. @@ -201,7 +196,10 @@ def download_fegenie_file(base_url, file_name, output_dir): file.write(response.content) print(f"Downloaded file: {file_name}") else: - print(f"Failed to download file: {file_name}. Status code: {response.status_code}") + print( + f"Failed to download file: {file_name}. Status code: {response.status_code}" + ) + def download_databases(output_dir, databases): for database in databases: @@ -218,12 +216,22 @@ def download_databases(output_dir, databases): elif database == "dbcan": for url_key, url_value in urls.items(): download_url = url_value # Get the download URL from the dictionary - download_file_name = path.basename(download_url) # Extract the file name from the URL - download_file_path = path.join(database_output_dir, download_file_name) + download_file_name = path.basename( + download_url + ) # Extract the file name from the URL + download_file_path = path.join( + database_output_dir, download_file_name + ) # Download the file using curl curl_command = f"curl -L -o {download_file_path} {download_url}" - subprocess.run(curl_command, shell=True, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) + subprocess.run( + curl_command, + shell=True, + check=True, + stdout=subprocess.DEVNULL, + stderr=subprocess.DEVNULL, + ) print(f"Downloaded file: {download_file_name}") elif database == "cant_hyd": @@ -231,23 +239,45 @@ def download_databases(output_dir, databases): elif database == "kofam": for url_key, url_value in urls.items(): download_url = url_value # Get the download URL from the dictionary - download_file_name = path.basename(download_url) # Extract the file name from the URL - download_file_path = path.join(database_output_dir, download_file_name) + download_file_name = path.basename( + download_url + ) # Extract the file name from the URL + download_file_path = path.join( + database_output_dir, download_file_name + ) # Download the file using curl curl_command = f"curl -L -o {download_file_path} {download_url}" - subprocess.run(curl_command, shell=True, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) + subprocess.run( + curl_command, + shell=True, + check=True, + stdout=subprocess.DEVNULL, + stderr=subprocess.DEVNULL, + ) print(f"Downloaded file: {download_file_name}") else: for url_key, url_value in urls.items(): - download_url = urls[url_key] # Get the download URL from the dictionary - download_file_name = path.basename(download_url) # Extract the file name from the URL - download_file_path = path.join(database_output_dir, download_file_name) + download_url = urls[ + url_key + ] # Get the download URL from the dictionary + download_file_name = path.basename( + download_url + ) # Extract the file name from the URL + download_file_path = path.join( + database_output_dir, download_file_name + ) # Download the file using curl curl_command = f"curl -L -o {download_file_path} {download_url}" - subprocess.run(curl_command, shell=True, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) + subprocess.run( + curl_command, + shell=True, + check=True, + stdout=subprocess.DEVNULL, + stderr=subprocess.DEVNULL, + ) print(f"Downloaded file: {download_file_name}") @@ -255,12 +285,19 @@ def download_databases(output_dir, databases): else: print(f"URLs for {database} database are not defined. Skipping.") + def process_vogdb_database(database_file, output_dir, num_threads=1): print("Processing VogDB database...") if path.exists(database_file): # Extract the downloaded tar.gz file tar_command = f"tar -xzf {database_file} -C {output_dir}" - subprocess.run(tar_command, shell=True, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) + subprocess.run( + tar_command, + shell=True, + check=True, + stdout=subprocess.DEVNULL, + stderr=subprocess.DEVNULL, + ) # Locate the .gz file in the extracted directory (if any) hmm_files = glob(path.join(output_dir, "hmm", "*.hmm.gz")) @@ -269,13 +306,20 @@ def process_vogdb_database(database_file, output_dir, num_threads=1): # Decompress each .hmm.gz file using pigz for hmm_file in hmm_files: decompress_command = f"pigz -d -p {num_threads} {hmm_file}" - subprocess.run(decompress_command, shell=True, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) + subprocess.run( + decompress_command, + shell=True, + check=True, + stdout=subprocess.DEVNULL, + stderr=subprocess.DEVNULL, + ) print(f"Decompressed file: {hmm_file}") print("VogDB processed successfully.") else: print("VogDB file not found. Skipping processing.") + def process_camper_database(output_dir): print("Processing Camper database...") @@ -303,9 +347,7 @@ def process_camper_database(output_dir): # Rename MMseqs files to follow the desired naming scheme mmseqs_dir = path.join(output_dir, "mmseqs") - mmseqs_files = { - "camper_blast_scores.tsv": "camper_scores.tsv" - } + mmseqs_files = {"camper_blast_scores.tsv": "camper_scores.tsv"} for old_name, new_name in mmseqs_files.items(): old_path = path.join(mmseqs_dir, old_name) new_path = path.join(mmseqs_dir, new_name) @@ -317,9 +359,10 @@ def process_camper_database(output_dir): print("Camper processed successfully.") + def process_pfam_database(output_dir, num_threads=1): print("Processing Pfam database...") - + for original_file, new_file in rename_mapping_pfam.items(): original_path = path.join(output_dir, original_file) new_path = path.join(output_dir, new_file) @@ -332,18 +375,29 @@ def process_pfam_database(output_dir, num_threads=1): if path.exists(original_path): if original_file.endswith(".gz"): decompress_command = f"pigz -d -p {num_threads} {original_path}" - subprocess.run(decompress_command, shell=True, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) - original_path = original_path[:-3] # Remove .gz extension after decompression + subprocess.run( + decompress_command, + shell=True, + check=True, + stdout=subprocess.DEVNULL, + stderr=subprocess.DEVNULL, + ) + original_path = original_path[ + :-3 + ] # Remove .gz extension after decompression move(original_path, new_path) - print(f"File {original_file} decompressed (if needed), renamed and moved to {new_path}") + print( + f"File {original_file} decompressed (if needed), renamed and moved to {new_path}" + ) else: print(f"File {original_file} not found. Skipping.") print("Pfam processed successfully.") + def process_merops_database(output_dir, num_threads=1): print("Processing Merops database...") - + for original_file, new_file in rename_mapping_merops.items(): original_path = path.join(output_dir, original_file) new_path = path.join(output_dir, new_file) @@ -364,9 +418,10 @@ def process_merops_database(output_dir, num_threads=1): # Create the MMseqs2 database create_mmseqs(new_path, new_path + "_db", num_threads) + def process_fegenie_database(output_dir): print("Processing FeGenie database...") - + # Download and prepare FeGenie files download_fegenie_files(output_dir) @@ -409,17 +464,16 @@ def process_fegenie_database(output_dir): print(f"Removed file: {file_path}") print("FeGenie processed successfully.") - def process_sulfur_database(output_dir): print("Processing Sulfur database...") sulfur_hmm_path = database_urls["sulfur"]["hmm_path"] - + # Create the sulfur output directory if it doesn't exist if not path.exists(output_dir): mkdir(output_dir) - + # Move the sulfur HMM file to the sulfur output directory destination_path = path.join(output_dir, path.basename(sulfur_hmm_path)) shutil.copyfile(sulfur_hmm_path, destination_path) @@ -431,12 +485,13 @@ def process_sulfur_database(output_dir): except subprocess.CalledProcessError as e: print(f"Error running hmmpress: {e}") print("Please check the format of the sulfur HMM file.") - + print("Sulfur processed successfully.") + def process_methyl_database(output_dir, num_threads=1): print("Processing Methyl database...") - + # Paths for methyl database files methyl_faa_path = database_urls["methyl"]["faa_path"] methyl_faa_dest = path.join(output_dir, "methyl.faa") @@ -451,6 +506,7 @@ def process_methyl_database(output_dir, num_threads=1): print("Methyl processed successfully.") + def process_cant_hyd_database(output_dir): print("Processing cant_hyd database...") repo_url = "https://github.com/dgittins/CANT-HYD-HydrocarbonBiodegradation.git" @@ -470,13 +526,15 @@ def process_cant_hyd_database(output_dir): os.makedirs(hmm_dir) # Move the concatenated HMM file to the hmm subdirectory - concatenated_hmm_path = path.join(cant_hyd_dir, "HMMs", "concatenated HMMs", "CANT-HYD.hmm") + concatenated_hmm_path = path.join( + cant_hyd_dir, "HMMs", "concatenated HMMs", "CANT-HYD.hmm" + ) final_hmm_path = path.join(hmm_dir, "cant_hyd.hmm") if path.exists(concatenated_hmm_path): move(concatenated_hmm_path, final_hmm_path) print(f"Moved CANT-HYD.hmm to {final_hmm_path}") else: - print(f"Concatenated HMM file not found in the repository.") + print("Concatenated HMM file not found in the repository.") # Remove the cloned repository directory rmtree(cant_hyd_dir) @@ -495,12 +553,13 @@ def process_cant_hyd_database(output_dir): print("cant_hyd processed successfully.") + def process_dbcan_database(output_dir): print("Processing dbcan database...") rename_mapping = { "dbCAN-HMMdb-V12.txt": "dbcan.hmm", "CAZyDB.08062022.fam.subfam.ec.txt": "dbcan.fam.subfam.ec.tsv", - "CAZyDB.08062022.fam-activities.txt": "dbcan.fam-activities.tsv" + "CAZyDB.08062022.fam-activities.txt": "dbcan.fam-activities.tsv", } for original_file, new_file in rename_mapping.items(): @@ -527,6 +586,7 @@ def process_dbcan_database(output_dir): print("dbcan processed successfully.") + def process_kofam_database(output_dir, num_threads=1): print("Processing kofam database...") hmm_dir = path.join(output_dir, "hmm") @@ -539,7 +599,13 @@ def process_kofam_database(output_dir, num_threads=1): profiles_tar_path = path.join(output_dir, "profiles.tar.gz") if path.exists(profiles_tar_path): tar_command = f"tar -xzf {profiles_tar_path} -C {hmm_dir}" - subprocess.run(tar_command, shell=True, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) + subprocess.run( + tar_command, + shell=True, + check=True, + stdout=subprocess.DEVNULL, + stderr=subprocess.DEVNULL, + ) print(f"Extracted {profiles_tar_path} to {hmm_dir}") else: print("Profiles tar file not found. Skipping extraction.") @@ -548,10 +614,16 @@ def process_kofam_database(output_dir, num_threads=1): ko_list_path = path.join(output_dir, "ko_list.gz") if path.exists(ko_list_path): decompress_command = f"pigz -d -p {num_threads} {ko_list_path}" - subprocess.run(decompress_command, shell=True, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) + subprocess.run( + decompress_command, + shell=True, + check=True, + stdout=subprocess.DEVNULL, + stderr=subprocess.DEVNULL, + ) ko_list_path = ko_list_path[:-3] # Remove .gz extension after decompression move(ko_list_path, path.join(output_dir, "kofam_ko_list.tsv")) - print(f"Decompressed and renamed ko_list to kofam_ko_list.tsv") + print("Decompressed and renamed ko_list to kofam_ko_list.tsv") else: print("ko_list.gz file not found. Skipping decompression.") @@ -576,9 +648,10 @@ def process_kofam_database(output_dir, num_threads=1): print("kofam processed successfully.") + def generate_readme(output_dir, databases_info): def human_readable_size(size, decimal_places=1): - for unit in ['B', 'KB', 'MB', 'GB', 'TB']: + for unit in ["B", "KB", "MB", "GB", "TB"]: if size < 1024.0: return f"{size:.{decimal_places}f} {unit}" size /= 1024.0 @@ -589,8 +662,10 @@ def human_readable_size(size, decimal_places=1): readme_content += "URLs used for download:\n" for url_key, url_value in database_info["urls"].items(): readme_content += f"- {url_key}: {url_value}\n" - readme_content += f"\nDate and Time Downloaded: {database_info['download_date']}\n\n" - + readme_content += ( + f"\nDate and Time Downloaded: {database_info['download_date']}\n\n" + ) + # List contents of the directory with sizes, including subdirectories database_dir = path.join(output_dir, database_name) if path.exists(database_dir) and path.isdir(database_dir): @@ -609,32 +684,51 @@ def human_readable_size(size, decimal_places=1): print(f"README.txt generated successfully at {readme_file_path}") + def index_hmm(hmm_dir, hmm_file): try: # Run HMMER to index the HMM file index_command = f"hmmpress -f {hmm_file}" - result = subprocess.run(index_command, shell=True, check=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE) - print(result.stdout.decode('utf-8')) + result = subprocess.run( + index_command, + shell=True, + check=True, + stdout=subprocess.PIPE, + stderr=subprocess.PIPE, + ) + print(result.stdout.decode("utf-8")) print(f"Indexed HMM file: {path.basename(hmm_file)}") except subprocess.CalledProcessError as e: print(f"Error indexing HMM file {path.basename(hmm_file)}: {e}") - print(e.stderr.decode('utf-8')) + print(e.stderr.decode("utf-8")) + def create_mmseqs(fasta_loc, output_loc, threads): """Takes a fasta file and makes a mmseqs2 database for use in blast searching and hmm searching with mmseqs2.""" print(f"Creating MMseqs2 database for {fasta_loc}...") - subprocess.run(["mmseqs", "createdb", fasta_loc, output_loc], check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) + subprocess.run( + ["mmseqs", "createdb", fasta_loc, output_loc], + check=True, + stdout=subprocess.DEVNULL, + stderr=subprocess.DEVNULL, + ) tmp_dir = path.join(path.dirname(output_loc), "tmp") - subprocess.run(["mmseqs", "createindex", output_loc, tmp_dir, "--threads", str(threads)], check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) + subprocess.run( + ["mmseqs", "createindex", output_loc, tmp_dir, "--threads", str(threads)], + check=True, + stdout=subprocess.DEVNULL, + stderr=subprocess.DEVNULL, + ) print(f"MMseqs2 database created at {output_loc}") - + # Remove the temporary directory if path.exists(tmp_dir): rmtree(tmp_dir) print(f"Removed temporary directory: {tmp_dir}") + def sanitize_hmm_file(input_file, output_file): - with open(input_file, 'r') as in_file: + with open(input_file, "r") as in_file: lines = in_file.readlines() sanitized_lines = [] @@ -648,7 +742,9 @@ def sanitize_hmm_file(input_file, output_file): if line.startswith("HMMER3/f"): if entry_started: # Process current entry before starting a new one - sanitized_entry = process_entry(current_entry, entry_names, name_suffix_counter) + sanitized_entry = process_entry( + current_entry, entry_names, name_suffix_counter + ) sanitized_lines.extend(sanitized_entry) current_entry = [] entry_started = True @@ -658,7 +754,9 @@ def sanitize_hmm_file(input_file, output_file): if line == "//": entry_started = False # Process the last entry - sanitized_entry = process_entry(current_entry, entry_names, name_suffix_counter) + sanitized_entry = process_entry( + current_entry, entry_names, name_suffix_counter + ) sanitized_lines.extend(sanitized_entry) current_entry = [] @@ -667,11 +765,12 @@ def sanitize_hmm_file(input_file, output_file): sanitized_entry = process_entry(current_entry, entry_names, name_suffix_counter) sanitized_lines.extend(sanitized_entry) - with open(output_file, 'w') as out_file: - out_file.write('\n'.join(sanitized_lines)) + with open(output_file, "w") as out_file: + out_file.write("\n".join(sanitized_lines)) print(f"Sanitized HMM file written to: {output_file}") + def process_entry(entry_lines, entry_names, name_suffix_counter): name_line_index = None acc_line_index = None @@ -702,6 +801,7 @@ def process_entry(entry_lines, entry_names, name_suffix_counter): return entry_lines + def concatenate_hmm_files(hmm_dir, output_file): hmm_files = [] for root, _, files in os.walk(hmm_dir): @@ -711,9 +811,9 @@ def concatenate_hmm_files(hmm_dir, output_file): hmm_files.sort() - with open(output_file, 'w') as out_file: + with open(output_file, "w") as out_file: for hmm_file in hmm_files: - with open(hmm_file, 'r') as in_file: + with open(hmm_file, "r") as in_file: lines = in_file.readlines() out_file.writelines(lines) if not lines[-1].strip() == "//": @@ -723,15 +823,34 @@ def concatenate_hmm_files(hmm_dir, output_file): print(f"Concatenated HMM files into: {output_file}") + def git_clone_repo(repo_url, output_dir): clone_command = f"git clone {repo_url} {output_dir}" - subprocess.run(clone_command, shell=True, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) + subprocess.run( + clone_command, + shell=True, + check=True, + stdout=subprocess.DEVNULL, + stderr=subprocess.DEVNULL, + ) + def main(): parser = argparse.ArgumentParser(description="Prepare databases for annotation") parser.add_argument("--output_dir", help="Output directory path", required=True) - parser.add_argument("--databases", "-db", nargs='+', help="List of databases to update", required=True) - parser.add_argument("--threads", type=int, default=DEFAULT_THREADS, help="Number of threads for processing") + parser.add_argument( + "--databases", + "-db", + nargs="+", + help="List of databases to update", + required=True, + ) + parser.add_argument( + "--threads", + type=int, + default=DEFAULT_THREADS, + help="Number of threads for processing", + ) parser.add_argument("--verbose", action="store_true", help="Verbose mode") parser.add_argument("--download_date", help="Download date for databases") args = parser.parse_args() @@ -743,14 +862,28 @@ def main(): for database in args.databases: database_output_dir = path.join(args.output_dir, database) if database == "vogdb": - process_vogdb_database(path.join(database_output_dir, "vog.hmm.tar.gz"), database_output_dir, args.threads) - concatenate_hmm_files(path.join(database_output_dir, "hmm"), path.join(database_output_dir, "vog_latest_hmms.hmm")) + process_vogdb_database( + path.join(database_output_dir, "vog.hmm.tar.gz"), + database_output_dir, + args.threads, + ) + concatenate_hmm_files( + path.join(database_output_dir, "hmm"), + path.join(database_output_dir, "vog_latest_hmms.hmm"), + ) rmtree(path.join(database_output_dir, "hmm")) os.remove(path.join(database_output_dir, "vog.hmm.tar.gz")) - index_hmm(database_output_dir, path.join(database_output_dir, "vog_latest_hmms.hmm")) + index_hmm( + database_output_dir, + path.join(database_output_dir, "vog_latest_hmms.hmm"), + ) elif database == "camper": process_camper_database(database_output_dir) - create_mmseqs(path.join(database_output_dir, "mmseqs", "camper_blast.faa"), path.join(database_output_dir, "mmseqs", "camper.mmsdb"), args.threads) + create_mmseqs( + path.join(database_output_dir, "mmseqs", "camper_blast.faa"), + path.join(database_output_dir, "mmseqs", "camper.mmsdb"), + args.threads, + ) elif database == "pfam": process_pfam_database(database_output_dir, args.threads) elif database == "merops": @@ -761,7 +894,11 @@ def main(): process_sulfur_database(database_output_dir) elif database == "methyl": process_methyl_database(database_output_dir) - create_mmseqs(path.join(database_output_dir, "methyl.faa"), path.join(database_output_dir, "methyl"), args.threads) + create_mmseqs( + path.join(database_output_dir, "methyl.faa"), + path.join(database_output_dir, "methyl"), + args.threads, + ) elif database == "dbcan": process_dbcan_database(database_output_dir) elif database == "cant_hyd": @@ -775,10 +912,11 @@ def main(): if database in database_urls: databases_info[database] = { "urls": database_urls[database], - "download_date": args.download_date + "download_date": args.download_date, } generate_readme(args.output_dir, databases_info) + if __name__ == "__main__": - main() \ No newline at end of file + main() diff --git a/assets/trees/amoa_pmoa/pmoa_amoa-tree-mapping.tsv b/assets/trees/amoa_pmoa/pmoa_amoa-tree-mapping.tsv deleted file mode 100644 index e07cc4d0..00000000 --- a/assets/trees/amoa_pmoa/pmoa_amoa-tree-mapping.tsv +++ /dev/null @@ -1,18 +0,0 @@ -gene call -NASQAN2011_051_A_bin.9_Ga0466380_000062_16 amoA-Nitrifier -stroublescreek_2019_sw_WHONDRS-S19S_0089_B_bin.19_k121_1382190_6 pmoA-Methanotroph -NASQAN2016_083_B_bin.62_k121_494990_1 pmoA-Methanotroph -NASQAN2015_172_B_bin.50_k121_110295_6 pmoA-Methanotroph -NASQAN2015_010_F_bin.15_scaffold_716_4 pmoA-Methanotroph -NASQAN2015_010_B_bin.40_k121_261665_1 pmoA-Methanotroph -NASQAN2015_010_A_bin.16_Ga0466474_000760_3 pmoA-Methanotroph -NASQAN2014_188_B_bin.62_k121_1916134_1 pmoA-Methanotroph -lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.22_k121_1561591_36 pmoA-Methanotroph -icacos_2019_sw_WHONDRS-S19S_0094_B_bin.101_k121_1011190_4 pmoA-Methanotroph -hugercreek_2019_sw_WHONDRS-S19S_0044_F_bin.32_scaffold_210_8 pmoA-Methanotroph -hugercreek_2019_sw_WHONDRS-S19S_0044_B_bin.34_k121_1606639_3 pmoA-Methanotroph -gunnisonriver_2019_sw_WHONDRS-S19S_0062_B_bin.67_k121_1407577_11 pmoA-Methanotroph -cobbmillcreek_2019_sw_WHONDRS-S19S_0090_B_bin.17_k121_961747_19 pmoA-Methanotroph -blueriver_2019_sw_WHONDRS-S19S_0024_B_bin.60_k121_1016154_8 pmoA-Methanotroph -blueriver_2019_sw_WHONDRS-S19S_0024_B_bin.60_k121_1651208_1 pmoA-Methanotroph -blackearthcreek_2019_sw_WHONDRS-S19S_0061_F_bin.11_scaffold_109_4 pmoA-Methanotroph diff --git a/assets/trees/amoa_pmoa/pmoa_amoa_search_terms.txt b/assets/trees/amoa_pmoa/pmoa_amoa_search_terms.txt deleted file mode 100644 index 19fdef5a..00000000 --- a/assets/trees/amoa_pmoa/pmoa_amoa_search_terms.txt +++ /dev/null @@ -1,11 +0,0 @@ -K10944 -ammonia monooxygenase -amoA -ammonia oxidation -nitrification -methane monooxygenase -pmoA -methane oxidation -methanotroph -EC: 1.14.18.3 -EC: 1.14.99.39 diff --git a/assets/trees/dmso/dmso.refpkg/CONTENTS.json b/assets/trees/dmso/dmso.refpkg/CONTENTS.json deleted file mode 100644 index 0b9baeaf..00000000 --- a/assets/trees/dmso/dmso.refpkg/CONTENTS.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "metadata": { - "create_date": "2024-05-13 10:00:00", - "format_version": "1.1", - "locus": "1861" - }, - "files": { - "aln_fasta": "dmso.aln", - "phylo_model": "dmso_phylo_model.json", - "tree": "bipartitionsBranchLabels.dmso_refs.fasta_mode_low.renamed", - "tree_stats": "RAxML_info.dmso_refs.fasta" - - }, - "md5": { - "aln_fasta": "d224231710a0c259103a657c64c25d57", - "phylo_model": "0bc512c776715246a24b93391822e0e6", - "tree": "7880cd304b5db4792a0544faeddecdac", - "tree_stats": "d088fa3c4b149b7ccce5dc3843204c35" - }, - "log": [ - "Stripped refpkg (removed 0 files)", - "Loaded initial files into empty refpkg" - ], - "rollback": null, - "rollforward": null -} diff --git a/assets/trees/dmso/dmso.refpkg/RAxML_info.dmso_refs.fasta b/assets/trees/dmso/dmso.refpkg/RAxML_info.dmso_refs.fasta deleted file mode 100644 index 18435a51..00000000 --- a/assets/trees/dmso/dmso.refpkg/RAxML_info.dmso_refs.fasta +++ /dev/null @@ -1,423 +0,0 @@ - - -This is RAxML version 8.2.9 released by Alexandros Stamatakis on July 20 2016. - -With greatly appreciated code contributions by: -Andre Aberer (HITS) -Simon Berger (HITS) -Alexey Kozlov (HITS) -Kassian Kobert (HITS) -David Dao (KIT and HITS) -Sarah Lutteropp (KIT and HITS) -Nick Pattengale (Sandia) -Wayne Pfeiffer (SDSC) -Akifumi S. Tanabe (NRIFS) -Charlie Taylor (UF) - - -Alignment has 866 distinct alignment patterns - -Proportion of gaps and completely undetermined characters in this alignment: 38.35% - -RAxML rapid bootstrapping and subsequent ML search - -Using 1 distinct models/data partitions with joint branch length optimization - - - -Executing 100 rapid bootstrap inferences and thereafter a thorough ML search - -All free model parameters will be estimated by RAxML -ML estimate of 25 per site rate categories - -Likelihood of final tree will be evaluated and optimized under GAMMA - -GAMMA Model parameters will be estimated up to an accuracy of 0.1000000000 Log Likelihood units - -Partition: 0 -Alignment Patterns: 866 -Name: No Name Provided -DataType: AA -Substitution Matrix: LG -Using fixed base frequencies - - - - -RAxML was called as follows: - -raxmlHPC-PTHREADS -f a -m PROTCATLG -n dmso_refs.fasta -N 100 -p 1234 -s dmso_refs.fasta.phy -x 1234 -T 10 - - - -Time for BS model parameter optimization 0.124676 -Bootstrap[0]: Time 3.169462 seconds, bootstrap likelihood -76430.666973, best rearrangement setting 10 -Bootstrap[1]: Time 2.712014 seconds, bootstrap likelihood -77546.608252, best rearrangement setting 15 -Bootstrap[2]: Time 2.764819 seconds, bootstrap likelihood -74372.994119, best rearrangement setting 15 -Bootstrap[3]: Time 2.806386 seconds, bootstrap likelihood -76930.479065, best rearrangement setting 12 -Bootstrap[4]: Time 2.640082 seconds, bootstrap likelihood -79660.177375, best rearrangement setting 9 -Bootstrap[5]: Time 2.848176 seconds, bootstrap likelihood -73284.515856, best rearrangement setting 12 -Bootstrap[6]: Time 2.781467 seconds, bootstrap likelihood -77576.202035, best rearrangement setting 14 -Bootstrap[7]: Time 2.854323 seconds, bootstrap likelihood -77748.588236, best rearrangement setting 10 -Bootstrap[8]: Time 2.708592 seconds, bootstrap likelihood -76091.070124, best rearrangement setting 13 -Bootstrap[9]: Time 2.824420 seconds, bootstrap likelihood -77670.099908, best rearrangement setting 14 -Bootstrap[10]: Time 3.011455 seconds, bootstrap likelihood -74798.130429, best rearrangement setting 14 -Bootstrap[11]: Time 2.865858 seconds, bootstrap likelihood -74927.199956, best rearrangement setting 5 -Bootstrap[12]: Time 2.770799 seconds, bootstrap likelihood -76609.570227, best rearrangement setting 9 -Bootstrap[13]: Time 2.763006 seconds, bootstrap likelihood -75438.207037, best rearrangement setting 10 -Bootstrap[14]: Time 2.969280 seconds, bootstrap likelihood -74923.353365, best rearrangement setting 13 -Bootstrap[15]: Time 2.678948 seconds, bootstrap likelihood -75865.866781, best rearrangement setting 6 -Bootstrap[16]: Time 2.662132 seconds, bootstrap likelihood -72911.410662, best rearrangement setting 15 -Bootstrap[17]: Time 2.792305 seconds, bootstrap likelihood -75379.580846, best rearrangement setting 13 -Bootstrap[18]: Time 2.892445 seconds, bootstrap likelihood -80324.506934, best rearrangement setting 9 -Bootstrap[19]: Time 2.786553 seconds, bootstrap likelihood -72270.100764, best rearrangement setting 8 -Bootstrap[20]: Time 2.809719 seconds, bootstrap likelihood -73748.314934, best rearrangement setting 13 -Bootstrap[21]: Time 2.845561 seconds, bootstrap likelihood -75385.406316, best rearrangement setting 10 -Bootstrap[22]: Time 2.774577 seconds, bootstrap likelihood -73668.616005, best rearrangement setting 5 -Bootstrap[23]: Time 2.683971 seconds, bootstrap likelihood -77498.603255, best rearrangement setting 10 -Bootstrap[24]: Time 2.810509 seconds, bootstrap likelihood -74341.494886, best rearrangement setting 14 -Bootstrap[25]: Time 2.735748 seconds, bootstrap likelihood -72581.128145, best rearrangement setting 7 -Bootstrap[26]: Time 2.882895 seconds, bootstrap likelihood -74868.016278, best rearrangement setting 11 -Bootstrap[27]: Time 2.598391 seconds, bootstrap likelihood -77135.663040, best rearrangement setting 11 -Bootstrap[28]: Time 2.713763 seconds, bootstrap likelihood -74282.268325, best rearrangement setting 8 -Bootstrap[29]: Time 2.875335 seconds, bootstrap likelihood -76303.714027, best rearrangement setting 13 -Bootstrap[30]: Time 2.897037 seconds, bootstrap likelihood -77047.341575, best rearrangement setting 6 -Bootstrap[31]: Time 2.762513 seconds, bootstrap likelihood -76890.228702, best rearrangement setting 9 -Bootstrap[32]: Time 2.758115 seconds, bootstrap likelihood -75231.999227, best rearrangement setting 13 -Bootstrap[33]: Time 2.848642 seconds, bootstrap likelihood -74310.324400, best rearrangement setting 8 -Bootstrap[34]: Time 2.850801 seconds, bootstrap likelihood -74057.460243, best rearrangement setting 8 -Bootstrap[35]: Time 2.842190 seconds, bootstrap likelihood -76889.097344, best rearrangement setting 12 -Bootstrap[36]: Time 2.693162 seconds, bootstrap likelihood -72288.074882, best rearrangement setting 5 -Bootstrap[37]: Time 2.721867 seconds, bootstrap likelihood -72214.897833, best rearrangement setting 8 -Bootstrap[38]: Time 2.746011 seconds, bootstrap likelihood -79858.362103, best rearrangement setting 12 -Bootstrap[39]: Time 2.701599 seconds, bootstrap likelihood -76003.871644, best rearrangement setting 13 -Bootstrap[40]: Time 2.940543 seconds, bootstrap likelihood -73830.857312, best rearrangement setting 14 -Bootstrap[41]: Time 2.665834 seconds, bootstrap likelihood -75052.748018, best rearrangement setting 13 -Bootstrap[42]: Time 2.832848 seconds, bootstrap likelihood -73832.743609, best rearrangement setting 10 -Bootstrap[43]: Time 2.791044 seconds, bootstrap likelihood -76784.398417, best rearrangement setting 13 -Bootstrap[44]: Time 2.934724 seconds, bootstrap likelihood -72855.508133, best rearrangement setting 7 -Bootstrap[45]: Time 2.642106 seconds, bootstrap likelihood -75501.667158, best rearrangement setting 14 -Bootstrap[46]: Time 2.615179 seconds, bootstrap likelihood -77131.871440, best rearrangement setting 14 -Bootstrap[47]: Time 2.792766 seconds, bootstrap likelihood -75247.220567, best rearrangement setting 11 -Bootstrap[48]: Time 2.900219 seconds, bootstrap likelihood -74163.285113, best rearrangement setting 11 -Bootstrap[49]: Time 2.864223 seconds, bootstrap likelihood -77604.775494, best rearrangement setting 15 -Bootstrap[50]: Time 2.786153 seconds, bootstrap likelihood -76515.975539, best rearrangement setting 8 -Bootstrap[51]: Time 2.818712 seconds, bootstrap likelihood -76977.812201, best rearrangement setting 5 -Bootstrap[52]: Time 2.790959 seconds, bootstrap likelihood -78377.652343, best rearrangement setting 7 -Bootstrap[53]: Time 2.784077 seconds, bootstrap likelihood -71766.787886, best rearrangement setting 10 -Bootstrap[54]: Time 2.677011 seconds, bootstrap likelihood -75973.200232, best rearrangement setting 7 -Bootstrap[55]: Time 2.729044 seconds, bootstrap likelihood -75724.499984, best rearrangement setting 8 -Bootstrap[56]: Time 2.729286 seconds, bootstrap likelihood -74888.001582, best rearrangement setting 5 -Bootstrap[57]: Time 2.851877 seconds, bootstrap likelihood -79652.708518, best rearrangement setting 12 -Bootstrap[58]: Time 2.792531 seconds, bootstrap likelihood -75964.690632, best rearrangement setting 15 -Bootstrap[59]: Time 2.798732 seconds, bootstrap likelihood -76742.838934, best rearrangement setting 6 -Bootstrap[60]: Time 3.020606 seconds, bootstrap likelihood -74747.910682, best rearrangement setting 9 -Bootstrap[61]: Time 2.812696 seconds, bootstrap likelihood -75865.927451, best rearrangement setting 9 -Bootstrap[62]: Time 2.901127 seconds, bootstrap likelihood -76123.007373, best rearrangement setting 10 -Bootstrap[63]: Time 2.864416 seconds, bootstrap likelihood -76587.113230, best rearrangement setting 12 -Bootstrap[64]: Time 2.899098 seconds, bootstrap likelihood -76942.463640, best rearrangement setting 11 -Bootstrap[65]: Time 2.784283 seconds, bootstrap likelihood -75986.725459, best rearrangement setting 8 -Bootstrap[66]: Time 2.704422 seconds, bootstrap likelihood -74022.760235, best rearrangement setting 13 -Bootstrap[67]: Time 2.789476 seconds, bootstrap likelihood -73645.645693, best rearrangement setting 15 -Bootstrap[68]: Time 2.776784 seconds, bootstrap likelihood -77333.259622, best rearrangement setting 10 -Bootstrap[69]: Time 2.768058 seconds, bootstrap likelihood -74276.085077, best rearrangement setting 13 -Bootstrap[70]: Time 2.863719 seconds, bootstrap likelihood -74543.721711, best rearrangement setting 11 -Bootstrap[71]: Time 2.712924 seconds, bootstrap likelihood -74674.083552, best rearrangement setting 11 -Bootstrap[72]: Time 2.820370 seconds, bootstrap likelihood -78340.751173, best rearrangement setting 13 -Bootstrap[73]: Time 2.790599 seconds, bootstrap likelihood -77601.131316, best rearrangement setting 5 -Bootstrap[74]: Time 2.778625 seconds, bootstrap likelihood -75849.707899, best rearrangement setting 6 -Bootstrap[75]: Time 2.751258 seconds, bootstrap likelihood -76734.985357, best rearrangement setting 11 -Bootstrap[76]: Time 3.001420 seconds, bootstrap likelihood -75929.712488, best rearrangement setting 6 -Bootstrap[77]: Time 2.936729 seconds, bootstrap likelihood -76003.356537, best rearrangement setting 8 -Bootstrap[78]: Time 2.726102 seconds, bootstrap likelihood -75427.659661, best rearrangement setting 13 -Bootstrap[79]: Time 2.854278 seconds, bootstrap likelihood -74403.801286, best rearrangement setting 13 -Bootstrap[80]: Time 2.932036 seconds, bootstrap likelihood -77528.948929, best rearrangement setting 9 -Bootstrap[81]: Time 2.862943 seconds, bootstrap likelihood -77222.989909, best rearrangement setting 10 -Bootstrap[82]: Time 2.785410 seconds, bootstrap likelihood -75812.368570, best rearrangement setting 7 -Bootstrap[83]: Time 2.775612 seconds, bootstrap likelihood -78151.460391, best rearrangement setting 6 -Bootstrap[84]: Time 2.780776 seconds, bootstrap likelihood -75949.438281, best rearrangement setting 15 -Bootstrap[85]: Time 2.873042 seconds, bootstrap likelihood -75937.261665, best rearrangement setting 10 -Bootstrap[86]: Time 2.779905 seconds, bootstrap likelihood -78273.082126, best rearrangement setting 9 -Bootstrap[87]: Time 2.682864 seconds, bootstrap likelihood -80080.144193, best rearrangement setting 5 -Bootstrap[88]: Time 2.820337 seconds, bootstrap likelihood -74737.458630, best rearrangement setting 12 -Bootstrap[89]: Time 2.685485 seconds, bootstrap likelihood -75303.912997, best rearrangement setting 6 -Bootstrap[90]: Time 3.036829 seconds, bootstrap likelihood -76905.246932, best rearrangement setting 13 -Bootstrap[91]: Time 2.760195 seconds, bootstrap likelihood -79653.636750, best rearrangement setting 8 -Bootstrap[92]: Time 2.739485 seconds, bootstrap likelihood -76693.109057, best rearrangement setting 7 -Bootstrap[93]: Time 2.833615 seconds, bootstrap likelihood -74497.658518, best rearrangement setting 11 -Bootstrap[94]: Time 2.816307 seconds, bootstrap likelihood -77134.348437, best rearrangement setting 15 -Bootstrap[95]: Time 2.802382 seconds, bootstrap likelihood -75483.518060, best rearrangement setting 15 -Bootstrap[96]: Time 2.640518 seconds, bootstrap likelihood -74528.094785, best rearrangement setting 5 -Bootstrap[97]: Time 2.780421 seconds, bootstrap likelihood -73237.919062, best rearrangement setting 14 -Bootstrap[98]: Time 2.724797 seconds, bootstrap likelihood -75401.187043, best rearrangement setting 7 -Bootstrap[99]: Time 2.912125 seconds, bootstrap likelihood -74969.185954, best rearrangement setting 10 - - -Overall Time for 100 Rapid Bootstraps 281.389323 seconds -Average Time per Rapid Bootstrap 2.813893 seconds - -Starting ML Search ... - -Fast ML optimization finished - -Fast ML search Time: 756.295974 seconds - -Slow ML Search 0 Likelihood: -74928.461521 -Slow ML Search 1 Likelihood: -74928.461521 -Slow ML Search 2 Likelihood: -74928.461521 -Slow ML Search 3 Likelihood: -74928.461521 -Slow ML Search 4 Likelihood: -74928.461521 -Slow ML Search 5 Likelihood: -74928.461521 -Slow ML Search 6 Likelihood: -74928.461521 -Slow ML Search 7 Likelihood: -74928.461521 -Slow ML Search 8 Likelihood: -74928.461521 -Slow ML Search 9 Likelihood: -74928.461521 -Slow ML optimization finished - -Slow ML search Time: 602.354747 seconds -Thorough ML search Time: 73.895558 seconds - -Final ML Optimization Likelihood: -74928.461530 - -Model Information: - -Model Parameters of Partition 0, Name: No Name Provided, Type of Data: AA -alpha: 2.776473 -Tree-Length: 55.515763 -rate A <-> R: 0.399182 -rate A <-> N: 0.259945 -rate A <-> D: 0.371058 -rate A <-> C: 2.337364 -rate A <-> Q: 0.910775 -rate A <-> E: 0.975241 -rate A <-> G: 1.940106 -rate A <-> H: 0.336984 -rate A <-> I: 0.140697 -rate A <-> L: 0.371240 -rate A <-> K: 0.503815 -rate A <-> M: 1.055520 -rate A <-> F: 0.238237 -rate A <-> P: 1.105868 -rate A <-> S: 4.439041 -rate A <-> T: 2.009090 -rate A <-> W: 0.169702 -rate A <-> Y: 0.205613 -rate A <-> V: 2.392567 -rate R <-> N: 0.706048 -rate R <-> D: 0.116398 -rate R <-> C: 0.501968 -rate R <-> Q: 2.636754 -rate R <-> E: 0.341785 -rate R <-> G: 0.366408 -rate R <-> H: 2.278690 -rate R <-> I: 0.119250 -rate R <-> L: 0.283449 -rate R <-> K: 5.940467 -rate R <-> M: 0.454623 -rate R <-> F: 0.049508 -rate R <-> P: 0.312264 -rate R <-> S: 0.805843 -rate R <-> T: 0.543695 -rate R <-> W: 0.557424 -rate R <-> Y: 0.295274 -rate R <-> V: 0.160471 -rate N <-> D: 4.766737 -rate N <-> C: 0.496537 -rate N <-> Q: 1.592389 -rate N <-> E: 0.508692 -rate N <-> G: 1.350015 -rate N <-> H: 4.234381 -rate N <-> I: 0.179830 -rate N <-> L: 0.064256 -rate N <-> K: 2.014327 -rate N <-> M: 0.348390 -rate N <-> F: 0.084068 -rate N <-> P: 0.151925 -rate N <-> S: 3.764032 -rate N <-> T: 1.878729 -rate N <-> W: 0.042610 -rate N <-> Y: 0.574720 -rate N <-> V: 0.078587 -rate D <-> C: 0.058743 -rate D <-> Q: 0.491483 -rate D <-> E: 4.924234 -rate D <-> G: 0.793424 -rate D <-> H: 0.870603 -rate D <-> I: 0.010038 -rate D <-> L: 0.014157 -rate D <-> K: 0.265711 -rate D <-> M: 0.023991 -rate D <-> F: 0.016354 -rate D <-> P: 0.370412 -rate D <-> S: 1.164675 -rate D <-> T: 0.399902 -rate D <-> W: 0.028068 -rate D <-> Y: 0.126872 -rate D <-> V: 0.035653 -rate C <-> Q: 0.079639 -rate C <-> E: 0.003286 -rate C <-> G: 0.534566 -rate C <-> H: 0.601499 -rate C <-> I: 0.301083 -rate C <-> L: 0.557800 -rate C <-> K: 0.012457 -rate C <-> M: 0.839207 -rate C <-> F: 1.037881 -rate C <-> P: 0.070787 -rate C <-> S: 2.614753 -rate C <-> T: 1.073780 -rate C <-> W: 0.629281 -rate C <-> Y: 1.094488 -rate C <-> V: 1.839864 -rate Q <-> E: 3.876936 -rate Q <-> G: 0.251626 -rate Q <-> H: 4.520102 -rate Q <-> I: 0.068413 -rate Q <-> L: 0.546954 -rate Q <-> K: 3.037150 -rate Q <-> M: 1.570619 -rate Q <-> F: 0.033669 -rate Q <-> P: 0.586241 -rate Q <-> S: 1.149231 -rate Q <-> T: 1.014297 -rate Q <-> W: 0.221802 -rate Q <-> Y: 0.241650 -rate Q <-> V: 0.197511 -rate E <-> G: 0.327583 -rate E <-> H: 0.398044 -rate E <-> I: 0.041567 -rate E <-> L: 0.065426 -rate E <-> K: 1.697022 -rate E <-> M: 0.163145 -rate E <-> F: 0.017664 -rate E <-> P: 0.393844 -rate E <-> S: 0.574671 -rate E <-> T: 0.567695 -rate E <-> W: 0.073107 -rate E <-> Y: 0.112720 -rate E <-> V: 0.230098 -rate G <-> H: 0.292498 -rate G <-> I: 0.008174 -rate G <-> L: 0.041563 -rate G <-> K: 0.278555 -rate G <-> M: 0.131033 -rate G <-> F: 0.084125 -rate G <-> P: 0.184955 -rate G <-> S: 1.633930 -rate G <-> T: 0.121922 -rate G <-> W: 0.252125 -rate G <-> Y: 0.051346 -rate G <-> V: 0.072026 -rate H <-> I: 0.102245 -rate H <-> L: 0.343988 -rate H <-> K: 0.654763 -rate H <-> M: 0.415502 -rate H <-> F: 0.640560 -rate H <-> P: 0.477834 -rate H <-> S: 0.929667 -rate H <-> T: 0.548649 -rate H <-> W: 0.560661 -rate H <-> Y: 4.983361 -rate H <-> V: 0.111759 -rate I <-> L: 3.892408 -rate I <-> K: 0.149373 -rate I <-> M: 4.013113 -rate I <-> F: 1.044902 -rate I <-> P: 0.073509 -rate I <-> S: 0.060198 -rate I <-> T: 0.970728 -rate I <-> W: 0.104854 -rate I <-> Y: 0.218350 -rate I <-> V: 10.000000 -rate L <-> K: 0.129119 -rate L <-> M: 5.927594 -rate L <-> F: 2.434657 -rate L <-> P: 0.233879 -rate L <-> S: 0.171176 -rate L <-> T: 0.284471 -rate L <-> W: 0.581863 -rate L <-> Y: 0.281383 -rate L <-> V: 1.598956 -rate K <-> M: 0.616581 -rate K <-> F: 0.022460 -rate K <-> P: 0.366530 -rate K <-> S: 0.703048 -rate K <-> T: 1.067567 -rate K <-> W: 0.046864 -rate K <-> Y: 0.123890 -rate K <-> V: 0.173913 -rate M <-> F: 1.689205 -rate M <-> P: 0.093763 -rate M <-> S: 0.325811 -rate M <-> T: 1.897216 -rate M <-> W: 0.653740 -rate M <-> Y: 0.451968 -rate M <-> V: 1.782983 -rate F <-> P: 0.088706 -rate F <-> S: 0.339765 -rate F <-> T: 0.154944 -rate F <-> W: 2.307349 -rate F <-> Y: 7.328222 -rate F <-> V: 0.614777 -rate P <-> S: 1.256567 -rate P <-> T: 0.536635 -rate P <-> W: 0.089332 -rate P <-> Y: 0.084151 -rate P <-> V: 0.278428 -rate S <-> T: 6.077767 -rate S <-> W: 0.233693 -rate S <-> Y: 0.376132 -rate S <-> V: 0.092373 -rate T <-> W: 0.132241 -rate T <-> Y: 0.230856 -rate T <-> V: 2.054781 -rate W <-> Y: 2.959699 -rate W <-> V: 0.177959 -rate Y <-> V: 0.234116 - -freq pi(A): 0.079066 -freq pi(R): 0.055941 -freq pi(N): 0.041977 -freq pi(D): 0.053052 -freq pi(C): 0.012937 -freq pi(Q): 0.040767 -freq pi(E): 0.071586 -freq pi(G): 0.057337 -freq pi(H): 0.022355 -freq pi(I): 0.062157 -freq pi(L): 0.099081 -freq pi(K): 0.064600 -freq pi(M): 0.022951 -freq pi(F): 0.042302 -freq pi(P): 0.044040 -freq pi(S): 0.061197 -freq pi(T): 0.053287 -freq pi(W): 0.012066 -freq pi(Y): 0.034155 -freq pi(V): 0.069146 - - -ML search took 1433.381314 secs or 0.398161 hours - -Combined Bootstrap and ML search took 1714.774499 secs or 0.476326 hours - -Drawing Bootstrap Support Values on best-scoring ML tree ... - - - -Found 1 tree in File /home/projects-wrighton-2/Pipeline_Development/DRAM2-Nextflow/DRAM2-Trees-Development/dmso/RAxML_bestTree.dmso_refs.fasta - - - -Found 1 tree in File /home/projects-wrighton-2/Pipeline_Development/DRAM2-Nextflow/DRAM2-Trees-Development/dmso/RAxML_bestTree.dmso_refs.fasta - -Program execution info written to /home/projects-wrighton-2/Pipeline_Development/DRAM2-Nextflow/DRAM2-Trees-Development/dmso/RAxML_info.dmso_refs.fasta -All 100 bootstrapped trees written to: /home/projects-wrighton-2/Pipeline_Development/DRAM2-Nextflow/DRAM2-Trees-Development/dmso/RAxML_bootstrap.dmso_refs.fasta - -Best-scoring ML tree written to: /home/projects-wrighton-2/Pipeline_Development/DRAM2-Nextflow/DRAM2-Trees-Development/dmso/RAxML_bestTree.dmso_refs.fasta - -Best-scoring ML tree with support values written to: /home/projects-wrighton-2/Pipeline_Development/DRAM2-Nextflow/DRAM2-Trees-Development/dmso/RAxML_bipartitions.dmso_refs.fasta - -Best-scoring ML tree with support values as branch labels written to: /home/projects-wrighton-2/Pipeline_Development/DRAM2-Nextflow/DRAM2-Trees-Development/dmso/RAxML_bipartitionsBranchLabels.dmso_refs.fasta - -Overall execution time for full ML analysis: 1714.841682 secs or 0.476345 hours or 0.019848 days diff --git a/assets/trees/dmso/dmso.refpkg/Untitled 1.csv b/assets/trees/dmso/dmso.refpkg/Untitled 1.csv deleted file mode 100644 index 1ed57cf6..00000000 --- a/assets/trees/dmso/dmso.refpkg/Untitled 1.csv +++ /dev/null @@ -1,87 +0,0 @@ -gene call notes info -A_Nitrobacter_hamburgensis_YP_578638 NxrA Cytoplasmic Nitrite oxidoreductase -Acidovorax delafieldii_NARG NarG Nitrogen reductase -ACTB1_Anaeromyxobacter_dehalogenans_YP_002491266 ACTB1 Not sure if we want this -ACTB1_Bdellovibrio_bacteriovorus_NP_96849 ACTB1 Not sure if we want this -ACTB1_Candidatus_Koribacter_versatilis_Ellin345_YP_592078 ACTB1 Not sure if we want this -ACTB1_Candidatus_Solibacter_usitatus_YP_821785 ACTB1 Not sure if we want this -ACTB1_Chloroflexus_aggregans_YP_002464666 ACTB1 Not sure if we want this -ACTB1_Cytophaga_hutchinsonii_YP_678817 ACTB1 Not sure if we want this -ACTB1_Flavobacterium_psychrophilum_YP_001295304 ACTB1 Not sure if we want this -ACTB1_Gallionella_capsiferriformans_ES_2_YP_003846257 ACTB1 Not sure if we want this -ACTB1_Geobacter_metallireducens_GS_15_YP_384764 ACTB1 Not sure if we want this -ACTB1_Geobacter_sp_M18_YP_004200644 ACTB1 Not sure if we want this -ACTB1_Geobacter_uraniireducens_Rf4_YP_001231524 ACTB1 Not sure if we want this -ACTB1_Gluconacetobacter_diazotrophicus_YP_001602862 ACTB1 Not sure if we want this -ACTB1_Leptospira_interrogans_serovar_NP_713447 ACTB1 Not sure if we want this -ACTB1_Mariprofundus_ferrooxydans_ZP_01451016 ACTB1 Not sure if we want this -ACTB1_Methylobacterium_sp_4_YP_001772545 ACTB1 Not sure if we want this -ACTB1_Nitrosococcus_oceani_YP_343269 ACTB1 Not sure if we want this -ACTB1_Opitutus_terrae_gb_ACB77208 ACTB1 Not sure if we want this -ACTB1_Ralstonia_eutropha_YP_298623 ACTB1 Not sure if we want this -ACTB1_Rhodothermus_marinus_gb_ABV55245 ACTB1 Not sure if we want this -ACTB1_Salinibacter_ruber_emb_CBH25246 ACTB1 Not sure if we want this -ACTB1_Sideroxydans_lithotrophicus_ES_1_YP_003523268 ACTB1 Not sure if we want this -Alkalilimnicola_ehrlichii_ABI55571 ArxA Anaerobic arsenite oxidase -ArrA_Bacillus_selenitireducens_gb_AAQ19491 ArrA Arsenate reductase -ArrA_Chrysiogenes_arsenatis_gb_AAU11839 ArrA Arsenate reductase -ArrA_Halarsenatibacter_silvermanii_gb_ACF74513 ArrA Arsenate reductase -ArrA_Sulfurospirillum_barnesii_gb_AAU11840 ArrA Arsenate reductase -ArrA_Wolinella_succinogenes_NP_906980 ArrA Arsenate reductase -ArxA_Ectothiorhodospira_sp_PHS_1_ZP_09695308 ArxA Anaerobic arsenite oxidase -B_Caldithrix_abyssi_ZP_09550397 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase double check -B_Nitrobacter_hamburgensis_YP_578186 NxrA Cytoplasmic Nitrite oxidoreductase -Beggiatoa_sp_PS_ZP_02000390 Unknown Function -DmsA_Actinobacillus_succinogenes_130Z gi|75429943|ref|ZP_00732527.1| DmsA Dimethl sulphoxide reductase -DmsA_E_coli_sp_P18775 DmsA Dimethl sulphoxide reductase -DmsA_Haemophilus_influenza_sp_P45004 DmsA Dimethl sulphoxide reductase -Gemmatimonas_aurantiaca_YP_002761548 Alternative complex III -Halorhodospira_halophila_YP_001001949 ArxA Anaerobic arsenite oxidase -Hydrogenobacter_thermophilus_YP_003433365 Unknown Function -Hydrogenobaculum_sp_Y04AAS1_YP_002121006 Unknown Function -I_OP1_uncultured_candidate_division_bacterium_BAL57377 Unknown Function -II_OP1_uncultured_candidate_division_UNIPROT_TREMBL_H5SSA4 Unknown Function -NarG_Escherichia_coli_NP_415742 NarG Nitrogen reductase -NarG_Halomonas_maura_gb_AAT47523 NarG Nitrogen reductase -NarG_Pseudomonas_fluorescens_gb_AEV63780 NarG Nitrogen reductase -NarG_Pseudomonas_stutzeri_gb_AAZ43099 NarG Nitrogen reductase -Natrinema_pellirubrum_YP_007282293 Unknown Function double check -Nitrobacter_sp_Nb_311A_ZP_01048070 NxrA Cytoplasmic Nitrite oxidoreductase -Nitrobacter_winogradskyi_gb_ABA05326 NxrA Cytoplasmic Nitrite oxidoreductase -Nitrococcus_mobi_EAR23355 NxrA Cytoplasmic Nitrite oxidoreductase -NxrA_Candidatus_K_stuttgartiensis_CAJ72445 NxrA Periplasmic Nitrite oxidoreductase -NxrA_planctomycete_KSU_1_ZP_10101005 NxrA Periplasmic Nitrite oxidoreductase -NxrA1_Nitrospira_defluvii_YP_003798853 NxrA Periplasmic Nitrite oxidoreductase -NxrA2_Nitrospira_defluvii_YP_003798871 NxrA Periplasmic Nitrite oxidoreductase -PhsA_Wolinella_succinogenes_NP_906934 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_Carboxydothermus_hydrogenoformans_YP_361367 Psra Thiosulphate reductase -PsrA_PhsA_Acidiphilium_cryptum_YP_001233491 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Archaeoglobus_fulgidus_NP_071207 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Geobacter_lovleyi_ZP_01593406 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Moorella_thermoacetica_ATCC_YP_429324 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Thermosinus_carboxydivorans_ZP_01667237 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Thermus_thermophilus_YP_004130 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_Wolinella_succinogenes_NP_906381 Psra Thiosulphate reductase -QrcB_delta_proteobacterium_NaphS2_ZP_07200609 QrcB Not sure if we want this -QrcB_Desulfatibacillum_alkenivorans_YP_002430439 QrcB Not sure if we want this -QrcB_Desulfococcus_oleovorans_YP_001530428 QrcB Not sure if we want this -QrcB_Desulfomicrobium_baculatum_YP_003159879 QrcB Not sure if we want this -QrcB_Desulfovibrio_magneticus_YP_002953179 QrcB Not sure if we want this -QrcB_Desulfovibrio_vulgaris_YP_967712 QrcB Not sure if we want this -QrcB_Syntrophobacter_fumaroxidans_YP_844744 QrcB Not sure if we want this -RBG1_10 Not sure if we want this -RBG1_1305 Not sure if we want this -RBG1_855 Not sure if we want this -TMAO_Citrobacter_youngae_ZP_06352135 TMAO No info on tree -TMAO_E_coli_CAA52095 TMAO No info on tree -TMAO_Photobacterium_profundum_YP_129680 TMAO No info on tree -TMAO_Salmonella_enterica_gb_AEZ47489 TMAO No info on tree -TMAO_Shewanella_massilia_CAA06851 TMAO No info on tree -TMAO_Vibrio_vulnificus_YP_004189064 TMAO No info on tree -TtrA_Aeropyrum_pernix_NP_148724 TrtA Tetrathionate reductase -TtrA_Haemophilus_somnus_gb_ABI25172 TrtA Tetrathionate reductase -TtrA_Photobacterium_profundum_YP_133039 TrtA Tetrathionate reductase -TtrA_Pyrobaculum_aerophilum_NP_559177 TrtA Tetrathionate reductase -TtrA_Pyrobaculum_arsenaticum_YP_001152643 TrtA Tetrathionate reductase -TtrA_Wolinella_succinogenes_NP_907142 TrtA Tetrathionate reductase -TtrA_Yersinia_enterocolitica_YP_001005907 TrtA Tetrathionate reductase diff --git a/assets/trees/dmso/dmso.refpkg/bipartitionsBranchLabels.dmso_refs.fasta_mode_low.renamed b/assets/trees/dmso/dmso.refpkg/bipartitionsBranchLabels.dmso_refs.fasta_mode_low.renamed deleted file mode 100644 index 2f537895..00000000 --- a/assets/trees/dmso/dmso.refpkg/bipartitionsBranchLabels.dmso_refs.fasta_mode_low.renamed +++ /dev/null @@ -1 +0,0 @@ -(Beggiatoa_sp_PS_ZP_02000390:0.31018678994441711838,(Natrinema_pellirubrum_YP_007282293:0.62627241139953637727,((Hydrogenobaculum_sp_Y04AAS1_YP_002121006:0.25202562736528244525,Hydrogenobacter_thermophilus_YP_003433365:0.22525561709713604053):0.30165783563945486323[100],((((Acidovorax:0.13667246099892554900,((NarG_Pseudomonas_stutzeri_gb_AAZ43099:0.03393658559446594003,NarG_Pseudomonas_fluorescens_gb_AEV63780:0.04907565545382640976):0.11325289427816984111[100],(NarG_Halomonas_maura_gb_AAT47523:0.14646439078919698540,NarG_Escherichia_coli_NP_415742:0.14944442674389668557):0.04669707032807739883[63]):0.08860689645843677908[81]):0.28323472060421345242[100],(Nitrococcus_mobi_EAR23355:0.17092574999759441168,(Nitrobacter_sp_Nb_311A_ZP_01048070:0.01046015345712418033,((A_Nitrobacter_hamburgensis_YP_578638:0.00851203468703114544,B_Nitrobacter_hamburgensis_YP_578186:0.02695906079380491413):0.02171289090283912496[94],Nitrobacter_winogradskyi_gb_ABA05326:0.03093192783563805323):0.01026905465586188879[78]):0.17248328026687961834[100]):0.33751197543721728200[100]):0.99152762326621168842[100],(((((TMAO_Vibrio_vulnificus_YP_004189064:0.08824900046563541323,TMAO_Photobacterium_profundum_YP_129680:0.08590352010876725619):0.18306761819681807713[100],TMAO_Shewanella_massilia_CAA06851:0.20825829024465955519):0.17862368552796076271[100],(TMAO_Citrobacter_youngae_ZP_06352135:0.41133442915839824039,(TMAO_Salmonella_enterica_gb_AEZ47489:0.06565565202990467086,TMAO_E_coli_CAA52095:0.06018585519821552376):0.23462434322473377235[100]):0.10347742396753679961[75]):0.92112695451955228787[100],(DmsA_E_coli_sp_P18775:0.23322212943307793487,(DmsA_Haemophilus_influenza_sp_P45004:0.08081484463360698312,DmsA_Actinobacillus_succinogenes_130Z:0.10868685038622999395):0.12598399783029093357[100]):0.57382198141086615539[100]):0.26440844330547474961[90],(((((TtrA_Haemophilus_somnus_gb_ABI25172:0.30384068025070881669,TtrA_Yersinia_enterocolitica_YP_001005907:0.36541021578513749324):0.18490699160553386582[91],(TtrA_Wolinella_succinogenes_NP_907142:0.64153003857806889521,TtrA_Photobacterium_profundum_YP_133039:0.94160881467741908146):0.14870581556773784793[62]):0.74286956410734672485[100],((TtrA_Pyrobaculum_arsenaticum_YP_001152643:0.16132115694270368622,TtrA_Pyrobaculum_aerophilum_NP_559177:0.08788089082126224194):0.28471506447190164657[100],TtrA_Aeropyrum_pernix_NP_148724:0.19811327077554555243):0.99152820694335630503[100]):0.56849048977295146834[100],((((((QrcB_Desulfatibacillum_alkenivorans_YP_002430439:0.69062666806863026725,QrcB_Desulfococcus_oleovorans_YP_001530428:0.52799062697662879629):0.21107589090264863851[97],(QrcB_delta_proteobacterium_NaphS2_ZP_07200609:0.60046780137077260253,QrcB_Syntrophobacter_fumaroxidans_YP_844744:0.80694048976353893732):0.09044026801852970976[32]):0.09373951901508625895[37],(QrcB_Desulfomicrobium_baculatum_YP_003159879:0.54928820408861156466,(QrcB_Desulfovibrio_magneticus_YP_002953179:0.54930955444688378542,QrcB_Desulfovibrio_vulgaris_YP_967712:0.47778813401120456827):0.12147059864301178178[49]):0.51927964796344860954[100]):0.27886064724177378471[100],((ACTB1_Geobacter_uraniireducens_Rf4_YP_001231524:0.11021967570082565058,(ACTB1_Geobacter_sp_M18_YP_004200644:0.22414922514809035303,ACTB1_Geobacter_metallireducens_GS_15_YP_384764:0.19478125699568066276):0.02772326548080589897[21]):0.58363416355970954008[100],((ACTB1_Mariprofundus_ferrooxydans_ZP_01451016:0.49055905401768445939,(ACTB1_Sideroxydans_lithotrophicus_ES_1_YP_003523268:0.21080659146162344930,ACTB1_Gallionella_capsiferriformans_ES_2_YP_003846257:0.26440906971492933453):0.35237320222753865107[100]):0.27523086952627628943[100],(((ACTB1_Leptospira_interrogans_serovar_NP_713447:0.79307148795825910259,(ACTB1_Bdellovibrio_bacteriovorus_NP_96849:0.69991229166566804043,RBG1_1305:0.89737144652423395108):0.09288663579756109567[60]):0.16716761244359509830[71],((ACTB1_Flavobacterium_psychrophilum_YP_001295304:1.02606743524938170964,ACTB1_Cytophaga_hutchinsonii_YP_678817:0.50283093158201408457):0.28799005578471925659[99],(ACTB1_Gluconacetobacter_diazotrophicus_YP_001602862:0.96646104346107775118,((ACTB1_Methylobacterium_sp_4_YP_001772545:0.63567467187472281864,ACTB1_Ralstonia_eutropha_YP_298623:0.82860248741955488949):0.13581998044218268618[33],(((ACTB1_Rhodothermus_marinus_gb_ABV55245:0.38865363015662424129,ACTB1_Salinibacter_ruber_emb_CBH25246:0.59233821425909760627):0.40688523208875704285[100],(ACTB1_Anaeromyxobacter_dehalogenans_YP_002491266:0.68381691055352000763,ACTB1_Opitutus_terrae_gb_ACB77208:0.83025728066530646299):0.14219255226486615662[50]):0.12468269714690130567[49],(ACTB1_Chloroflexus_aggregans_YP_002464666:0.46873659447195903383,((ACTB1_Candidatus_Koribacter_versatilis_Ellin345_YP_592078:0.50464784810003238125,ACTB1_Candidatus_Solibacter_usitatus_YP_821785:0.54245637379061018013):0.13733595525661521086[61],ACTB1_Nitrosococcus_oceani_YP_343269:0.49410400734252379884):0.10917412309064457310[21]):0.08450438372508251028[17]):0.12072458219781251332[16]):0.15098607158503560277[24]):0.59860089891352907809[100]):0.08727823617340259299[29]):0.69877093272090162746[100],Gemmatimonas_aurantiaca_YP_002761548:0.84260059047056301562):0.13752307751231809818[65]):0.28006707903346222954[100]):0.23466558402636081282[100]):0.17614184128090995540[87],((II_OP1_uncultured_candidate_division_UNIPROT_TREMBL_H5SSA4:0.33467215681677725536,RBG1_855:0.82161967860182749668):0.12971199868024066437[76],(Alkalilimnicola_ehrlichii_ABI55571:0.16927440252820141753,(Halorhodospira_halophila_YP_001001949:0.15823128010931214460,ArxA_Ectothiorhodospira_sp_PHS_1_ZP_09695308:0.31283575163699722799):0.07568817065129679333[35]):0.71169409868301625188[100]):0.10732618473035443474[35]):0.18919835836582774014[53],(ArrA_Chrysiogenes_arsenatis_gb_AAU11839:0.55861722570644156693,((ArrA_Bacillus_selenitireducens_gb_AAQ19491:0.57862013020904345950,(ArrA_Wolinella_succinogenes_NP_906980:0.11656277792250165082,ArrA_Sulfurospirillum_barnesii_gb_AAU11840:0.25535586149819144985):0.25704715855239179678[100]):0.10824894176711383209[52],ArrA_Halarsenatibacter_silvermanii_gb_ACF74513:0.46929511501429799214):0.04484475421107837756[41]):0.55088216920711008395[100]):0.17320965912547314769[100]):0.19386424023928239269[96],((PsrA_PhsA_Moorella_thermoacetica_ATCC_YP_429324:0.46895807528927402341,PsrA_Carboxydothermus_hydrogenoformans_YP_361367:0.36278131760523796290):0.30501332134095587856[100],((PhsA_Wolinella_succinogenes_NP_906934:0.83556313083303890288,(PsrA_PhsA_Archaeoglobus_fulgidus_NP_071207:1.02028532974974517344,(PsrA_PhsA_Thermosinus_carboxydivorans_ZP_01667237:0.39406116350918174440,PsrA_Wolinella_succinogenes_NP_906381:0.56906242612948243487):0.37309846673540075779[100]):0.07083616780588812556[32]):0.10606547837054894345[26],(PsrA_PhsA_Thermus_thermophilus_YP_004130:0.52048385599284674452,((B_Caldithrix_abyssi_ZP_09550397:0.29162331030389027076,PsrA_PhsA_Acidiphilium_cryptum_YP_001233491:0.47229408641539760705):0.21497328944652449589[99],PsrA_PhsA_Geobacter_lovleyi_ZP_01593406:0.42362772298653567082):0.09681557138376449545[35]):0.48200494710375846319[100]):0.06133241697114610869[45]):0.32256472661171109451[100]):0.43399518039056000918[100]):0.42841990737161983471[100]):0.57877135424072545522[100],(((NxrA_planctomycete_KSU_1_ZP_10101005:0.07351303248959742409,NxrA_Candidatus_K_stuttgartiensis_CAJ72445:0.10665101974941076923):0.18189417316903719324[100],(NxrA1_Nitrospira_defluvii_YP_003798853:0.06498836035058985772,NxrA2_Nitrospira_defluvii_YP_003798871:0.07400335506604591163):0.28809352956461248274[100]):0.24410407282623491909[100],RBG1_10:0.21737233260787308664):0.28017652615537430583[100]):0.25972423664656024700[100]):0.04838674611379127632[31]):0.04397292308026813645[52],I_OP1_uncultured_candidate_division_bacterium_BAL57377:0.26884323213695593413); diff --git a/assets/trees/dmso/dmso.refpkg/dmso-tree-mapping.tsv b/assets/trees/dmso/dmso.refpkg/dmso-tree-mapping.tsv deleted file mode 100644 index 1ed57cf6..00000000 --- a/assets/trees/dmso/dmso.refpkg/dmso-tree-mapping.tsv +++ /dev/null @@ -1,87 +0,0 @@ -gene call notes info -A_Nitrobacter_hamburgensis_YP_578638 NxrA Cytoplasmic Nitrite oxidoreductase -Acidovorax delafieldii_NARG NarG Nitrogen reductase -ACTB1_Anaeromyxobacter_dehalogenans_YP_002491266 ACTB1 Not sure if we want this -ACTB1_Bdellovibrio_bacteriovorus_NP_96849 ACTB1 Not sure if we want this -ACTB1_Candidatus_Koribacter_versatilis_Ellin345_YP_592078 ACTB1 Not sure if we want this -ACTB1_Candidatus_Solibacter_usitatus_YP_821785 ACTB1 Not sure if we want this -ACTB1_Chloroflexus_aggregans_YP_002464666 ACTB1 Not sure if we want this -ACTB1_Cytophaga_hutchinsonii_YP_678817 ACTB1 Not sure if we want this -ACTB1_Flavobacterium_psychrophilum_YP_001295304 ACTB1 Not sure if we want this -ACTB1_Gallionella_capsiferriformans_ES_2_YP_003846257 ACTB1 Not sure if we want this -ACTB1_Geobacter_metallireducens_GS_15_YP_384764 ACTB1 Not sure if we want this -ACTB1_Geobacter_sp_M18_YP_004200644 ACTB1 Not sure if we want this -ACTB1_Geobacter_uraniireducens_Rf4_YP_001231524 ACTB1 Not sure if we want this -ACTB1_Gluconacetobacter_diazotrophicus_YP_001602862 ACTB1 Not sure if we want this -ACTB1_Leptospira_interrogans_serovar_NP_713447 ACTB1 Not sure if we want this -ACTB1_Mariprofundus_ferrooxydans_ZP_01451016 ACTB1 Not sure if we want this -ACTB1_Methylobacterium_sp_4_YP_001772545 ACTB1 Not sure if we want this -ACTB1_Nitrosococcus_oceani_YP_343269 ACTB1 Not sure if we want this -ACTB1_Opitutus_terrae_gb_ACB77208 ACTB1 Not sure if we want this -ACTB1_Ralstonia_eutropha_YP_298623 ACTB1 Not sure if we want this -ACTB1_Rhodothermus_marinus_gb_ABV55245 ACTB1 Not sure if we want this -ACTB1_Salinibacter_ruber_emb_CBH25246 ACTB1 Not sure if we want this -ACTB1_Sideroxydans_lithotrophicus_ES_1_YP_003523268 ACTB1 Not sure if we want this -Alkalilimnicola_ehrlichii_ABI55571 ArxA Anaerobic arsenite oxidase -ArrA_Bacillus_selenitireducens_gb_AAQ19491 ArrA Arsenate reductase -ArrA_Chrysiogenes_arsenatis_gb_AAU11839 ArrA Arsenate reductase -ArrA_Halarsenatibacter_silvermanii_gb_ACF74513 ArrA Arsenate reductase -ArrA_Sulfurospirillum_barnesii_gb_AAU11840 ArrA Arsenate reductase -ArrA_Wolinella_succinogenes_NP_906980 ArrA Arsenate reductase -ArxA_Ectothiorhodospira_sp_PHS_1_ZP_09695308 ArxA Anaerobic arsenite oxidase -B_Caldithrix_abyssi_ZP_09550397 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase double check -B_Nitrobacter_hamburgensis_YP_578186 NxrA Cytoplasmic Nitrite oxidoreductase -Beggiatoa_sp_PS_ZP_02000390 Unknown Function -DmsA_Actinobacillus_succinogenes_130Z gi|75429943|ref|ZP_00732527.1| DmsA Dimethl sulphoxide reductase -DmsA_E_coli_sp_P18775 DmsA Dimethl sulphoxide reductase -DmsA_Haemophilus_influenza_sp_P45004 DmsA Dimethl sulphoxide reductase -Gemmatimonas_aurantiaca_YP_002761548 Alternative complex III -Halorhodospira_halophila_YP_001001949 ArxA Anaerobic arsenite oxidase -Hydrogenobacter_thermophilus_YP_003433365 Unknown Function -Hydrogenobaculum_sp_Y04AAS1_YP_002121006 Unknown Function -I_OP1_uncultured_candidate_division_bacterium_BAL57377 Unknown Function -II_OP1_uncultured_candidate_division_UNIPROT_TREMBL_H5SSA4 Unknown Function -NarG_Escherichia_coli_NP_415742 NarG Nitrogen reductase -NarG_Halomonas_maura_gb_AAT47523 NarG Nitrogen reductase -NarG_Pseudomonas_fluorescens_gb_AEV63780 NarG Nitrogen reductase -NarG_Pseudomonas_stutzeri_gb_AAZ43099 NarG Nitrogen reductase -Natrinema_pellirubrum_YP_007282293 Unknown Function double check -Nitrobacter_sp_Nb_311A_ZP_01048070 NxrA Cytoplasmic Nitrite oxidoreductase -Nitrobacter_winogradskyi_gb_ABA05326 NxrA Cytoplasmic Nitrite oxidoreductase -Nitrococcus_mobi_EAR23355 NxrA Cytoplasmic Nitrite oxidoreductase -NxrA_Candidatus_K_stuttgartiensis_CAJ72445 NxrA Periplasmic Nitrite oxidoreductase -NxrA_planctomycete_KSU_1_ZP_10101005 NxrA Periplasmic Nitrite oxidoreductase -NxrA1_Nitrospira_defluvii_YP_003798853 NxrA Periplasmic Nitrite oxidoreductase -NxrA2_Nitrospira_defluvii_YP_003798871 NxrA Periplasmic Nitrite oxidoreductase -PhsA_Wolinella_succinogenes_NP_906934 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_Carboxydothermus_hydrogenoformans_YP_361367 Psra Thiosulphate reductase -PsrA_PhsA_Acidiphilium_cryptum_YP_001233491 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Archaeoglobus_fulgidus_NP_071207 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Geobacter_lovleyi_ZP_01593406 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Moorella_thermoacetica_ATCC_YP_429324 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Thermosinus_carboxydivorans_ZP_01667237 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Thermus_thermophilus_YP_004130 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_Wolinella_succinogenes_NP_906381 Psra Thiosulphate reductase -QrcB_delta_proteobacterium_NaphS2_ZP_07200609 QrcB Not sure if we want this -QrcB_Desulfatibacillum_alkenivorans_YP_002430439 QrcB Not sure if we want this -QrcB_Desulfococcus_oleovorans_YP_001530428 QrcB Not sure if we want this -QrcB_Desulfomicrobium_baculatum_YP_003159879 QrcB Not sure if we want this -QrcB_Desulfovibrio_magneticus_YP_002953179 QrcB Not sure if we want this -QrcB_Desulfovibrio_vulgaris_YP_967712 QrcB Not sure if we want this -QrcB_Syntrophobacter_fumaroxidans_YP_844744 QrcB Not sure if we want this -RBG1_10 Not sure if we want this -RBG1_1305 Not sure if we want this -RBG1_855 Not sure if we want this -TMAO_Citrobacter_youngae_ZP_06352135 TMAO No info on tree -TMAO_E_coli_CAA52095 TMAO No info on tree -TMAO_Photobacterium_profundum_YP_129680 TMAO No info on tree -TMAO_Salmonella_enterica_gb_AEZ47489 TMAO No info on tree -TMAO_Shewanella_massilia_CAA06851 TMAO No info on tree -TMAO_Vibrio_vulnificus_YP_004189064 TMAO No info on tree -TtrA_Aeropyrum_pernix_NP_148724 TrtA Tetrathionate reductase -TtrA_Haemophilus_somnus_gb_ABI25172 TrtA Tetrathionate reductase -TtrA_Photobacterium_profundum_YP_133039 TrtA Tetrathionate reductase -TtrA_Pyrobaculum_aerophilum_NP_559177 TrtA Tetrathionate reductase -TtrA_Pyrobaculum_arsenaticum_YP_001152643 TrtA Tetrathionate reductase -TtrA_Wolinella_succinogenes_NP_907142 TrtA Tetrathionate reductase -TtrA_Yersinia_enterocolitica_YP_001005907 TrtA Tetrathionate reductase diff --git a/assets/trees/dmso/dmso.refpkg/dmso.aln b/assets/trees/dmso/dmso.refpkg/dmso.aln deleted file mode 100644 index 22bfa700..00000000 --- a/assets/trees/dmso/dmso.refpkg/dmso.aln +++ /dev/null @@ -1,2838 +0,0 @@ ->Natrinema_pellirubrum_YP_007282293 ------------------------------------------------------------- -------------MANRDRSVDSANERSAEGTSVSRRTLLGGAGAAGV--AGFAGCLRLFT -DD-GEGNGNGTSTASKLNPLTEYPNREWESHYRDVWDV----------DDTYYLACRPND -THNCYLEANVK-NGV----VTRLGP--------SMNYGEAE------------------- ----DLYGNQASDRWDPRVCQKGLSMVERFYGER-RVTSPMIRQGFKDWVDEGFPREEDG- ----------SMPEEYA--KRGEDS-WYEASWD-EAYEYA--------AKTFLELADHYSG -A-DAQELLLEQGYDDRVVEEMQGVGTR--------------------------------- --------------------------TMKFRGGMPMLSTIGLFGEYRFAN-SMALVDHHVR -DVGEDEALGGVG-GDNYT-FHTDLPPGHPMVTGQQ---TVDFD-LANV-EYADNIVLAGI -----------NWMCTKMADSHWLTEARM---------NGAN----VTGIFTDYNATSSKC -D----ELVIIRPATDSALFLGVAQQIIATDGYDA----------EFVRSNTDLPLLVRMD -TGDHLRASDVFEDYDPADLERTQVAPADEHPAPTTVDTADQWITPDQR--EDWDDFVVYD -DAAGGVRAVDREAVGEEFDVDAALEGSWELELAD-------------------------- -------GDIVEVRPVFDLVKEYLDTT---------------------------------- -------------WDPESTAEVTGTEP---------EAVTNLAEQFADN----KESTLLLT -GMGP---NQYFNGDLKDRAAFLVASLTSNVGTHSGNVGSYAGNY---------------- -----RAAMLNGIPHYHLEDPFDPELDPDADSRVDSRITMES------------------- ------------------------MHFYSNLDKPLKIEGEYHMGDSHMNTP----TKSLWV -AGSNSILGN------------------------------AKGSYKIIEGLLR---TGKLE -AFFCNEWWWTMTCEY--SDIVFPA-DSWAEQNVHDLTASVTN----------PFLMVFPE -TGIDRVY-D---T--------RHD------CQIYQGVA-EKLAEKLDE------------ -------------PRLEQMWE--FIDE--------------------DEYRGKPYVQRILD -N---SNMTKGYDAETLIEKAERGEPALM--------MSTTYPKKIGTRQANDD------- -------------EPWYTKTGRLEFLREEETWTEVGETLPVHREAVDGTIYKPNVIVDDGD -HPLIDPETPDDLGWDDDNIEDA--------------------SARQVRNEVVSTDALVNS -SHPLQDVDPGFKYSFMTPKYRHGAHTFCNALP-----------NIAVWWG-PFGDRDRKD -DRKPYFG-----EGYVEMNPEDAKE-EGF-------------E-------------DGDY -VWVDADPND-RPYPSANGDPDEY--SR---A--L-MRVRYQPAMPRGVTRSWHN-LNQAS -HGTTEATPDR-TGMAK-------NEETDYVSLYRRGGHQSMTR-SWLRPTILTDEMNR-- ------KGLMGQSIGKGFAPD----VHCANGAPRESFVKFEKEGDAGEDGEGLWRPAEMGL -RPGYETETMQRYLDGDFTSTEGD------------------------------------- -- ->RBG1_10 ------------------------------------------------------------- -------------------------------MTLSRRRFLK---------ISSLSAAGALV -DL-PELKF-LQFLETVENPLEYYPNRDWEKIYRDQYRY----------DSSFTFVCTPND -THACRLRAYVR-NGI----VIRVEQ--------AYDVQNYT------------------- ----DLYGNKASVMWSPRGCNKGYNLPRRVYGPY-RVKHPMVRKGWKEWAEAGFPDPTLP- ----------ENQQKYF--RRGEDS-WVKVSWD-EGFELV--------AKGLLHTMEKYSG -E-KGAEILRKQGYPEEMIEAMHGSGAQ--------------------------------- --------------------------TIKIRGAMPLLGATRIFGFYR----FANMLGLYD- -G-----KLGARG-WSNFS-WHGDLPPGHPMVTGVK---CSDPE-LNDF-RHSKLLVFLGK -----------NMVESKMADAHWWIETIE---------RGGK----VVNISPEYSATSSKS -D----YWIPIRPGTDTALLLGVTQIIIQEKLYDQ----------DFIKKHTDLPLLIRMD -NLKLLRPTDIIKGYKNQILTGYSVKVQKIKPELR----------------EKWGDFVVWD -LKTKKPQTVTREDLGEKIERKGLNPALEGNYKIKL------------------------- -----VNGKEIEVKTVFQLYKELLSE----------------------------------- -------------YDLETVSQITGSPK---------NLIYQLAQDLATI----KP-ASIHT -GEGV---NHFFHCDLVTRAVWLPLALTGNIGKPGANVGHWAGNY---------------- -----KGEVFDGLGVYLNEDPFNPNLDPSAKLEDIKLKKYYKGEE---------------- ------------------------VCYWNYEDRPLIVKGKCFTGKTHMPTP----TKAEWV -GNGNLLNN-------------------------------AKWAHNMIANVEG-----KVE -MIVYNEIEWTASCEY--ADVVFPV-HSWMELTLPDMTASCSN----------PFLQV-WK -GGIKPIF-D---T--------KQD------NEVLAGVA-AKLSELTHD------------ -------------NRYKDYWK--FVLE----------------------GNNEVYLQRILD -A---CSTTKGYKIDELLKSDRGWLMNFRTYP-----RIPFWE-QIQ----ESK------- --------------PFYTKTGRMEFYREEDEFIDYGENLIVHREPVEATPYLPNVILGTHK -AIRPNSYGISPESINADER-----------------------QVRNLKMSWKQ-VKLSKN -P----LWEKGFRFYCLTPKSRHTVHSSWSVLD-----------WNMIWQS-NFGDPYRMD -NRTPGVG-----EHQMHMNPLDAKE-LGI-------------N-------------DGDY -AYVDANPED-RPYTGWKEEDPFYKVSR---L--M-VRVKYNPAYPRGITMIKHASFIATH -KSVKAHESRPDKRAV--------SEDTGYQSSFRYGSQQSITR-GWLQPTMMTDSLVR-- ------KNYMGQEIGEGYEID----VNAPNTCPKETLVKIIKAEDGGMGGKGKWEPARTGY -TPAGENKDMKKFLEGGFILKV--------------------------------------- -- ->NxrA1_Nitrospira_defluvii_YP_003798853 ------------------------------------------------------------- ------------------------------MMQLSRRQFLKVS-------AGTVAVAAVAD -K--ALALTALQPVVEVNNPLGEYPDRSWERVYHDQYRY----------DSSFTWVCSPND -THACRIRAFVR-NGV----VMRVEQ--------NYDHQTYE------------------- ----DLYGNRGTFAHNPRMCLKGFTFHRRVYGPY-RLKGPLMRKGWKQWMDDGSPELTS-- ----------DVKRKYKFDSRFLDD-MVRVSWD-TAFTYV--------AKGLIVIGTRYSG -EAGARRLREQG-YAPEMIEMMKGAGVR--------------------------------- --------------------------TFKHRAGMPILGMMGKHANTRFNNCVLPLLDSWIR -KVNPDQAQGGRY-WNNYT-WHGDQDPSQPWWNGTQ---NCDVD-LSDM-RFTKLNTSWGK -----------NFVENKMPEAHWKLESME---------RGAR----LVIITPEYNPTASRA -D----YWIPVRPETDGALFLGASKIILDENYQDI----------DFIKGFTDMPLLVRTD -TLQYLDPHEVLKDYQVPDF--------------TKSYSGRVQGLSQDQV-QRLGGMMVWD -LAKGKAVPLHREQVGVHLAQSGIDPALTGTYRIKL------------------------- -----LNGREVDVMPIYQLYTIHLQ-D---------------------------------- -------------YDLDTVHQVNRAPK---------DLIVRWARDCGTV----KPAA-IHN -GEGV---CHYFHMTSMGRAAALVMMLTGNIGKFGTGCHTWSGNYKVGIWQA--------- -----APWSGAGASVYLGEDPWNLNLRDDVHGKEIKYRKYYYGEEPGYWNHG--------- ------------------------DNALIVNTPKYG--RKVFTGKTHMPSP----SKVRWV -VNVNILNN-------------------------------AKHHYDMVKNVDP-----NIE -MLVTQDIEMTSDVNH--ADVAFAV-NSWMEFTYPEMTATVSN----------PWVQI-WK -GGIRPLY-D---T--------RND------LDSFAGVA-AKLKEMTGE------------ -------------QRMADTYK--FVYH----------------------NRVDIYVQRILD -A---STTFFGYSADVMLKSEKG-----WMVMCRTYPRHPLWE-ETN----ESK------- --------------PHWTRSGRLETYRIEPEAIEYGENFISHREGPECTPYMPNAIMTTNP -YVRPEDYGIPVTAQHHDDK-----------------------TVRNIKLPWSE-IKQHPN -P----LWEKGYQFYCVTPKTRHRVHSQWSVND-----------WVQIYES-NFGDPYRMD -KRTPGVG-----EHQIHINPQAAKD-RGI-------------N-------------DGDY -CYVDGNPVD-RPYRGWKPSDPFYKVAR---L--M-IRAKYNPSYPYHVTMAKHAPYVSTA -KSVKGHETRPDGRAI--------AVDTGYQSNFRYGAQQSFTR-SWLMPMHQTDSLPG-- ------KQANALKFKWGFEID----HHAVNTVPKECLIRITKAEDGGIGARGPWEPVRTGF -TPGQENEFMVKWLKGEHIKIKV-------------------------------------- -- ->NxrA2_Nitrospira_defluvii_YP_003798871 ------------------------------------------------------------- -----------------------------MQVSVSRRQFLK-I-------SAGTVAAVAVA -DK-VLALTALQPVIEVGNPLGEYPDRSWERVYHDQYRY----------DSSFTWCCSPND -THGCRVRAFVR-NGV----VMRVEQ--------NYDHQTYE------------------- ----DLYGNRGTFAHNPRMCLKGFTFHRRVYGPY-RLKGPLMRKGWKQWMDDGSPELT-P- ----------DVKRKYKFDSRFLDD-LNRVSWD-TAFTYV--------AKAAVLIATRYSG -EAGARRLREQG-YAPEMIEMMKGAGVR--------------------------------- --------------------------TFKHRAGMPVLGIVGKMMNTRFNGGCLPLLDSWIR -KVDAEKAQGGKY-YSNYT-WHGDQDPSHPFWNGTQ---NCDVD-LSDM-RFSKLNTSWGK -----------NFVENKMPEAHWKLESIE---------RGAR----IVVITPEYNPTAYRA -D----YWIPVRPETDGANFLGAAKIIFDENLQDI----------DYIKEFTDLPLLVRTD -TLQYLDPRDVIADYKFPDF--------------SKSYSGRIQSLKPEQV-ERLGGMMVWD -LAKGKAVPLHREQVGFHFKESGIDPALTGTFRVKL------------------------- -----LNSREIDVMPIYQMYQVHLQ-D---------------------------------- -------------YDLDTTHQITRAPK---------DLIVRWARDSGTI----KPAA-MHN -GEGV---CHYFHMTEMGRAAAFIMTITGNIGKFGTGCHTWSGNYKAGIWNA--------- -----VPWSGAGLAVHTGEDPFNLTLDPNAHGKEIKTRSYYYGEEVGYWNHG--------- ------------------------DTALIVNTPKYG--RKVFTGKTHMPSP----SKVRWV -TNVNILNN-------------------------------AKHHYDMVKNVDP-----NIE -MIVTQDIEMTSDVNH--ADVAFAC-NSWMEFTYPEMTGTVSN----------PWIQI-WK -GGIRPLY-D---T--------RND------ADTFAGVA-AKLAEMTGD------------ -------------ARFRGVFH--FVYM----------------------NRVDVYPQRMLD -A---SATCYGYSADVMLKSEKG-----WMVMGRTYPRHPLWE-ETN----ESK------- --------------PQWTRSGRIETYRIEPEAIEYGENFISHREGPECTPYLPNAIFSNNP -FIRPDDYGIPITAQHHD--DK---------------------HVRNIKLPWAE-IKRHPN -P----LWEKGYQFYCVTPKTRHRVHSQWSVND-----------WVQIYES-NFGDPYRMD -KRTPGVG-----EHQLHINPQAAKD-RGI-------------N-------------DGDY -VFVDGNPVD-RPYRGWKPSDPFYKVAR---L--M-IRAKYNPAYPYHVTMAKHAPYVATA -KSVKGHETRPDGRAI--------AVDTGYQSNFRYGAQQSFTR-NWLMPMHQTDSLPG-- ------KHTIAWKFKWGYAID----HHGINTVPKECLIRITKAEDGGIGARGPWEPVRTGF -TPGQENEFMIKWLKGEHIKIKV-------------------------------------- -- ->NxrA_Candidatus_K_stuttgartiensis_CAJ72445 ------------------------------------------------------------- -------------------------------MKLTRRAFLQ-V-------AGATGATLTLA -KN-AMAFRLLKPAVVVDNPLDTYPDRRWESVYRDQYQY----------DRTFTYCCSPND -THACRIRAFVR-NNV----MMRVEQ--------NYDHQNYS------------------- ----DLYGNKATRNWNPRMCLKGYTFHRRVYGPY-RLRYPLIRKGWKRWADDGFPELT-P- ----------ENKTKYMFDNRGNDE-LLRASWD-EAFTYA--------SKGIIHITKKYSG -PEGAQKLIDQG-YPKEMVDRMQGAGTR--------------------------------- --------------------------TFKGRGGMGLLGVIGKYGMYRFNN-CLAIVDAHNR -GVGPDQALGGRN-WSNYT-WHGDQAPGHPFSHGLQ---TSDVD-MNDV-RFSKLLIQTGK -----------NLIENKMPEAHWVTEVME---------RGGK----IVVITPEYSPSAQKA -D----YWIPIRNNTDTALFLGITKILIDNKWYDA----------DYVKKFTDFPLLIRTD -TLKRVSPKDIIPNYKLQDI--------------SDGPSYHIQGLKDEQR-EIIGDFVVWD -AKSKGPKAITRDDVGETLVKKGIDPVLEGSFKLKT------------------------- -----IDGKEIEVMTLLEMYKIHLR-D---------------------------------- -------------YDIDSVVSMTNSPK---------DLIERLAKDIATI----KPVA-IHY -GEGV---NHYFHATLMNRSYYLPVMLTGNVGYFGSGSHTWAGNYKAGNFQA--------- -----SKWSGPGFYGWVAEDVFKPNLDPYASAKDLNIKGRALDEEVAYWNHS--------- ------------------------ERPLIVNTPKYG--RKVFTGKTHMPSP----TKVLWF -TNVNLINN-------------------------------AKHVYQMLKNVNP-----NIE -QIMSTDIEITGSIEY--ADFAFPA-NSWVEFQEFEITNSCSN----------PFIQIWGK -TGITPVY-E---S--------KDD------VKILAGMA-SKLGELLRD------------ -------------KRFEDNWK--FAIE----------------------GRASVYINRLLD -G---STTMKGYTCEDILN-GKYGEPGVAMLLFRTYPRHPFWE-QVH----ESL------- --------------PFYTPTGRLQAYNDEPEIIEYGENFIVHREGPEATPYLPNAIVSTNP -YIRPDDYGIPENAEYWEDR-----------------------TVRNIKKSWEE-TKKTKN -F----LWEKGYHFYCVTPKSRHTVHSQWAVTD-----------WNFIWNN-NFGDPYRMD -KRMPGVG-----EHQIHIHPQAARD-LGI-------------E-------------DGDY -VYVDANPAD-RPYEGWKPNDSFYKVSR---L--M-LRAKYNPAYPYNCTMMKHSAWISSD -KTVQAHETRPDGRA---------LSPSGYQSSFRYGSQQSITR-DWSMPMHQLDSLFH-- ------KAKIGMKFIFGFEAD----NHCINTVPKETLVKITKAENGGMGGKGVWDPVKTGY -TAGNENDFMKKFLNGELIKVDA-------------------------------------- -- ->NxrA_planctomycete_KSU_1_ZP_10101005 ------------------------------------------------------------- -------------------------------MKLTRRTFLQ-V-------TGATGATFTLA -NK-AMAFRLLKPAVEVGNPLDAYPDRAWESVYREQYRY----------DRTFTYCCSPND -THACRVRAFVR-NEV----LMRVEQ--------NYDHQNYA------------------- ----DLYGNKATRNWNPRMCLKGYTFHRRVYGPY-RLRYPLIRKGWKQWADDGFPELT-P- ----------ENKSKYMFDARGQDE-LLKASWD-DAWTYA--------AKGIIHITKKYSG -E-EGARKLLDQGYPKEMVDAMKGAGTR--------------------------------- --------------------------TFKGRGGMGLLGVIGKYGMYRFNN-SLALVDSHNR -GVGPDKALGGRN-WSNYT-WHGDQAPGHPFSHGLQ---TSDVD-MNDV-RFSKLVIQTGK -----------NLIENKMPEAHWLTQVFE---------RGGK----LVVITPEYSPSAQKA -D----YWIPIKCNTDTALFLGITRILMDEKLYDA----------DYVKKFTDFPLLVRTD -TLKRLQAKDIFPDYKLEDISHGASYKIHGLHDDQR---------------EIIGDFVVWD -AKTKSPKAITRDDVGDKLVAKGIDPALDGTFKVKT------------------------- -----VDGKEIEVMPLFEMYKIHL-KD---------------------------------- -------------YDIDSVVEMTNSPK---------ELIVRLAHDIATI----KP-VAIHY -GEGI---NHWFHATLFNRSTYLPLMLTGNIGYPGSGSHTWSGNYKAGNFQA--------- -----SKWSGPGFYGWVAEDVFNPNLDPDAPAMDLKVKGRAYDEEVAYWNHN--------- ------------------------DRPLIVDTPKYG--RKCFTGKTHMPTP----TKIMWF -TNVNLVNN-------------------------------AKHVYQMLKNVNP-----NIE -QIMSNDIEMTGSIEY--ADFAFPA-NSWAEFETHEITTSCSN----------PFIQI-WK -GGIKPVN-D---S--------KDD------VMILAGMA-AKLGELLRD------------ -------------MRFHDVWK--FALE----------------------GRPEVYIQRLLD -G---STTTKGYSFVDIIN-GKYGEPGVALLLYRTYPRHPFWE-QVH----ESI------- --------------PFYTPTGRLQGYNDESEIIEYGENFIVHREGPEATQYLPNVIVSTNP -YIRPDDYGIPEDAEHWD--ER---------------------TVRNIKKSWAE-TKKTKN -F----LWEKGYKFYCVTPKSRHTVHSQWAVTD-----------WNFIWNN-NFGDPYRMD -KRMPGVG-----EHQIHMNPEAAKD-LGI-------------N-------------DGDY -VYVDANPAD-RPYEGWKPSDPFYKVAR---L--M-LRCKYNPAYPYGVTMMKHSAWISTE -RSVKAHETRPDGRAL--------SAGTGYQSSFRYGSQQSITR-NWSMPMHQLDNLFH-- ------KSKTSMKFVFGYEAD----NHGINTTPKETLVKITKAEDGGIGGKGLWDPAKTGY -TAGNENDFMKKYLNGELIKVEKA------------------------------------- -- ->Hydrogenobaculum_sp_Y04AAS1_YP_002121006 ------------------------------------------------------------- --------------------------------MISRRDFLKN--------GSVFLAALSTP -GF-GKKLF--EPLVIVGNPLASYPNRGWEKIYRDIYKP----------DETTVILCNPND -THGCYLNAYVK-NGI----ITRLEP--------TYKYGDAT------------------- ----DIYGIKASHRWEPRCCNKGLALVRRFYGDR-RIRGPFVRKGYYEWYKADFPRDEN-- ----------GKPPSKYFINRGKDE-WLKVSWE-EVSDII--------AKSLINIAKTYSG -EKGKAYLKAQG-YPEEMIDTMAGAGTR--------------------------------- --------------------------TLKFRGSMPWLAVLRYVGQYRMSN-MMALLDSNIR -KVEPDKALGGVG-WDNYS-EHTDLPPAHTLVTGQQ---TVDFD-LVTW-EHAKLIVLWGM -----------NPYGTKMPDSHWLTEAQI---------KGIK----VIVISNDFMATARTA -D----KVVITRTATDGALALSMAYVIMKEKLYDE----------NFVKSFTDLPLLVRMD -NAKLLRASDIIPNYIPKAL-NQAVVYNPSKQMPPPPMKQEKQYIPIQLRDQDINDFVVWD -VKTNSPKVVTRDEVGKYFDMSSLDPALTGEYEVEL------------------------- -----VNGEKVKVKPNFQAYIELLEEN---------------------------------- -------------YTPETVEEITGVPA---------NVIRELALEIANH----KGTTKITT -GMGV---NQYFHGDLIVRAIFLVAALTGNVGRESGNIGSYAGNY---------------- -----RLAVFNGVGQWNAEDPFNIELDPSKLAKVKFYWKGES------------------- ------------------------QHYFADGDRPLKVGDKMLTGKTHMPVP----TKFMWM -ADNNSGLGN------------------------------QKWAYNVMFNVLP-----NVE -CVVTNDWWWSLSCEY--SDIILGV-DAWDENRFWDISGSCTN----------PFFLVWPR -TKQKRLF-D---T--------KND------IETYALVA-KRLSELTGD------------ -------------KRFKEYWH--FVFE----------------------EKPEVYIQRIIN -A---SSNLKGYKIEEVAAKAEQGIPSLVMTRFYP--KFIGYD-QTV----DGK------- --------------PWYTKTGRLEFYREEDTFINVGENLIVHREAIDSTPYEPNTIVIAKK -HPLLRPLDPKSYGLSSEEMLKDT-------------------ELRQARAVFIS-PAKLKD -TKHPLRVSFGATHIVHTPKFRHTTHSATGDVD-----------IVALLFG-PYGDMYRHD -KRTPYVV-----DAFIEINTHDLQK-LGI-------------N-------------DGDY -VWVDADPQD-RPFIGWQNKPEEYEVAR---L--L-LRVRGSFSTPPGLAKIWFNMYGSSH -GSVKGTKVNKNGLAE--------NPVTGYQSFYRRGSQQSVTR-GWLNPTLMGDTLVR-- ------KDLFGQTLNKGFMLD----VYCPTGAPREGFAKITKAENGGIGNVGLWRPLSIGF -RPQNPNKYFKKYLEAGYVIFV--------------------------------------- -- ->Hydrogenobacter_thermophilus_YP_003433365 ------------------------------------------------------------- ------------------------------MSDLTRRDLLK-M-------GGLSLTAMLSP -SF-AFRVMEPVVRV--ENPLAYYPNRDWERFYRDIFKS----------EATFTFLCAPND -THNCLLTAHVK-NGV----ITRIEP--------TYKFGEAT------------------- ----DIYGLKASHRWDPRCCNKGLALMRRFYGDR-RVKGPMVRRGFYEWYKAGFPRDPIT- ----------GKPLEKYF-QRGKDK-FIKVTWD-EVADII--------AKTLINIATTYSG -EEGRKRLEAQGHYPKPMLDAMEGAGTR--------------------------------- --------------------------VLKFRGSMPFLAVVRYTSPYRFAN-MMALLDSHIR -GVGPDKALGGRG-WDNYA-FHTDLAPGHPMVSGQQ---NVEFD-LCMW-EHSKLIILWGM -----------NPFTTKMPDCHWLTEARI---------KGSK----VIVISNDYSPTARAS -D----ELIVVRTGTDTALALSIAYVIMKEKLYQE----------RFVKSFTDMPLLVRMD -NGKVLRARDIIPNYQPQPLQKAVVFKP--GETLPPFYKQDKQYIPEPIRKGDMDDFVVWD -TKSNSPKVITRDHVGEDFWKLGIDPALYGTYRVKT------------------------- -----VEGKEVEVKPLFQVYLEFFEKS---------------------------------- -------------YTPKQAEVITGVPA---------KKIEKLAREIASH----PRNMKLAQ -GMGV---NQYQHADLKDRAMYMICALTDNIGHATGNIGSYAGNF---------------- -----RLALFNGAPQYLAEDPFNIELDPEKPA---KVKFYWKPESAHYYSH---------- ----------------------------DDHPQYMG--EHLITGKTHMPTP----TKFVWF -VDANSALGN------------------------------AKWQYNIIMNTLP-----KIE -CIVTNEWWWSMTCEY--SDIVLGV-DAWNENKYWDIAGSVTN----------PFVYVWPK -TGHRRFF-D---T--------KND------AEAFAIVA-NRLSELTGD------------ -------------ERFRNYWK--FVLE---------------------GKQDVVYVQRVIN -A---SSNLRGYRLEEIAKKAHEGIPSLI--------MTRSYPKYVGEDQTKEG------- -------------MPWYTKSGRLEFYREEPEFMDAGENLPVYREPIDSTHHEPNVIVARPH -PLLRPKKPEDYGLSAKDALLST--------------------EWRQARNVLVS-PEKLPN -TKHPLMVTVGATHIVHTPKYRHSAHTTTGDTD-----------IIVLLFG-PFGDIYRHD -KRMPFVS-----EAYIDINPKDLKK-MGI-------------Q-------------DGDY -VWVDADPQD-RPFAGWQKRPEDYEVGR---L--L-LRARASNNTPPGCAKIWFNMYGSSH -GSVRGTKENPNGLAK--------NPNTGYQSLYRRGSHQSITR-GWFKPTYQTDTLVR-- ------KNLMGQIIGKGFELD----VHGLIGAPREGFCKIAKAEDGGIGGKGVWRPVRLGY -RPMTANEMLKKYLKGEYVK----------------------------------------- -- ->I_OP1_uncultured_candidate_division_bacterium_BAL57377 ------------------------------------------------------------- -------------------------------MAVSRRRFVKAT-------AALTGAALVTD -TL-GLQGF-KFVP-EIKNPLEFYPNRDWEKIYRDQFRY----------DSSFTFLCAPND -THNCLLRAYVR-NGV----IVRIGP--------TYGYNEAR------------------- ----DLYGNKVSARWEPRCCQKGLALGRRFYGDR-RVNGVWVRKGFFDWVRAGFPRDPHT- ----------GAPPKEYF-NRGQDS-WLKLSFD-EAYGIV--------AQALFNIVQTYSG -PEGAARLKAQN-YDPTMLEAMHEAGTQ--------------------------------- --------------------------TVKVRGGMPFLGATRIYGLARFAN-MLALLDAHIR -NVSPDQALGGRV-WDSYS-WHTDLPPGHPMVTGQQ---TVEFD-LFTA-ENAKLITLWGM -----------NWICTKMPDAHWLTEARQ---------RGAK----VITIATEYQATANKA -D----EVIIIRPGTDAAFALGVASVIINEKLYDE----------EYVKTFTDLPLLVRMD -TLKLLRASDIIRDYQPAELTNYAKVLKPDEKPGPPL-AQRVQYIPERAR-QAWGDFVVWD -STKNAPEVITRDHVGQFFAARGIDPALEGSFTVQT------------------------- -----TDHQEITVRPVFDLIKEYLK-E---------------------------------- -------------FTPPKVAEMSWAPS---------EAIVNLARQIAAN----KASTLLSH -GMGP---NHFFNADLKDRALFLIAALTKNIGHFGGSPGSYAGNY---------------- -----RVALFNGLPQYIAEDPFNIELDPTKPATVKSYAKSES------------------- ------------------------AHYYNYGDRPLRVGKKLFTGKTHTPTP----TKFMWF -ANSNSLLGN------------------------------SKWGYDVIHNTLP-----KIE -AIVVNEWWWTMSCEY--ADVVFGV-DSWGELKYPDMCGSVTN----------PFVQVFPR -TPLPRIF-D---T--------RSD------IETYMGVA-EKFAELTGD------------ -------------ARFRDYWH--FVRE----------------------NRVDVYLQRICD -A---SSSLRGYKFTDLEEQARQGTPMLKLLRTYP--KIVGWE-QTQ----ESK------- --------------PWYTKTGRLEFYREEDEFIEYGENLPVYREPVDATPHEPNVIVAPKT -LSALKPAPPEQYGLKRDDLS----------------------TETRQVRNVIK-TPEEVV -RSQHPRTKDGLKFIFITPKYRHGAHTTPVDLD-----------VLAVYFG-PFGDIYRRD -KRSPWVG-----EVYADINPQDAKE-LGI-------------E-------------DGDY -IWIDADPED-RPYRGAKPSDPDYKIAR---L--M-GRARYYNGTPRGVVRMWFNMYQATH -GTVNAHETRPDKLAK--------DPQTNYQAMFRYGGHQSCTR-AWLRPTLMTDSLVR-- ------KDVFGQTIGQGFAPD----IHCPVGAPKESFVKITRAEPGGADLKSLWRPAQLGY -RPTYESDEMKQYLAGGFIEVT--------------------------------------- -- ->Beggiatoa_sp_PS_ZP_02000390 ------------------------------------------------------------- --------------------------------------------------MAVTGAGAAVI -SQQAISATQLLTPVAIDNPLSNYPNRDWEKTYRDLYHY----------DSSFTFLCAPND -THNCLLRGYVK-NGV----VTRIAP--------TYGYQKAK------------------- ----DLDGNQSTQRWDPRCCQKGLALVRRFYGDR-RCKRPMIRKGFKDWVEAGFPRLPET- ----------GAVDQKYL-QRGRDS-WVGASWD-EAFELA--------GKALTNIAQTYTG -EEGQKKLLAQG-YDPLMVEATEGAGTQ--------------------------------- --------------------------VLKFRGGMPPLGMTRVFAQYREAN-AMALLDDKIR -GKGTD-SLGGRG-FDNYS-WHTDLPPGHPMVTGQQ---TVDFD-LCNV-ERTNLLIVWGM -----------NWITTKMPDSHWMTEARM---------KGTK----VVVIAAEYSATSSKA -D----EVFVVRPGTTPALALGIAQVLISENLYDA----------PYVKANTDLPLLVRMD -TAEMLRAGDVFKDYQLAKLENNTLVV-PTGEKGPPMHQQKGPILDEKQR-ADWGDFVYWD -ASESKPVAMNHDQVGKHFSG---NPQLTGEFAVPL------------------------- -----ASGETVQCRTVFDVTKEMLDGS---------------------------------- -------------YTPEDVAKLTWTSA---------DGIRGLARQIAAN----QSNTLFTV -GMGP---NQFFNSDLKDRNIFLVAALTQNIGKIGGNVGSYAGNY---------------- -----RASFFNGLAQFIGEDPFNPELDPTKPA---KLRKRWKAESVHYFNHGD-------- ------------------------------TILRMG--KAVLTGKTHIPTP----TKAFHV -SNSNSLIGN------------------------------VKGHYDFVINTLS-----RVE -FIAQNEWWWTASCEY--ADIVFAV-DSWAELKYPDMTISVTN----------PFLYTFPA -TPLPRIH-D---T--------RSD------LEVAAGIC-GAIGKVTND------------ -------------SRHKDYWH--FINK----------------------GEVRPHIQRVLD -H---SNATRGYKIEDLEKLANEGIP--AILQTRTYPKVGAWE-QGN----ENK------- --------------PWYTKTGRLEFYREEPEFRDSGENIVVHREPIDSTRFEPNVIVAKSH -PLLRPKTPEDYGVPSSD--MS---------------------GDTRQARHVVK-TVDEVL -NSEHPLHKEGYDFVFHTPKYRHGAHTTAVDTD-----------IVAAWFG-PFGDMLRRD -RRMPFVA-----EAYVDINPDDAKG-LGI-------------E-------------DGDY -VYIDADPHD-RPFKGWQKYPEGYKVAR---L--L-VRARYYPGTPRGVTRMWHNMFGATF -SSVRGQETNPTGLAK--------SPETGYQSLYRGGSHQSCTR-GWLKPTWMTDSLYV-- ------KGLMGQKITQGFVPD----VHCPTGAPREALVRIIKAENGGIDGKGLWSPAARGL -RPTYENDILKQFMAGKFVELA--------------------------------------- -- ->Nitrococcus_mobi_EAR23355 ------------------------------------------------------------- --------------------------------------------------MGWIQD---LI -NP-KTRRW-EEF-----------YRNRWQH------------------DNIFRSTHGVNC -TGGCSWAIYVK-DGIITWEMQQTDYPLLGRGEGGRGIPPYE------------------- ----------------PRGCQRGISASWYVYSPI-RVKYPYGKGVLLDFWREARSSHNNPV -EAWSSIVTDENKRKRWQKARGKGG-YRRTTWD-ELLELI----------ASACLYTAQKY -G-------------PDRVM----------------------------------------- --------------------------GFSPIPAMSM---------------LSYAAGSRFL -Q-----LFGGVN-MSFYD-WYADLPNSFPEIWGDQ---TDVCE-SADW-YNSKFIVSMAS -----------NLNMTRTPDVHFISEARH---------EGAK----FVVLAPDFSQVSKYA -D----WWIPVKKGEDLGLWMAAGHVIYTEFYVKR----QVPYFIDYVTRYTDMPFLVKLE -K----DGDG----YRPGRYLTSEEVKKYKKQENA-AWKQLVFDRKSNEA-RCPKGQIGHR -HGK-HGQ-----WNLKMEDGLDNSPIEPVLSFLGE---SDDVAMVQFYEFA--------- -------SQTVYKRGVPAKKIDTGSGS----VLVATVYDLNMGQYAVNRGL--------PG -DYPESYDDLK-PYTPAWQEQFSGIGR---------QTVIRFAREFAGTAEKTKGRSMVIV -GASA---NHWYHNNHIYRAAINCLIACGCCGRNGGGMNHYVGQEKLAIVAPWNALALAGD -WGIKPRLQQSPVWHYVNSDSWRYEGSFEEYAPS-PPNAKWAKGHSVDLVAKSVRMGWMPH -YPQFNRSPLEVAREAEKAGAKDDKGMADYVVQALK--KKNLSFSVDDPDAPENWPRVWFI -WRGNAMQSSAKGAEFFLRHYLGTHDNAVAEERAKP----HVKHVKFREPAPR----GKFD -LVVDINFRMDSTALY--SDIVLPT-AFWYE-KNDLNSTDLH-----------SFIHP-LG -QAVPPVW-E---S--------KSD------WDIFKAFA-KKISEMAPSVFSEPFKDVVAA -PLTHDTPDEIAQRDVKD-WL--EGECEPIPGKTMPHFRVVERDYSLLYNKYISLGSAIRE -N---GISGNGCSFPITKQYDELTNQPVGGSPDPRHRRAVEWGGKRYPCVEDALDAANVLL -YLAPETNGEVAYQAFKSEQEHCGVPLTDLAEPYRGHQVTFYDLTRQPRRLLCSPVWTGNC -GDGRAYSAWTLQIDRLV--PFRTLTGRQHIYIDHPWYMDFGEHLCTYRPKLDY-KKIHDL -DN-SPIDDKTLILNYITPHGKWNIHSTYKDNH-----------RMLTLSR--GMDP---- ------VW----------INDKDAAR-VGL-------------K-------------DNDW -VEVY---ND-N--------------GV---I--V-TRANVSRRVQSGMCLYYHA-VERTI -Y----------------------IPKSQIRGGRRAGGHNSVTR-TRINPVYLAG-GNA-- ------QFTYL-------FNY----WGPTGIMTRDTHVAVRKLEKLEW------------- ------------------------------------------------------------- -- ->A_Nitrobacter_hamburgensis_YP_578638 ------------------------------------------------------------- --------------------------------------------------MSWILD---LV -NP-RERKW-EEF-----------YRNRWSH------------------DNVFRSTHGVNC -TGGCSWAIYVK-DGIITWEMQQTDYPLL-----ERSLPPYE------------------- ----------------PRGCQRGISASWYVYSPI-RVKYPYIRGPLLDMWREAKASSADPV -QAWGALIGDEQKRSRIQKARGKGG-FRRAKWE-ELVELI----------AAASLHTARKH -G-------------PDRIM----------------------------------------- --------------------------GFSPIPAMSM---------------LSFAAGTRFL -S-----LMGGSL-MSFYD-WYADLPTSFPEIWGDQ---TDVCE-SADW-YNSKFIVSMAS -----------NMNMTRTPDVHFISEART---------EGTK----FVVLSPDFSQIAKYC -D----EWIPIQAGQDTALWMAANHVILKEYYVDR----QVPYFVDYIKRYTDLPFLVELE -S----NGNT----YKTGRLLRSNRVPRYKDVENG-DWKMLLLDANSGEL-RAPKGQVGDR -WGSVHGK-----WNLSGEDTLDNSPLDPVLSFIDR---SDDVVQVGFDDFA--------- -------NGRIVSRGVPVKRVATDKGE----ILCATGFDIMMSQFGISRGL--------EG -AFATSYDDEDAPYTPAWQERHTGIGR---------ETAIRFAREFATNAELTNGKSMVIV -GASA---NHWYYNNLCYRSATVALILCGCCGVNGGGINHYVGQEKLAPVAPWATVALALD -WAKPPRLVQSSTWHYAHSCQWRYEQEFTEYGLT-APNPKWAKGHAIDLEAKAVHNGWMPF -TPHFNRNPIEVAAEAERSGAKNVQDIETYVVDQVV--SKKLQMAIDDPDAAENWPRMWFI -WRGNAIQSSAKGHEFFLRHYLGAHDNAIAEDRAKG----KAQVVKYHETAPR----GKYD -LVIDLNFRMNTTSLY--SDIVLPT-AFWYE-KNDLNTTDLH-----------SFLHV-LG -QAVPPVW-E---S--------KTD------WEIFKLIG-KKVSELAPLAFSKPVRDVVLQ -PLMHDTPDELAQPEILD-WS--LGECKAVPGKSFPHVRVVERDYANLYNKFISFGPKARE -D---GISAVGVQIPIKKQYDQMLDNPIMPMPDPRHMRCVEWGGKRYPSLEDVLDACNTVL -LCAPEANGEVCYQAFHNEEHHVGLPLVDLAEPNRNVAATFYDLTRQPRRIITSPCWTGMV -NDGRAYSAWCMNVERLV--PWRTLTGRQSLYLDHQWYLDFGEHIPTYKPRLNP-RKTGDI -VKSR-VDDRSLVLNYITPHGKWNIHSTYKDNH-----------RMLMLSR--GMDP---- ------VW----------INDRDAEK-VGI-------------E-------------DNDW -VEVY---ND-N--------------GV---V--V-TRANVSRRIQPGTCMYYHA-VERTV ------------------------YIPKSQERKWRGGGHNSLTR-TRINPLFLAG-GYA-- ------QFTYG-------WNY----WGPTGILTRDTHVVVRKMEKLEW------------- ------------------------------------------------------------- -- ->B_Nitrobacter_hamburgensis_YP_578186 ------------------------------------------------------------- --------------------------MTTGLAAGQRTEETQ---------MSWILD---LV -NP-RERKW-EEF-----------YRNRWSH------------------DNVFRSTHGVNC -TGGCSWAIYVK-DGIITWEMQQTDYPLL-----ERSLPPYE------------------- ----------------PRGCQRGISASWYVYSPI-RIKYPYVRGPLLDMWREAKASSADPV -QAWGALVGDEQKRARMQKARGKGG-YRRAKWE-ELVELI----------AAASLHTARKH -G-------------PDRIM----------------------------------------- --------------------------GFSPIPAMSM---------------LSFAAGTRFL -S-----LMGGSL-LSFYD-WYADLPTSFPEIWGDQ---TDVCE-SADW-YNSKFIVSMAS -----------NLNMTRTPDVHFIAEART---------EGTK----FVVLSPDFSQIAKYC -D----EWIPIQAGQDTALWMAANHVILKEYYVDR----QVPYFIDYVKRYTDLPFLVELE -P----NGTT----YKTGRLLRARHVPRYKDVENG-DWKMLLLDANSGEL-RAPKGQVGDR -WGSVHGK-----WNLSGEDTLDNSPLDPVLSFIDR---SDDVVQVGFDDFA--------- -------NGRIVSRGVPVRRIATDKGE----ILCATGFDIMMSQFGISRGL--------EG -AFATSYDDEDAPYTPAWQERHTGIGR---------ETAIRFAREFATTAEYTNGKSMVIV -GASA---NHWYYNNLCYRSATVALILCGCCGVNGGGINHYVGQEKLAPVAPWASIALALD -WSKPPRVVQSSTWHYAHSCQWRYEQEFTEYGLT-APNPRWAKGHAIDLEAKAVRSGWMPF -TPHFNRNPIEVAAEAERAGAKSTEDIATHVIDQVA--SKKLNLAIEDPDAAENWPRLWFI -WRGNAIQSSAKGHEFFLRHYLGTHDNAIAEDRAKG----KTHTVKYHDTAPR----GKYD -LVVDLNFRMDTSSLY--SDIVLPT-AFWYE-KNDLNTTDLH-----------SFLHV-LG -QAVPPVW-E---S--------KTD------WDIFKLIA-KKVSELAPLAFSKPVRDVVLQ -PLMHDTPDELAQPEILD-WA--EGECKPVPGKSFPHVRVVERDYANLYNKFISFGPKARE -D---GVSAVGVNVPIKKQYDQMLDNPIMPMPDPRHMRCVEWGGKRYPSLEDVLDGCNTVL -LCAPEANGEVCYQAFHNEEHHVGLPLVDLAEPTRNVATTFYDLTRQPRRLLTSPCWTGMM -NDGRAYSAWCMNVERLV--PWRTLTGRQTLYIDHQWYLDFGEHIPTYKPRLNP-RKTGDI -VKSR-VDDRSLVLNYITPHGKWNIHSTYKDNH-----------RMLMLSR--GMDP---- ------VW----------INDRDAEK-VGI-------------E-------------DNDW -VEVY---ND-N--------------GV---V--V-TRANVSRRIQPGTCMYYHA-VERTV ------------------------YIPKSQERKWRGGGHNSLTR-TRINPLFLAG-GYA-- ------QFTYG-------WNY----WGPTGILTRDTHVVVRKMEKLEW------------- ------------------------------------------------------------- -- ->Nitrobacter_winogradskyi_gb_ABA05326 ------------------------------------------------------------- --------------------------------------------------MSWILD---LV -NP-RERKW-EEF-----------YRNRWSH------------------DNVFRSTHGVNC -TGGCSWAIYVK-DGIITWEMQQTDYPLL-----ERSLPPYE------------------- ----------------PRGCQRGISASWYVYSPI-RVKYPYIRGPLADLWHEAKASYPDPV -QAWASLVEDEEKRNRIQKARGKGG-FRRAKWE-ELIELI----------AASCLYTARKH -G-------------PDRVM----------------------------------------- --------------------------GFSPIPAMSM---------------LSFAAGTRFL -S-----LFGGGL-MSFYD-WYADLPTSFPEIWGDQ---TDVCE-SADW-YNSKFIVSMAS -----------NMNMTRTPDVHFISEART---------EGTK----FVVLSPDFSQIAKYC -D----EWIPIQAGQDTALWMAANHVILKEYYIDR----QVPYFIDYVKRYTDLPFLVELE -P----NGNT----YKTGRLLRSNRVARYKDVENG-EWKMLVLDTATGEP-RAFKGQVGDR -WGSTHGK-----WNLSAEDTLDNSPIDPVLSFIDQ---SDGVVQVGFDDFV--------- -------NGSVVSRGVPVKRIATDKGE----VLVTTGFDIMMSQFGHSRGL--------EG -SFATSYDDEDAPYTPAWQERHTGIGR---------ETAIRFAREFATNAELTNGKSMVIV -GASA---NHWYYNNLCYRSATVALILCGCCGVNGGGINHYVGQEKLAPVAPWSTVAMALD -WNKPPRVVQSSTWHYAHSCQWRYEQEFTEYGLT-APNPRWAKGHAIDLEAKSVRCGWMPF -TPNFHRNPIEVVAEAERAGAKSTADIATYVADQVA--SKKLDLAINDPDAEENWPRVWFI -WRANAIQSSAKGHEFFLRHYLGAHDNVIAEERAKG----KTTTVKYRDTAPQ----GKYD -LVVDINFRMNTTGLY--SDIILPT-AFWYE-KNDLNTTDLH-----------SFLHV-LG -QAVPPVW-E---S--------KTD------WEIFKLIA-KKVSELSPLAFSKPVRDIVLQ -PLMHDTPDELAQPEILD-WA--EGECKLVPGKSFPHVRVVERDYANLYNKFISFGPKARE -D---GISAVGVNIPIKKQYDQMLENPIMPMPDSRHMRCVEWGGKRYPSLEDVLDACNVVL -LCAPVANGEVSYQGFVNEEQHVGLPLADIAEPTRGVSSTFYDLTRQPRRILTSPCWTGLV -NDGRAYSAWCMNIERLV--PWRTLTGRQSLYLDHQWYLDFGEHIPTYKPRLNP-RKTGDI -VKSR-VDDRSLVLNYITPHGKWNIHSTYKDNH-----------RLLMLSR--GMDP---- ------VW----------INDRDAEK-VGI-------------E-------------DNDW -VEVY---ND-N--------------GV---V--V-TRANVSRRIQPGTCMYYHA-VERTV ------------------------YIPKSQERKWRGGGHNSLTR-IRINPLFLAG-GYA-- ------QFTYG-------WNY----WGPTGIFTRDTHVVVRKMEKVEW------------- ------------------------------------------------------------- -- ->Nitrobacter_sp_Nb_311A_ZP_01048070 ------------------------------------------------------------- --------------------------------------------------MSWILD---LV -NP-RERKW-EEF-----------YRNRWSH------------------DNVFRSTHGVNC -TGGCSWAIYVK-DGIITWEMQQTDYPLL-----ERSLPPYE------------------- ----------------PRGCQRGISASWYVYSPI-RVKYPYIRGPLYDLWREAKASHPDPV -QAWASLVGDEQKRLRMQKARGKGG-FRRAKWE-ELVELI----------AAAALYTARKW -G-------------PDRVM----------------------------------------- --------------------------GFSPIPAMSM---------------LSYAAGSRFL -Q-----LFGGVN-MSFYD-WYADLPTSFPEIWGDQ---TDVCE-SADW-YNSKFIVSMAA -----------NMNMTRTPDVHFIAEART---------EGTK----FVVLSPDFSQIAKYC -D----EWIPIQAGQDTALWMAANHVILKEYYIDR----QVPYFIDYVKRYTDLPFLVELE -P----NGNT----YKTGRLLRAKRVARYQDVENG-DWKMLVLDSKTGEP-RAFKGQVGDR -WGSTHGK-----WNLSAEDTLDNSPIDPVLSFIDQ---SDGVVQVGFDDFV--------- -------NGSVVSRGVPVKRIATDKGE----VLVTTGFDIMMSQFGHSRGL--------EG -SFATSYDDENAPYTPAWQERHTGIGR---------ETAIRFAREFATNAELTNGKSMVIV -GASA---NHWYYNNLCYRSATVALILCGCCGVNGGGINHYVGQEKLAPVAPWNTIAMALD -WTKPPRVVQSSTWHYAHSCQWRYEQEFTEYGLT-APNPRWAKGHAIDLQAKAVRSGWMPF -TPHFNRNPIELAAEAERAGAKSTDDIVTHVVDQVA--SKKVNFAIDDPDAEESWPRMWFI -WRGNAIQSSAKGHEFFLRHYLGAHDNSIAEDRAKG----KTQRVKYRDTAPR----GKYD -LVVDLNFRMNTTSLY--SDIVLPT-AFWYE-KNDLNTTDLH-----------SFLHV-LG -QAVPPVW-E---S--------KTD------WEIFKLIA-KKVSELSPLAFSKPVRDVVVQ -PLMHDTPDELAQPEILD-WA--EGECKPVPGKSFPHVRVVERDYANLYNKFISFGPKARE -D---GVSAVGVQIPIKKQYDQMLDNPIMPMPDPRHMRCVEWGGKRYPSLEDVLDACNTLL -MCAPEANGEVCYQGFHNEEHHVGLPLVDIAEPTRGVSSTFYDLTRQPRRILTSPCWTGMT -NDGRAYSAWCMNVERLV--PWRTLTGRQTLYIDSQWYLDFGEHIPTYKPRLNP-RKTGDI -VKSR-VDDRSLVLNYITPHGKWNIHSTYKDNH-----------RMLMLSR--GMDP---- ------VW----------INDRDAEK-VGI-------------E-------------DNDW -VEVY---ND-N--------------GV---V--V-TRANVSRRIQPGTCMYYHA-VERTV ------------------------YIPKSQERKWRGGGHNSLTR-TRINPLFLAG-GYA-- ------QFTYG-------FNY----WGPTGIFTRDTHVVVRKMEKLEW------------- ------------------------------------------------------------- -- ->Acidovorax delafieldii_NARG ------------------------------------------------------------- -----------------------------MSHFLDRLSYFSQP-------RENFAQGHGQT -NG-EDRTW-EDA-----------YRDRWAH------------------DKIVRSTHGVNC -TGSCSWKIYVK-GGIVTWETQQTDYPRT-----RPDLPNHE------------------- ----------------PRGCARGASYSWYLYSAN-RVKYPMVRGRLLKHWRAAMALAKSPV -DAWASIVENDASRSEWQKQRGLGG-FVRSTWD-EVNQMI----------AAANVYTIKKH -G-------------PDRII----------------------------------------- --------------------------GFSPIPAMSM---------------ISYAAGSRYL -S-----LIGGVC-MSFYD-WYCDLPPSSPQVWGEQ---TDVPE-SADW-YNSSYIIAWGS -----------NVPQTRTPDAHFLTEVRY---------KGTK----VVSITPDYSEVAKLG -D----LWMHPKQGTDAAVAMAMGHVILKEFYFKDGGKGRSAYFDDYARRYTDLPLLVVLK -EKTLPDGRTV---MVPDRYVRASDFPGQLDQSNNPDWKTVGYD-ELGQV-TLPNGSIGFR -WGA-DGRADQGLWNLENKEARTGNTVKLKLSVIEDGVQAHDVADVAFPYFGGVQTPNFTA -NEQ---GGDVIVRRVPVSHLELAGHEAQGRVMVATVFDLLAGNYGIDRGL-------PGE -EPGGSYDADR-PYTPAWQEKITGVPR---------DQIITVARQFADNADKTHGKSMVII -GAAM---NHWYHCDMNYRGIINMLMLCGCIGQSGGGWAHYVGQEKLRPQTGWTALAFALD -WIRPPRQMNSTSFFYAHTDQWRYEKLGMEEILSPLADKKSYSGSMIDYNVRAERMGWLPS -APQLKTSPLQVAKDAAAKG----MDAKDYVVQSLK--NGSLTMSCEDPDHPDNWPRNMFV -WRSNILGSSGKGHEYFLKHLLGTTHGVQGKDLGQDEA--KPEEVQWHAKAPE----GKLD -LLVTLDFRMSTTCLY--SDIVLPT-ATWYE-KNDLNTSDMH-----------PFIHP-LS -TAVDPAW-Q---A--------KSD------WEIYKGFA-KAVSEVSVGHLGVE-KDVVLT -PIMHDTAGEMAQPYGVRDWK--RGECELIPGKTAPQVTVVERDYPNLYKRFTALGPLMDK -A---GNGGKGIGWNTQTEVGQLGDLNGRV-------KEEGVT-QGMPRIVTDIDATEVVM -MLAPETNGHVACKAWEALGKQTGRDHVHLALHREDEKIRFRDIQAQPRKIISSPTWSGLE -SEKVSYNAGYTNVHEYI--PWRTLTGRQQFYQDHPWMRDFGEGFVSYRPPVHL-KALHEV -EGKKPNGNREIALNFITPHQKWGIHSTYSDNL-----------IMLTLNR--GGSV---- ------VW----------LSEDDAAR-AGI-------------V-------------DNDW -VELF---NA-N--------------GA---I--A-ARAVVSQRVNPGMVMMYHS-QEKII -N----------------------TPGSEIT-GTRGGIHNSVTR-VVLKPTHMIG-GYA-- ------QYSYG-------FNY----YGTIGT-NRDEFVLVRKMDRVDWLDDDVSDAPAHA- ------------------------------------------------------------- -- ->NarG_Pseudomonas_stutzeri_gb_AAZ43099 ------------------------------------------------------------- -----------------------------MSHLLDQLRFFNRK-------QGEFADGHGET -RI-ESRDW-ENV-----------YRSRWQY------------------DKIVRSTHGVNC -TGSCSWKIYVK-NGLITWETQQTDYPRT-----RNDLPNHE------------------- ----------------PRGCPRGASYSWYIYSAN-RLKYPKVRKPLLKLWREARRNMT-PV -DAWASIVEDKAKAESYKSKRGMGG-FIRSSWD-EVNEII----------AAANVYTVKQY -G-------------PDRVI----------------------------------------- --------------------------GFSPIPAMSM---------------VSYAAGSRYL -S-----LIGGVC-LSFYD-WYCDLPPASPQIWGEQ---TDVPE-SADW-YNSNYIIAWGS -----------NVPQTRTPDAHFFTEVRY---------KGTK----TVAITPDYAEVAKLT -D----LWLNPKQGTDAALAQAFAHVIFKEFHLEK----PSEYFRDYAKRYTDLPVLVRLN -EK---DGS-----YIADRFLRASDLADNLGQENNPEWKTIAVDGSTGEL-VSPLGSIGYR -WGE-KGK-----WNIEAREGKDGRDVDLSLTQIEG----GETAEVAFPYFGGILHEHFQH -AE----GESIQLRRVPVRTITLADGST---TKVATVFDLMAANLGIDRGL-------GGG -NVASSYDDASVPGTPAWQEVITGVSR---------EKAIQIAREFADNADKTHGRSMIIV -GAAM---NHWYHMDMNYRGLINMLMLCGCVGQTGGGWAHYVGQEKLRPQCGWLPLAFGLD -WSRPPRQMNGTSFFYNHSSQWRHEKMSIHEVLSPLADKSQFPEHMLDYNIRAERAGWLPS -APQLNRNPLQICRDAEAAG----MSPVDYVTQSLK--DGSLKFACEQPDNPDNFPRNMFV -WRSNLLGSSGKGHEYMLKYLLGTKNGVMNEDLGKRADGFKPTEAEWQDEGAI----GKLD -LVTTLDFRMSSTCVY--SDIVLPT-ATWYE-KDDMNTSDMH-----------PFIHP-LS -AAIDPAW-E---A--------KSD------WEIYKGIA-KAFSKMAEGQLGVE-KDLVTV -PLLHDSPGELAQPFGGTDWK--TAGVDPQPGKNCPNMAVVERDYPATYKKFTSLGPLLDK -L---GNGGKGINWNTQDEVDFLGELNYKV-------RDEGVS-QGRPQIESAIDAAEVIL -SLAPETNGHVAVKAWAALSEFTGRDHSHLALPKEHEAIRFRDIQAQPRKIISSPTWSGLE -DEHVSYNAGYTNVHEYI--PWRTITGRQQFFQDHPWMQAFGEQLMSYRPPINT-RTIDYV -KGKKSNGNPEIVLNWITPHQKWGIHSTYSDNL-----------IMLTLSR--GGPI---- ------VW----------MSEVDAKK-AGI-------------E-------------DNDW -IECF---NA-N--------------GA---L--T-ARAVVSQRVMEGMVMMYHA-QERIV -N----------------------VPGAEST-KTRGGHHNSVTR-VVLKPTHMIG-GYA-- ------QQAYG-------FNY----YGTVGC-NRDEFVVVRKMAKVDWLDGPNGNDLPQPL -PQDI-------------------------------------------------------- -- ->NarG_Pseudomonas_fluorescens_gb_AEV63780 ------------------------------------------------------------- -----------------------------MSHLLDQLRFFNRK-------QGEFSDGHGET -RK-ESRDW-ENV-----------YRSRWQY------------------DKIVRSTHGVNC -TGSCSWKIYVK-NGLITWETQQTDYPRT-----RNDLPNHE------------------- ----------------PRGCPRGASYSWYIYSAN-RLKYPKIRKPLLKLWREARQTLP-PV -EAWASIVEDKAKADSYKSKRGMGG-FIRSNWE-EVNEII----------AAANVYTVKEH -G-------------PDRVV----------------------------------------- --------------------------GFSPIPAMSM---------------VSYAAGSRYL -S-----LIGGVC-LSFYD-WYCDLPPASPMVWGEQ---TDVPE-SADW-YNSNYIIAWGS -----------NVPQTRTPDAHFFTEVRY---------KGTK----TVAITPDYSEVAKLT -D----LWLNPKQGTDAALAQAFNHVIFKEFHLDK----PSAYFTEYAKRYTDLPVLVMLK -PM---LGAAPGAGYQPDRFLRASDLTDNLGQDNNPEWKTIALD-AAGEL-VSPQGSIGYR -WGE-KGK-----WNILPREGGEGREIDLKLSLI-G----GDVAEVAFPYFAGEAQEYFQH -VA----GDAVQFRRVPVHSVVLADGSV---AKVATVFDLSAANLAIDRGL-------GGA -NVAKDYNDASVPGTPAWQEQITGVSR---------EKAIQIAREFADNADKTRGRSMIIV -GAAM---NHWYHMDMNYRGLINMLMLCGCVGQTGGGWAHYVGQEKLRPQCGWLPLAFGLD -WNRPPRQMNGTSFFYGHSSQWRHEKMSMHDVLSPLADKSQFPEHALDYNIRAERAGWLPS -APQLNTNPLHICRDAAAAG----MEPKDYVVKSLQ--DGSLRFACEQPDSPVNFPRNMFI -WRSNLLGSSGKGHEYMLKYLLGTKNGVMNEDIGHSTEC-KPTEAEWVDEGAI----GKLD -LVTTLDFRMSSTCVY--SDIVLPT-ATWYE-KDDMNTSDMH-----------PFIHP-LS -AAIDPAW-E---S--------RSD------WEIYKGIA-KAFSAMSVGHLGVE-KDLVTV -PLMHDSVGELAQPFGGTDWK--SAGVAPVPGKNAPNLQVVERDYPNIYKQFTSLGPMLEK -L---GNGGKGINWNTDTEVKFLGELNHKE-------VEAGIS-QGRPKIDSAIDAAEVIL -SLAPETNGHVAVKAWAALSEFTGIDHSHLAISKEHEAIRFRDIQAQPRKIISSPTWSGLE -DDHVSYNAGYTNVHESI--PWRTITGRQQFYQDHPWMQAFGEQLMSYRPPVNT-RTIAGV -KGKRSNGETEIVLNWITPHQKWGIHSTYSDNL-----------LMLTLSR--GGPI---- ------VW----------LSEIDAKR-AGI-------------E-------------DNDW -IECF---NV-N--------------GA---L--T-ARAVVSQRVKEGMVMMYHA-QERIV -N----------------------VPGSETT-KTRGGHHNSVTR-VVLKPTHMIG-GYA-- ------QQAYG-------FNY----YGTVGC-NRDEFVVVRKMVKVDWLDGSSGDDLPRPL -PTDIEEN----------------------------------------------------- -- ->NarG_Halomonas_maura_gb_AAT47523 ------------------------------------------------------------- -----------------------------MSHFIDRLNFFRKA-------REPFANDHGEV -RD-ESRGW-EDG-----------YRQRWQH------------------DKVVRSTHGVNC -TGSCSWKIYVK-NGLVTWETQQTDYPRT-----RPDLPNHE------------------- ----------------PRGCPRGASYSWYLYSAN-RLKHPLVRKPLLKLWREALEEKGDPV -DAWASIVEDPAKTKQYKRARGMGG-FVRADWN-ELNELI----------AASNVYTAKQY -G-------------PDRII----------------------------------------- --------------------------GFSPIPAMSM---------------VSYAAGSRYL -S-----LIGGVC-MSFYD-WYCDLPPASPMTWGEQ---TDVPE-SADW-YNSGYIIAWGS -----------NVPQTRTPDAHFFTEVRY---------KGTK----TVSVTPDYAEVSKLT -D----EWLSAKQGTDAALAMAMGHVILKEFHLDR----PSAYFTDYVRRYTDMPCLVELE -ARE--DGS-----YVPGKQLRASDFEASLGQDNNPEWKTVAWDETRDQL-VVPRGSIGFR -WGE-EGK-----WNLEPRDAE-GAEIKTRLSLAEA---HDDVARVAFPYFGGIAHEHFDH -VKSGGASDELLFHSLPAKRLTLADGRE---ILAVTVFDLMCANYGIDRGFRSQEGKEGED -DGATAYDQVK-PYTPAWQEKITGVPA---------EQCLRIAREFADNADKTHGRSMIIV -GAGM---NHWYHMDMNYRGLINMLVMCGCIGQSGGGWSHYVGQEKLRPQTGWLPLAFGLD -WQRPPRHMNSTSFFYNHSSQWRYXKLEIKEILSPLAKPADYSGSLIDFNVRSERMGWLPS -APQLATNPLSLAGKAAEAG----QSTADYVVDQLK--AGGLRFAAEDPDDPQNFPRNMFI -WRSNLLGSSGKGHEYLLKYLLGTRHGIQGKDLGEDGGQ-KPEEVVWHEAAPE----GKLD -LLVTLDFRMSTTCLY--SDIVLPT-ATWYE-KDDLNTSDMH-----------PFIHP-LT -AATDPAW-E---S--------RSD------WDIYKGIA-RAFSKACVGHLGEE-TDLVTL -PLQHDSPAELAQPEVKD-WK--RGECEPIPGKTMPALVEVKRDYPATYERFTSVGPLLDS -L---GNGGKGIGWKTEKEVELLGKLNY---------VKTEGPAKGRPRIESAIDAAEVIL -TLAPETNGQVSVKAWEALSKITGRDHRHLAEPKEEEKIRFRDVVAQPRKIISSPTWSGLE -DEHVSYNAGYTNVHELI--PWRTVSGRQQFYQDHAWMRAFGESLLVYRPPIDT-KAAVSL -ADDKGNGNPEIALNWITPHQKWGIHSTYSDNL-----------LMQTLSR--GGPI---- ------VW----------LSKDDARS-IGV-------------E-------------DNDW -IELY---NA-N--------------GA---I--A-ARAVVSQRVKNGMAMMYHA-QERIL -N----------------------MPGSEVT-GTRGGIHNSVTR-VCPKPTHMIG-GYA-- ------QLAYS-------FNY----YGTVGS-NRDEFVIVRKMKKIDWLDGEGNDYEQEAV -K----------------------------------------------------------- -- ->NarG_Escherichia_coli_NP_415742 ------------------------------------------------------------- ------------------------------SKFLDRFRYFKQK-------GETFADGHGQL -LN-TNRDW-EDG-----------YRQRWQH------------------DKIVRSTHGVNC -TGSCSWKIYVK-NGLVTWETQQTDYPRT-----RPDLPNHE------------------- ----------------PRGCPRGASYSWYLYSAN-RLKYPMMRKRLMKMWREAKALHSDPV -EAWASIIEDADKAKSFKQARGRGG-FVRSSWQ-EVNELI----------AASNVYTIKNY -G-------------PDRVA----------------------------------------- --------------------------GFSPIPAMSM---------------VSYASGARYL -S-----LIGGTC-LSFYD-WYCDLPPASPQTWGEQ---TDVPE-SADW-YNSSYIIAWGS -----------NVPQTRTPDAHFFTEVRY---------KGTK----TVAVTPDYAEIAKLC -D----LWLAPKQGTDAAMALAMGHVMLREFHLDN----PSQYFTDYVRRYTDMPMLVMLE -ER---DGY-----YAAGRMLRAADLVDALGQENNPEWKTVAFN-TNGEM-VAPNGSIGFR -WGE-KGK-----WNLEQRDGKTGEETELQLSLLGS---QDEIAEVGFPYFGGDGTEHFNK -VE----LENVLLHKLPVKRLQLADGST---ALVTTVYDLTLANYGLERGL-------NDV -NCATSYDDVK-AYTPAWAEQITGVSR---------SQIIRIAREFADNADKTHGRSMIIV -GAGL---NHWYHLDMNYRGLINMLIFCGCVGQSGGGWAHYVGQEKLRPQTGWQPLAFALD -WQRPARHMNSTSYFYNHSSQWRYETVTAEELLSPMADKSRYTGHLIDFNVRAERMGWLPS -APQLGTNPLTIAGEAEKAG----MNPVDYTVKSLK--EGSIRFAAEQPENGKNHPRNLFI -WRSNLLGSSGKGHEFMLKYLLGTEHGIQGKDLGQQGGV-KPEEVDWQDNGLE----GKLD -LVVTLDFRLSSTCLY--SDIILPT-ATWYE-KDDMNTSDMH-----------PFIHP-LS -AAVDPAW-E---A--------KSD------WEIYKAIA-KKFSEVCVGHLGKE-TDIVTL -PIQHDSAAELAQPLDVKDWK--KGECDLIPGKTAPHIMVVERDYPATYERFTSIGPLMEK -I---GNGGKGIAWNTQSEMDLLRKLNY---------TKAEGPAKGQPMLNTAIDAAEMIL -TLAPETNGQVAVKAWAALSEFTGRDHTHLALNKEDEKIRFRDIQAQPRKIISSPTWSGLE -DEHVSYNAGYTNVHELI--PWRTLSGRQQLYQDHQWMRDFGESLLVYRPPIDT-RSVKEV -IGQKSNGNQEKALNFLTPHQKWGIHSTYSDNL-----------LMLTLGR--GGPV---- ------VW----------LSEADAKD-LGI-------------A-------------DNDW -IEVF---NS-N--------------GA---L--T-ARAVVSQRVPAGMTMMYHA-QERIV -N----------------------LPGSEIT-QQRGGIHNSVTR-ITPKPTHMIG-GYA-- ------HLAYG-------FNY----YGTVGS-NRDEFVVVRKMKNIDWLDGEGNDQVQESV -K----------------------------------------------------------- -- ->TtrA_Photobacterium_profundum_YP_133039 ------------------------------------------------------------- ----------------------------MAALIMDRRQFLK-MGAATTFTGGMAGISKATA -GD-SNQDISRYAPLSAEPEFILGPDNKLTN----------------NPNQRFAFTKCFGC -YNVCGARIRID-NNT--DQILRVCG--------NPYALSTQ-----SGNPVAME--VSPQ -EAMLQLVGEQGNENRATLCGRGNAVPDAITDSR-RVTQCLKRVG---------------- -------------------KRGENH-WQSISYE-QLIKEVVEGGNLFGEGHVEGLSDIYDD -KTVANPAYPDFGPKKNQL------------------------------------------ --------------------------LMTGCSEDPA---------------RWGFYKRFSE -A-----SWGTPN-IGNKD-SYCGHQQVAGCALGVEDGANSGALPTTDF-EHCEFAIFIGT -NPGLSG-------ISLNSASKRLADART-------QNPNFK----YVVIDPILRSLTSSS -TPENCEWVPIRSSGDTALMHAMMQYIINNERYNK----------SYLASCSQ-------- ---------------------EGAYKVSEINYTNAPYLVVTDKKHPLYRKFLTAAACGKGD -ADTKMVIDAKSQQLTTSDSSEPCNIKFSGKVTTED------------------------- -------GQAVKVETAFSLLAKRVNE----------------------------------- -------------HSMADYAAECQVPE---------AKIIELAKEFTSH-----GRRVSIE -TNTG---CNASDGSQFAFAMIMLTTLVGAHNAKGGMLHTGSMGFE--------------- -----NTSPLYDMMAFEHAHLSGFNAERSGDYRQSNEFKEKVKNGINPYPSEM-------- ------------------------PWNETFIQDNAG--ELLVAHANGNPFK----FKAWIA -WANNPLYA-------------------------------CSGLKDQVEASIKDPK--QLG -LIIASDPYFNETNVY--ADYFVPD-LAQYE-QWGASRQWGSE----------LMGDVVSF -PIITP---K---TPLNAEGNRVCM------EQFLIDVA-KQIKLNGFGENAFKDTAGNAK -AI----------NTPEDYYI--PVLA-------------------NLAHSDEVLPTPTEE -DVKFTSVDRIYSQLKERL------------------KAEEIG-PTMFLFTRGG------- --------------RYLTVNSRYEGEF-----------------------FNEMMRWDAQF -QVYNEGLAHITNFHSG--------------------------EYLDGLPVFDKQRFWDGT -AIRDLWSENEYPFYFSTFKHQLRSP------------------YSVALKS--ITAL---- ------GV-----SNFIQMNENDAKK-YGL-------------T-------------TGDK -ARIA---TPKG--------------AA---I--E-GIVQADTTVAKGCIAVPLG-YGHTA -FGASDITIDGKT-----------LTGIPERKGGMAVNAFNAV-----DPTRKGASLYR-- ------DVTFG-------STA----RH--GI-----PMKIEKV------------------ ------------------------------------------------------------- -- ->TtrA_Wolinella_succinogenes_NP_907142 ------------------------------------------------------------- -------------------------------MEEGRRRFLLGS-------GVVAGSAAVVG -YKETLGAVALLKDKGERAKDSIYGEAAEPEVRFESGRT------LINPKYSIRPSVCNGC -TTHCGIRVKINQESG---AVERVFGNPYSLLSSDPWLPYNT------------P--LKES -LEVLSAQKESGLHHRSTACARGNAVYDKLNDSF-RVTKPLKRVG---------------- -------------------KRGENA-WVEISPE-QLIQEILEGGNLFGEGEVEGLRSIRQL -DKLIDEENPEYGSSANRLC----------------------------------------- --------------------------VLGTADEGR----------------QVVMVQRFV- -Q-----SFGTVN-FMGHT-SICGLSMRAGEAAYLNDFVGYPHL-KPDF-KNCKFLLNIGT ---APAH----AG-NPFKRQAKLLAQART--------TGECR----YVTVTPILANSDNIA -VGERSRWLPVAPSGDLALVMGMIRLIIEEKRYLA----------DYLAIPSL-------- -------------------------ESQKALEEVSFTNATHLIIQKGEKEGQILKDSQGSP -W----VIDVKEGVLRDSKSVLRGELDFAGEVTLE-------------------------- -------GVSYEVKSAFLLLKESALA----------------------------------- -------------YTLEEYASFSGIDS---------KEIVHLAREFTSY-----GRSVGVD -CHGG---TMHTTGFYATYAVMMLGALVGNLNHKGGMSMGGGKFEDFNG------------ -----EAYNLIAYPNKPKPQGARIDRARMAYEKTSEFKRKVAQGENPYPAK---------- ------------------------APWYGLANALES--DVITNSEEGYPYK----LGALIS -WCANFIYG-------------------------------QSGSEHLLE-SLKDPKR-AIP -LFIAIDPFINETSRW--ADYIVPD-SVMYE-TWGVVSPWGASLT--------KASHL-RY -PILPSPNAK---WSNGEP---VSM------DSFIIELG-KALGLPGFGKNGIVAKSGEKF -PF----------DRPEELYL--RAFE-------------------NIALSG-KAVPEISD -EEIELAGLKEYASKLQ-AI-----------------NGENWR-RVAYVMARGG------- --------------RFAPIEDAYKGDS-----------------------LSR--AYPKAI -SIYNEALGTSKNSLTG--------------------------ERYSGVPRFYAPRFTDGR -ALEEAGLGDSRSFLAFSYKSNVLSA------------------PTTASRH--LKEL---- ------RY-----TTFVDMNSQSAKA-LGI-------------V-------------HGER -VRVV---SK-G--------------GF---V--I-GICRLREGIHPRSIGIEHG-AGREG -EGAIDLLINGNV-----------IRGEIARRSGVNINKLGLK-----DASKGKVGTLS-- ------DFVIG-------SNA----RQ--GI-----PVWIEKLS----------------- ------------------------------------------------------------- -- ->TtrA_Haemophilus_somnus_gb_ABI25172 ------------------------------------------------------------- -------------------------------MNKQRRNLIKGA-------LATTAATAFVA -GY-SPKVK-EIAKGVIEGSSGQKTQDNINGNSLLPEYQVKEGNLLTNSQQVVCNTQCMGC -WTLCGLRVRIDLEKN---KVLRING--------NPYHPLSS------DHYLDYN--QSIK -QAELSVSGENGLQQRSTACARGAAFLDGINSPY-RITQPLKRVG---------------- -------------------KRGEGK-WKTISFE-QLIDEVVNGGDLFGEGHVDGLKAIRDL -QTPVNAQHPDFGAKVNQLM----------------------------------------- --------------------------VTFAGPEG-----------------RQPLLKRFAN -N-----SFGTIN-FASHG-SFCGLSYRAGSGAFMNDFANNSHA-KPDW-DHVEFILFMGT ---SPAQ----SG-NPFKRQSRQLAKKRT--------EDNFE----YVVIAPRLELTSTAA -Q-DKNRWVPIIPGKDLSLALAMLRWIIENERYNE----------DYLSIPSE-------- --------------IAMQQANGVSFCNATHLFIADPNHKQYGQAIRNFHI-EDLSEPEKLS -DSDILVKDRQTGKFIAAKDCQSAVLFVEDRISLKD------------------------- -------GSQVLAKSALQLFKESCFS----------------------------------- -------------YSIEEYSEQCGVPV---------DTIIQLAKKFTSH----GPRAAVIT -HGGT----MHSNGFYTAWAILLLNAMIGNMNKKGGMSMSGGKFKDFSAG----------- -----PRYNLANFPNMVKPKGTNLARSKKDYEKSSEFKQKVAQGISPYPAK---------- ------------------------AAWYPFVGGQMS--EMITSALQGYPYS----LKAWIN -HMGNPIYG-------------------------------MTGIHHITQQKLKDPK--ILP -LFISIDAFMNETTAL--ADYIVPD-THNFE-SWGFSTPWAGVPT--------KTSTA-RW -PVIASPN-E---K--------TSQGDTICMESFVIEIA-KMMQLPGFGDNAILDKQNHSY -PL----------NRSEDFFL--RAAA-------------------NIAYDGKQPVQDATQ -EDLLLTGVQRLMPSLQQVL-----------------KPEEIK-KVATIYCKGG------- --------------RFAPHSSAWQEDN-------------------------MQARWKNCL -QIWNENVAKAKHAQTG--------------------------KNYHGCPTYFEDQFADNS -TVESHYPKIQWPFKLISFKSNLMSS------------------ITAPLLR--LHSI---- ------KP-----NGIVAINQQDATE-YGL-------------Q-------------HGDL -VELN---TP-G--------------GK---A--V-VQLVVMNGVIKGTIAIEHG-YGHKQ -LGATGYTINGKL-----------IEGNAQIGSGVNINDLGLL-----DSTKEIASPWV-- ------DWVCG-------SAV----RQ--GI-----PAKLVKLA----------------- ------------------------------------------------------------- -- ->TtrA_Yersinia_enterocolitica_YP_001005907 ------------------------------------------------------------- ------------------------------MAKSTRRQWLKGS-------LALGGVVAFGA -SY-HAVAR-KTLAGLVDGSAGKLTLDPISGNALPTEGRVGP-QWQANPQQAVSMTQCFGC -WTLCGLRVRVDTQQN---KILRIAG--------NPYHPLSH------DHHFPYQ--LPVG -EALQHLGGEQGMTGRSTACARGATLLEGVDSPY-RITEPMKRVG---------------- -------------------PRGSGK-WQRISFE-QLVAEVTEGGDLFGEGPVEGLRAIRDL -DTPIDAKQPSLGPKANQLL----------------------------------------- --------------------------VTNAGDDG-----------------RDAFIQRFAN -Q-----AFGTKN-LGSHG-AYCGLAYRAGSGALMGDLDKNAHV-KPDW-DNVRFALFLGT ---SPAQ----SG-NPFKRQGRQLANARQ--------RDDFN----YVVVAPALPLTTTLA -N-QHNRWVPVLPGTDAALAMGIIRWIIEQHRFNH----------AYLAIPGE-------- --------------MAMQAAGERSWTNASHLVITTETHPLAGQFLRANML---SGETVAEG -EESPVLAQAIDGALQPAAQMLQAELFVTQDLTLHD------------------------- -------GQNVQVQSGMTCLQQAAAR----------------------------------- -------------FTLAEYSQQCGVPE---------ATIIGLAREFTAY----QRQAAVIS -HGGM----MGGNGFYTTWAVMMLNAMIGNLNLKGGVSVGGGKFDGFADG----------- -----PRYQLATFVGMVKPKGLPLSRSKQPYEKSEEYQQKIQQGQSGYPAR---------- ------------------------GPWYPFVGGQLT--EQLAPALAGYPYP----LKAWIS -HMTNPLYG-------------------------------VAGLRNLIEERLQDPR--QLP -LFIAIDAFMNETTAL--ADYIVPD-THNFE-SWGFSAPWAGVLV--------KASTA-RW -PVVEPRTAR---TAQGEP---VAM------ESFLIAVA-KAMKLPGFGANAMQDSEGNSL -SL----------DRAEDYYL--RAAA-------------------NIAYGGEKPLPAAVD -DELRLTGVDRLWPALQRSL-----------------YPDEQR-RVAYLLARGG------- --------------RFAPYEKSWNGDA-------------------------TGSQWKKPL -QIWNENVAKHHHAITG--------------------------ERYSGCPTWYPPRLADGS -DVFQHYPVSDWPLRLMSFKSHLMSS------------------STAMIER--LRAV---- ------KS-----TNLVAINPQDAQR-NGI-------------Q-------------HGDI -VRLM---TP-G--------------GQ---M--E-VQVSLLDGVMPGVVAIEHG-YGHRE -MGSRAHT----------------LDGVVMASDPRIGQGSNLNDLGFTDPTREIPNTWL-- ------DWVSG-------AAV----RQ--GL-----PAKLQRIS----------------- ------------------------------------------------------------- -- ->DmsA_E_coli_sp_P18775 ------------------------------------------------------------- --------------------MKTKIPDAVLAAEVSRRGLVK---------TTAIGGLAMAS ----SALTL---------------PFSRIAHAVDSAIPT-------KSDEKVIWSACTVNC -GSRCPLRMHVV-DGE----IKYVETDNTGD---DNYDGLHQ------------------- ----------------VRACLRGRSMRRRVYNPD-RLKYPMKRVG---------------- -------------------ARGEGK-FERISWE-EAYDII--------ATNMQRL--IKEY -G-------------NESIYLNYGTGTL--------------------------------- --------------------------GGTMTRSWPP---------------GNTLVARLM- -N-----CCGGYLNHYGDY-SSAQIAEGLNYTYGGW---ADGNS-PSDI-ENSKLVVLFGN ---NPGE----TR-MSGGGVTYYLEQARQ--------KSNAR----MIIIDPRYTDTGAGR -E---DEWIPIRPGTDAALVNGLAYVMITENLVDQ----------AFLDKYCV-------- ----------------------------------------------------------GYD -EKTLPASAPKNGHYKAYILGEGPDGVA--------------------------------- ------------------------------------------------------------- -------------KTPEWASQITGVPA---------DKIIKLAREIGST----KP-AFISQ -GWGP---QRHANGEIATRAISMLAILTGNVGINGGNSGAREGSYSL-------------- -----PFVRMPTLENPIQTSISMFMWTD--------------------------------- ------------------------AIERGPEMTALR--DGV-RGKDKLDVP----IKMIWN -YAGNCLIN-------------------------------QHSEINRTHEILQDDK--KCE -LIVVIDCHMTSSAKY--ADILLPD-CTASE-QMDFALDASCGNM--------SYVIF-ND -QVIKPRF-E---C--------KTI------YEMTSELA-KRLGVEQQFTE---------- -------------GRTQEEWMR-HLYA-------------------QSREAIPELPT---- -------------------------------------FEEFRKQGIFKKRDPQG------- --------------HHVAYKAFREDPQ-----------------------ANPLTTPSGKI -EIYSQALADIAATWELP-------------------------EGDVIDPLPIY-TP--GF -ESYQDPLNKQYPLQLTGFHYKSRVHSTYGNVD-----------VLKAACRQE-------- ------MW----------INPLDAQK-RGI-------------H-------------NGDK -VRIF---ND-R--------------GE---V--H-IEAKVTPRMMPGVVAL--G-EGAW- ------------------------YDPDAKRV------DKGG------CINVLTTQRPS-- ------PLAKG-------NPS----HTN--------LVQVEKV------------------ ------------------------------------------------------------- -- ->DmsA_Actinobacillus_succinogenes_130Z gi|75429943|ref|ZP_00732527.1| ------------------------------------------------------------- ------------------------MNHLDLNSNTTRRRFIKTTG------LTAFAASAGIS -IPFATKAG---------------NQSITST--------------AGADEKVVWSACTVNC -GSRCPLRMHVK-DDQ----IIYVETDNTGS---ETYNLDHQ------------------- ----------------VRACLRGRSMRRRVYNPD-RLKYPMKRIG---------------- -------------------KRGEGK-FKRISWD-EALTEI--------AQSLQKN--IAQY -G-------------NESIYLNYGTGTL--------------------------------- --------------------------GGTVTKSWPP---------------GSTLIARLM- -N-----CIGGYLNHYGDY-STAQISVGLDYTYGGGWVLGNGMA---DI-ENTKLVVLFGN ---NPAET---RMSGGGLTYCIQQAKAKS----------NAK----LIVIDPRYTDTGVGK -E---DEWIPIRPGTDAALVSALAYVMITEELVDQ----------PFLDKYCV-------- ----------------------------------------------------------GYD -ENTLPADAPQNGHYKAYILGQGEDGIA--------------------------------- ------------------------------------------------------------- -------------KTPEWAAKITGIPA---------ERIIRLAREIGST----KP-AYISQ -GWGP---QRRSNGEIISRAIAMLPILTGNVGISGGNTGARESSYGV-------------- -----PFVMMPTLTNPVKASIPMFLWT---------------------------------- ------------------------DAITRATEMTAK--TDGIRGVERLTAP----IKFIWN -YAGNCLTN-------------------------------QHADINRTHEILQDES--LCE -MIVTIDNHMTSTAKY--SDIVLPD-CMTSE-QMDFCLDGYVANM--------SYVIF-AD -QAVKPSF-E---C--------RNI------YDMLSDLS-EKLGVKQQFTE---------- -------------DRTQEEWLRYIYRQ--------------------SREQLPELPV---- -------------------------------------FDEFRTQGIFKKVDPKG------- --------------FYIPYKEFRDDPQ-----------------------ANPLKTPSGKI -EIYSSRLAEIARSWKLD-------------------------EDEVIHPLPIHVDSFEHY -GD---PLMEKYPLQLTGFHYKARTHSTYGNVD-----------ILKS----ANPQE---- ------IW----------INPFDAEK-RGI-------------K-------------NGDM -LRMF---ND-R--------------GE---V--R-IHAKVTPRIIPGVVAL--G-EGAW- ------------------------HAP-----------DNQGID-HSGCINVLTTQRP--- ------SPLAK-------GNP----QH--SN-----LVQVEKL------------------ ------------------------------------------------------------- -- ->DmsA_Haemophilus_influenza_sp_P45004 ------------------------------------------------------------- ---------------------------MSNFNQISRRDFVK---------ASSAGAALAV- ----SNLTL---------------PFNVMAKETQRLNEN--------NQERIVWSACTVNC -GSRCPLRMHVK-DNR----ITYVETDNTGT---ETYNLDHQ------------------- ----------------VRACLRGRSMRRRVYNPD-RLKYPMKRIG---------------- -------------------KRGEGK-FKRISWD-EALTEI--------ADALKRN--IKKY -G-------------NESIYLNYGTGTL--------------------------------- --------------------------GGTMAKSWPP---------------ASTMIARFM- -N-----CIGGYLNHYGDY-STAQIAVGLDYTYGGG--WALGNG-MADI-ENTKLIVLFGN ---NPAET---RMSGGGLTYCIEQAKARS----------NAK----MIIIDPRYNDTGAGR -E---DEWIPIRPGTDAALVAALAYVMIQENLVDQ----------PFLDKYCV-------- ----------------------------------------------------------GYD -EKTLPTDAPKNGHYKAYILGYGNDGIA--------------------------------- ------------------------------------------------------------- -------------KTPEWAAKITGIPA---------ERIIKLAREIGST----KP-AFISQ -GWGP---QRRSNGELISRAIAMLPILTGNVGIHGGNTGARESAYSI-------------- -----PFVRMPTLKNPVKASIPMFLWTD--------------------------------- ------------------------AIIRGTEMTALT--DGI-RGVDKLSSP----IKVIWN -YASNCLIN-------------------------------QHAQINRTHDILQDDT--QCE -MIITIDNHMTSTAKY--SDILLPD-CTTSE-QMDFALDAFVSNM--------AYVIF-AD -QVIKPSF-E---C--------RPI------YDMLSDLA-EKMGVKEKFTE---------- -------------GRTQEEWLR-HIYE-------------------QSREKLPELPT---- -------------------------------------FEEFRQQGIFKKVDPNG------- --------------FKVAYKDFRDNPE-----------------------AHPLKTPSGKI -EIYSSRLAEIAKTWKLA-------------------------EDDVIHPLPIHAQSFEHY -GD---PLMEKYPLQLSGFHYKARTHSTYGNVD-----------VLKA----ANPQE---- ------VW----------MNPIDAEP-RNI-------------K-------------NGDM -IRIF---ND-R--------------GE---V--H-INVKITPRIIPGVVAL--S-EGAW- ------------------------YAP-----------DKDRID-HSGCINVLTTQRP--- ------SPLAK-------GNP----QH--SN-----LVQVERL------------------ ------------------------------------------------------------- -- ->TMAO_Shewanella_massilia_CAA06851 ------------------------------------------------------------- ---------------------------------MNRRDFLK----------GIASSSFVVL -GG-SSVLT---------------PLNALAK--------------AGINEDEWLT----TG -SHFGAFKMKRK-NGV----IAEV----------KPFDLDKY------------------- ----------------PTDMINGIRGMV--YNPS-RVRYPMVRLDFLLKGHKSNTH----- -------------------QRGDFR-FVRVTWD-KALTLF--------KHSLDEV--QTQY -G-------------PSGLH----AGQT--------------------------------- --------------------------GWRATGQLHS---------------STSHMQRAV- -G-----MHGNYVKKIGDY-STGAGQTILPYVLGSTEVYAQGTS-WPLILEHSDTIVLWSN ---DPYKNLQVGW-NAETHESFAYLAQLK----EKVKQGKIR----VISIDPVVTKTQAYL -G---CEQLYVNPQTDVTLMLAIAHEMISKKLYDD----------KFIQGYSL-------- ----------------------------------------------------------GFE -E------------FVPYVMGTKDGVA---------------------------------- ------------------------------------------------------------- -------------KTPEWAAPICGVEA---------HVIRDLAKTLV------KGRTQFMM -GWCI---QRQQHGEQPYWMAAVLATMIGQIGLPGGGISYGHHYSSIGV------------ -----PSSGAAAPGAFPRNLDENQKP---------LFDSSDFKGASSTIPV---------- ------------------------ARWIDAILEPGK--TIDANGSKVVYPD----IKMMIF -SGNNPWNH-------------------------------HQDRNRMKQ-AFH-----KLE -CVVTVDVNWTATCRF--SDIVLPA-CTTYE-RNDIDVYGAYANR--------GILAM--Q -KMVEPLF-D---S--------LSD------FEIFTRFA-AVLGKEKEYTRNMGEM----- -------------EWLETLYN--ECKA-------------------ANAGKFEMPD----- -------------------------------------FATFWK-QGYVHFGDGE------- --------------VWTRHADFRNDPE-----------------------INPLGTPSGLI -EIFSRKIDQFGY------------------------------DDCKGHPTWME-KTERSH -GG---PGSDKHPIWLQSCHPDKRLHSQMCESR-----------EYRETYAVNGREP---- ------VY----------ISPVDAKA-RGI-------------K-------------DGDI -VRVF---ND-R--------------GQ---L--L-AGAVVSDNFPKGIVRI--H-EGAW- ------------------------YGPVGKDGSTEGGAEVGALC-SYGDPNTLTLDIGT-- ------SKLAQ-------ACS----AY--TC-----LVEFEKYQGKVPKVSSFDGPIEVEI ------------------------------------------------------------- -- ->TMAO_Photobacterium_profundum_YP_129680 ------------------------------------------------------------- -----------------------------MNMSVSRRSFLK---------GLATTSAVSVI -GP-SLLAS---------------SKAMAAE---------------------TTGTWKTSG -SHWGAFRAHVY-AGK----VQEI----------KPLEMDKY------------------- ----------------PTDMLNGIKGII--YSPS-RVRYPMVRLDWLKKHKYSGE------ -------------------TRGNNR-FIRMTWD-DALDLF--------YRELERV--QKDY -G-------------PWALH----AGQT--------------------------------- --------------------------GWRQTGQFHS---------------CTSHMQRAV- -G-----MHGNFITKVGDY-STGAGQTILPYVLGSTEVYAQGTS-WSEILDHSKNIVLWAT ---DPVKNLQVGW-NCETHESFAYLEQLK----EKVAKGEIN----VLSVDPVKNKTQRFL -G---NDHMYINPQTDVAFMLAVAHTLYTEDLYDK----------EFIKMYCL-------- ----------------------------------------------------------GFD -E------------FVPYFMGKSKDNIE--------------------------------- ------------------------------------------------------------- -------------KTPEWAAEICGLPA---------DEIRDFARMLVAE------RTQILF -GWCI---QRQEHGEQPYWMGAVIAAMVGQIGLPGGGVSYGHHYSSIGV------------ -----PSTGFAAPGGFPRNVDEGQKP---------KWDNNDFNGYSRTIPV---------- ------------------------ARWVDCLLEPGK--EIKYNGSKVILPD----YKMMII -SGNNPWHH-------------------------------HQDRNRMKQ-AFQ-----KLQ -TVVTIDFAWTATCRF--SDIVLPA-CTQFE-RNDIDVYGSYSGR--------GLVAM--H -KLVDPLY-Q---S--------KTD------FDIFTELS-RRFGRHKEYTRGMDEM----- -------------EWVRSLYS--DCRD-------------------ANKAKFDMPE----- -------------------------------------FDEFWA-KGVLDFGEGT------- --------------PWVRHADFREDPE-----------------------INALGTPSGFI -EISSRKIDRFGY------------------------------EHCQGHPMWFE-KSERSH -GG---PGSKKHPFWMQSCHPDKRLHSQMCESE-----------EMRATYAVKGREP---- ------VY----------INPKDAAE-KGI-------------K-------------DGDI -VRVF---ND-R--------------GQ---L--L-AGAVLSDSYARGVIRI--E-EGAW- ------------------------YGPLNE--------KVGAID-TYGDPNTLTQDIPS-- ------SELAQ-------ATS----AN--TC-----LVDFEKFKGEVPPVTSFGGPIEVS- ------------------------------------------------------------- -- ->TMAO_Vibrio_vulnificus_YP_004189064 ------------------------------------------------------------- -------------------------------MAITRRSFLK---------GVATTSAASVI -GP-SLLAS------------------------------------ASANAVETTGTWKVSG -SHWGAFRAHIY-AGK----VQEI----------KPIELDQN------------------- ----------------PTEMLNGIKGII--YSPS-RVRYPMVRLDWLKKHKYSAD------ -------------------TRGNNR-FVRVTWD-EALDLF--------YRELERV--QKEY -G-------------PWALH----AGQT--------------------------------- --------------------------GWNQTGSFNN---------------CTAHMQRAV- -G-----MHGNYITKVGDY-STGAGQTILPYVLGSTEVYAQGTS-WSEILENADNIILWAN ---DPVKNLQVGW-NCETHESYAYLAQLK----EKVAKGEIN----VISVDPVKNKTQRYL -E---NDHLYVNPMTDVPFMLAIAHVLYTENLYDK----------KFIETYCL-------- ----------------------------------------------------------GFE -E------------FINYVQGKTKDKVE--------------------------------- ------------------------------------------------------------- -------------KTPEWAAPICGVKA---------DKIREFARMLV------KGRTQILM -GWCI---QRQEHGEQPYWAAAVVAAMIGQIGLPGGGISYGHHYSSIGV------------ -----PSTGFAGPGGFPRNLDAGMKP---------KWDNNDFNGYSRTIPV---------- ------------------------ARWIDCLLEPGK--EINYNGGKVKLPD----FKMMVI -SGCNPWHH-------------------------------HQDRNRMKQ-AFQ-----KLQ -TVVTIDFAWTATCRF--SDIVLPA-CTQWE-RNDIDVYGSYSSR--------GLIAM--H -RLVDPLF-Q---S--------KPD------FQIMKELT-ERFGRSEEYSRGMSEM----- -------------DWIRSLYN--DCKK-------------------SNEGKFEMPE----- -------------------------------------FDEFWE-KSVLDFGQGQ------- --------------PWVRHADFRQDPE-----------------------INPLGTPSGFI -EITSRKIGRYGY------------------------------EHCQEHPMWFE-KSERSH -GG---PGSDKHPFWLQSCHPDKRLHSQMCESE-----------EFRATYAVKGREP---- ------VY----------INPLDAKA-KGI-------------K-------------EGDL -VRVF---ND-R--------------GQ---L--L-AGAVLTDSYPRGVIRI--E-EGAW- ------------------------YGPLSE--------KVGAIC-TYGDPNTLTQDIGS-- ------SELAQ-------ATS----AN--TC-----IVDFEKFTGKVPPVTSFGGPIEVA- ------------------------------------------------------------- -- ->TMAO_Citrobacter_youngae_ZP_06352135 ------------------------------------------------------------- --------------------------------------------------MLAVGAASAL- ----APNPL---------------ISKVWAA-------------------GENPEQWIQSG -SHFGAFEAKVV-NGE------WLET--------RPFKHDKY------------------- ------------------PCDMLNAVREVVYNPS-RVRYPMVRLDWLRKREKSDRS----- -------------------QRGDNR-FVRVSWD-QALDLF--------YEELERV--QKTY -G-------------SSGVF----TGLA--------------------------------- --------------------------DWQMVGKYHK---------------AGGAMDRGL- -G-----LHGSYVTTVGDY-SAAAAQVILPHVIGSLEVYEQQTS-LPLVIQNSNTIVLWGC ---DPIKNLQIEFLVPDHDAFGYWQQIKE-----AVAQGKMR----VISVDPVRSKSQNYL -G---CEQLALRPQTDVALMLALAHTLYEEKLYDT----------AFINDYTV-------- ----------------------------------------------------------GFE -Q------------FLPYLLGESDKQP---------------------------------- ------------------------------------------------------------- -------------KNAEWAAEICGLTA---------EQIRDFARLLV------KGRTQFMG -GWCA---QRMHHGEQYPWMLVVLASMVGQIGLPGGGVGFGWHYNGGGTVTS--------- -----AGPVLSGLGGIANPPPAKY--------------KADFRGASEHIPT---------- ------------------------SRIVDCLLEPGK--KVAFNGETLTWPD----IKMAIY -SAANPFHA-------------------------------QQDRNRMIE-AWK-----KLE -TVVVLDHQWTASCRF--ADIVLPV-TTRFE-RNDIEQFGTHSNK--------GLMAL--H -QVVKPQY-E---A--------RHD------FDVFAGLC-KRFDKEAVYRE---------- -------------NRDEMQWIQALYDE--------------------GVKMGASLGVSLPD -------------------------------------FTTFWQGEGYIEYPAGQ------- --------------PWVRHGEFRDQPD-----------------------LNPLGTPSGLI -EIYSKTIAGFAY------------------------------EDCPGHPVWME-PFERNH -SA----KKNKYPLHLQSCHPDKRLHSQLCSSD-----------AFRNTYAVAGREP---- ------LY----------ISAQDAAA-RGL-------------K-------------AGDI -ARVF---ND-R--------------GQ---V--L-AGVVISPDFTPGVIRI--H-EGAW- ------------------------YSP-------QEGGKAGTLC-TYGDPNVLSADIGT-- ------SQLAQ-------GPS----AH--TV-----LVEVERYQQKAPQVTAFGGPETV-- -------KEEGGSAA---------------------------------------------- -- ->TMAO_Salmonella_enterica_gb_AEZ47489 ------------------------------------------------------------- -------------------------MKNKDSLHVSRRRFLAQL-------GGLTVAGMLGP -SLLTPRSA---------------RAADAVA------------------PGAATKEGILTG -SHWGAIRATVV-DGR------FVAA--------KPFEQDKY------------------- ----------------PSKMIAGLPDHV--HNAA-RIRYPMVRVDWMRKGHQSDTS----- -------------------QRGDNR-FVRVSWD-EALDLF--------YQELERV--QKTY -G-------------PSALL-----TAS--------------------------------- --------------------------GWQSTGMFHN---------------ASGMLARAI- -A-----LHGNSVSTGGDY-STGAAQVILPRVVGSMEVYEQQTS-WPLVLQNSKTIVLWGS ---DMVKNQQANW-WCPDHDVYQYYEQLK----EKVASGAIS----VISIDPVVTSTHDYL -GRDKVKHIAINPQTDVPLQLALAHTLYSEKLYDK----------NFLDNYCV-------- ----------------------------------------------------------GFD -Q------------FLPYLLGEKDGQP---------------------------------- ------------------------------------------------------------- -------------KDAAWAEKLCGIDA---------DTIRALARQMA------GDRTQIIA -GWCV---QRMQHGEQWSWMVVVLAAMLGQIGLPGGGFGFGWHYNGAGT------------ -----PGRKGIILSGFSGSTTVPPVHDSTDYKGYSSTIPI--------------------- ------------------------ARFMDAILEPGK--IINWNGKSVKLPP----LKMCVF -AGTNPFHR-------------------------------HQQINRIIE-GWR-----KLE -TVIAIDNQWTSTCRF--ADIVLPA-TTQFE-RNDLDQFGNHSNR--------GIIAM--K -QVVSPQF-E---A--------RND------FDIFRDLC-RRFNREAAFTEGLDEM----- -------------GWLKRIWQ--EGSQ-------------------QGKGRGIHLPT---- -------------------------------------FEVFWNQQEYIEFDHPQ------- --------------MFVRHQAFREDPD-----------------------LEPLGTPSGLI -EIYSKTIADMQY------------------------------DDCQGHPMWFE-KIERSH -GG---PGSQRWPLHLQSVHPDFRLHSQLCESE-----------TLRQQYAVGGKEP---- ------VF----------INPQDASA-RGI-------------R-------------NGDI -VRVF---NA-R--------------GQ---V--L-AGAVVSDRYAPGVARI--H-EGAW- ------------------------YDP-------DKGGDLNALC-KYGNPNVLTLDTGT-- ------SQLAQ-------ATS----AH--TT-----LVEIEKYTGPMDNVTAFNGPAEMVA -QCEYVPASQGNPHD---------------------------------------------- -- ->TMAO_E_coli_CAA52095 ------------------------------------------------------------- -------------------------MNNNDLFQASRRRFLAQL-------GGLTVAGMLGP -SLLTPRRA---------------TAAQAAT------------------DAVISKEGILTG -SHWGAIRATVK-DGR------FVAA--------KPFELDKY------------------- ----------------PSKMIAGLPDHV--HNAA-RIRYPMVRVDWLRKRHLSDTS----- -------------------QRGDNR-FVRVSWD-EALDMF--------YEELERV--QKTH -G-------------PSALLTAS-------------------------------------- --------------------------GWQSTGMFHN---------------ASGMRAKRI- -A-----LHGNSVGTGGDY-STGAAQVILPRVVGSMEVYEQQTS-WPLVLQNSKTIVLWGS ---DLLKNQQANWWCPDHDVYEYYAQLKR-----KSAAGEIE----VISIDPVVTSTHEYL -GGEHVKHIAVNPQTDVPLQLALAHTLYSENLYDK----------NFLANYCV-------- ----------------------------------------------------------GFE -E------------FLPYLLGEKDGQP---------------------------------- ------------------------------------------------------------- -------------KDAAWAEKLSGIDA---------ETIRGLARQMAAN------RTQIIA -GWCV---QRMQHGEQWAWMIVVLAAMLGQIGLPGGGFGFGWHYNGAGT------------ -----PGRKGVILSGFSGSTSIPP-----------VHDNSDYKGYSSTIPI---------- ------------------------ARFIDAILEPGK--VINWNGKSVKLPP----LKMCIF -AGTNPFHR-------------------------------HQQINRIIE-GLR-----NVE -TVIAIDNQWTSTCRF--ADIVLPA-TTQFE-RNDLDQYGNHSNR--------GIIAM--K -QVVPPQF-E---A--------RND------FDIFRELC-RRFNREEAFTEGLDEM----- -------------GWLKRIWQ--EGVQ-------------------QGKGRGVHLPA---- -------------------------------------FDDFWNNKEYVEFDHPQ------- --------------MFVRHQAFREDPD-----------------------LEPLGTPSGLI -EIYSKTIADMNY------------------------------DDCQGHPMWFE-KIERSH -GG---PGSQKYPLHLQSVHPDFRLHSQLCESE-----------TLRHEYTVAGKEP---- ------VF----------INPQDASA-RGI-------------R-------------NGDV -VRVF---NA-R--------------GQ---V--M-AGAVVSDRYAPGVARI--H-EGAW- ------------------------YDP-------DKGGELGALC-KYGNPNVLTIDIGT-- ------SQLAQ-------ATS----AH--TT-----LVEIEKYNGTVEQVTAFNGPVEMVA -QCEYVPASQVKS------------------------------------------------ -- ->TtrA_Aeropyrum_pernix_NP_148724 ------------------------------------------------------------- --------------------------------MVSRRDFVK---------GSIAIASLLVA -GA-GLQPV--------------LSQLVRPKFERIAPDL------QMGANVRYVYSSCLGC -NVRCGIKARVVKVGDLEI-VERIEG--------NPYHPYNRAVSLNGNGKLGSQHLRFYH -LPYNTPVKEALTKWHGTLCPRGQDGIYYLYDPY-RVLVPLKRAG---------------- -------------------PRGSGK-WKPISWEQLIREVVEGGVIEETGERLPGLRDFFVY -G----KLREAGFEDPNAILSDMKKDVQEILEYAKKPETSYEDIVMKIEEFKEKWSKILGE -KGLKLDDILIDPDRPDLGTKANMVAYLRGRGQGH----------------TDYMSARWI- -A-----GFGSVN-WLRHT-SACQLGYYAANYLWAG---YHDIQ--PDP-VSSKVIIMAGA -SMGRLH-------PGTTGQGLLISRAGE---------GDLK----IYYVNPTAPRTDAGG -N---IVWIPIKPGYDAALAFALIRWIIENERYNK----------EFLEIPNE-------- ----------------------EAAERKGYPVHSNATWLVIMEEGHEKWGEYLKAKDVGLE -D-SDKPVVFTGEGLATYDSVDNAEIDWEGEVVLTT------------------------- -------GERVKVKTSFRILKDEALSR---------------------------------- -------------SIDQWLSVASPYEPGSSEFREWKEKVLEMARDFAEA----APMAGTYV -HRGV---GMHSNGEYAVWAYRALDTLVGNYHRKGGLLARAGHTKYNSY------------ -----VYHVDKKGFGEPVKWGPPIDRHKAKYEDTLEYWLKVKKGENPYPAKR--------- ------------------------PWYPHTPEESYT--EIFAGIAEEYPYK----MGALIL -FYANPVLS-------------------------------ANYGVKFIE-VLKDTK--KLP -LFIAITTTINETMLY--ADYIVPD-TTYLE-TGTLGMQYLYASSGGV-----LLAEAARS -PVVMPLT-----QKIGEPERYASF------WEFFIDTG-KALGMPGFGKG---------- -------------AIKGLKYH--EGKS-------------------YDLDSLWDYIMRVYA -NAAMHAKDMGIIPENVPEEEVKFVEENYPVAKFKHLIPDEWP-YVAYMLARGG------- --------------VFTSYEESFHPNGVSKRKV----------PSKRKKFKKTLMLWNEDL -AKTRNSVTG---------------------------------AKFWGGPKYIP-PSTYAP -VKGGSKSFYGTPLREIYPESEYPFHLVFTTGPLFTKHRSQFYYAIKQISP---------- -------------ENYLVVNPKDAEK-LGL-------------E-------------TGDV -VEVE---TP-T--------------GR---F--K-APVVVEPTVPPGVIMVPYG-MGRWA -DTVVKKPSYFE------------VKDSRLASLINELPEREEIPEEAVNPVKKLPELKK-- ------KVLFTKSTPAYYNQAEPDKWRFNGITPN--VAEMSDPSLGGWPLLSIIGAAQAYY -FNVARIRKTGEKHEFEKTYPYIVW------------------------------------ -- ->TtrA_Pyrobaculum_arsenaticum_YP_001152643 ------------------------------------------------------------- --------------------------------MTSRRTYLK---------AIAAAA---AL ----GVALW-GYWPVV--------DKIIKPKRNPYGPDP------QYGKNVRYVHTTCLGC -NVRCGIRVRVVKYGDVEV-IERIEG--------NPYHVYNRAVSFD----SQVK--RYKQ -LPYNTPVKEALERWSGTLCPRGVDGIHYVYDPY-RVLKPLKRAG---------------- -------------------PRGSGK-WKVITWEQLNNEVVNGGIIEETGERLPGLKDFFVY -G----KLKEAGFEDPNAVLSEMKADVDNIMKIARDPNKTYDELVKAIEGFKAKWSQKLGE -KGLKLEDVFIDPDRPDLGTKANMVMYLRGRGQPP----------------TDYFSQRWI- -Y-----AFGSVN-WTRHT-SACQLGFYTGNRIWAG---YTDIQ-A----DPVGAKVIIGA -----------GWSMGRLHPGATGQGLII----ERACEGDLK----LYYINPVAPRTPCNG -N---IIWIPVKPGEDATLAFAVIRWLIENKRYNE----------EFLSLPNR-------- ------------------------DSAKKAGYPVNTNATWLVITEGQRFGEYLKARDIGLE -N-SDKPVVWTGEKFATYDSVDKADLYYVGKVTLPT------------------------- -------GEAVAVKTAFMILREEAFSR---------------------------------- -------------SFEEWLAIASPYEPGTPEFRDYVKKVEQMARDFADA----APRAGTMI -HRGV---GMHPNGEYITWAYRAIDTLIGNFHRMGGLLGRAANTSYLSYVYNVGYSGFGEP -PRWGPPIDRHNYAYEATLEYWLRVKEAL------KEGKSWEDAVKAAFPTKR-------- ------------------------PWYPLTPEESYT--EIFAGIAEGYPYK----IGAFIM -FYANPVLA-------------------------------TNYGVKFVE-VLKDTS--KIP -LFIAITTTINETAMY--ADYIVPD-TTYLE-TGTMGVQFLYATSGGV-----TLAEPWRS -PAIMPLT-QRISDCPNGHPRYASF------WEFFIDTA-KALGMPGFGDRAVPGVKG--- -------------KKYEGRWF--PLHC-----------------------EWEYVMRVFAN -AALDAKDRGLIPEQVPEEEVKFVEENYPIAQFKDIIPPEEWK-YVAYGLARGG------- --------------VFTSYEQSFDERGV----------------------SKRSVPGRGTL -YLWDETLAKTRNSVTGEKFW----------------------GGPKYFPIATY-APAGPA -FQKADKWLHGTPLRQLYPEKDWPFMLVFYTGPIYTKHRSQFYYWIKQIAP---------- -------------ENFVLINPEDAAK-IGV-------------E-------------TGDV -VRVE---TP-V--------------GF---F--E-APAVVEPTVAPGVIMVPYG-MGRWA -DTVLVKPKYFELRDAKLKLTVDGLPEKMEVPEDAVNPVKGLPDVVKKILFTKSPAEYY-- ------EKGLA-------PDK----WRFNGVTPN--VVQMSDPSLGGWPLLSWLGASQAYF -DTPVRITKTGQKHKFETPYIVW-------------------------------------- -- ->TtrA_Pyrobaculum_aerophilum_NP_559177 ------------------------------------------------------------- --------------------------------MTSRRAYLK---------AIAAAA---TL ----GIALW-GYWPVV--------DKIIKPKRTPYGPDP------QFGTNVRYVFSSCLGC -NVRCGIVARVVKYGDVEV-IERIEG--------NPYHVYNRAVSFD----KQIK--RYAP -LPYNTPVKEALEKWSGTLCPRGADGIHYVYDPY-RVLKPLKRAG---------------- -------------------PRGSGK-WKAITWEQLINEVVNGGVIEETGERLPGLKEFFAY -G----KLKEAGFEDPNAILSEMKIDVDNIMKVARDPNKTYDDLIKAIEEFKAKWSQRLGE -KGLKLEDLLIDPDRPDLGTKANMVMYLRGRGQGHT----------------DYFSQRWI- -Y-----AFGSVN-WTRHT-SACQLGYYAGNSIWAG---YHDIQ-A----DPIGAKVIIGA -----------GWSMGRVHPGATGQGLMI----ERACEGELK----LYYVNPVAPRTTCNG -N---IIWIPVKPGEDAALAFAVIRWLIENKRYNE----------EFLSIPNR-------- ------------------------DSAKKLGYPVNTNATWLVITEGERFGEFLKARDVGIE -D-SDKPVVWTGERFATYDSVDKADLYYVGKVTLPS------------------------- -------GETVTVKTAFMIVRDEAFSK---------------------------------- -------------SFEDWLAIASPYERNTPEFADYVKKIEQMAKDFADA----APKAATTL -HRGV---GMHPNGEYIVWAYRTIDTLVGNFHRMGGLLARAAHTAYENYVYNVGRSGFGEP -VRWGPPIDRHRYAYENTLEYWLRVKKAL------KEGKSWDEAVKAAFPTKR-------- ------------------------PWYPHTPEESYT--EIFAGIAEGYPYR----IGALIL -FYANPVLA-------------------------------TNYGVKFIE-VLKDPA--KLP -LFIVITTTINETALY--ADYIVPD-TTYLE-TGTMGIQYLYATSGSV-----TLAESWRS -PVIMPLT-QRISDCPNGHPRYASF------WEFFIDTA-KALGMPGHGDKAIPGVKG--- -------------KKYEGKWF--SMHC-----------------------EWEYILRVFAN -AALDAKDKGLIPEDVPEEEVKFVEENYPIAQFRDILPPDEWK-YVAYGLARGG------- --------------VFTKYEESFDERGI----------------------SKRRVPGRGTL -YLWSEEVAKTRNNVTGEKFW----------------------GGPKYFPIATY-APAVPA -FQKADEWLHGTPLRQLYPEKEWPFILILYTGPLYTKHRSQFYYWIKQVVP---------- -------------ENFVLINPEDAAK-LGV-------------E-------------TGDV -IKVE---TP-V--------------GA---F--E-APAVVEPAVAPGVIMVPYG-MGRWA -DTVVVKPKYFE------------LKDARAKSLIDELPDKVEIPEDAVNPVKHLPDVVK-- ------KLLFTKSPAEYYEKGLAVDKWRFNGVTPN-VAEMADPSLGGWPLLSWLGAAQAYF -DTPARIVKTGQRHKFEVPYIVW-------------------------------------- -- ->ACTB1_Anaeromyxobacter_dehalogenans_YP_002491266 -----------------MPSLGLPIYGQK----------QGAGLDARRWRSVEEAA---EA -REVPPGEFPDDAAAVPE--G----------FT--RRGFLQ-V-------LGASVA---LA ----GLEAC--KPP----------RENVVSY--VRPPAG------VTPSLPSAYATVASRG -GYAVGVVVTSH-EGR----PTKIEG--------NREHPSSR------------------- ----------------GGSDAMLQASILDLYDPR-RLKG-FTRAG---------------- ---------------------------RPLGFA-TLLREV---------SALARSHAQDGG -A---------------RLR----------------------------------------- --------------------------FLVEPTSSPA---------------VADLRRRIL- -E-----RFPRAR-FDAWA-PVGADAGRAGAAIAFG---KPLDA-AASL-ADADVILSLES ---DFL-----ALEGDSLRLAREFGARRT-------AERMNR----LYVAESAYTVTGGAA -D----HRFRMRSADVLGFGRAVAAELAAKHGLAQ-------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------LAPLG-APAGGERA---------KAAAAVAADLARA----RGRSAVLA -GDRQ--------PAAVHALAAALNGALGNAGKTVAYR----------------------- -----PTALLDPAAG---------------------------------------------- ------------------------PDRLRALAGELE--AGK--------------VDALVV -TAWNPAHT-------------------------------APADVPLRK-LLP-----KAK -DTIALALREDDTVRL--ATWKIAA-THPLE-AWGDLRAAD------------GTASI-QQ -PLIAPLH-E---S--------LSE------LELLAAFL----DEGDHGTW---------- -------------RIVREGWR-------------------------RRAGEAG-------- -------------------------------------FDGRWD------------------ --------------GWLAAGVV--------------------------------------- -------------------------------------------AGSAVPPEPAQADLARVA -EAVRAVAAPGASLELGFAADYKVLDGRFLENA-----------WLQEYPH-PITKL---- ------TW-----DNAAQLSAATAKQ-LGV-------------E-------------SGDL -VELS---WR-G--------------RT---L--T-APALVVPGHADGSVLLTLG-YGQA- ------------------------LSGPVGK-------GVGH------DAYALRT------ -------------------SD----APWFGA-----GVEVRKTGKRHPL------------ ------------------------------------------------------------- -- ->ACTB1_Gluconacetobacter_diazotrophicus_YP_001602862 ------------------------------------------------------------- -----MPSLDGLPGDEREWIGRFPHLEQALAHPLDRRRTLK-------------LMALALA -GG-GLAGCDPGT-----------PDRGFVSAVRAAPGV-------IPGVPNVYASAHVRD -GYANGILVTHQ-MGR----PTKVEG--------NPGHPSSL------------------- ----------------GATDVFAQAAIQDFYDPD-RASGPL-------------------- ---------------------HDG---MPAAWQ-EV------------TTALQVLRAAPNG -GVPQG---------ASGLR----------------------------------------- --------------------------ILTGTVTSPT---------------LGAAIDALL- -A-----AYPGAI-WHRWD-AIGRDTVRQGAELAYG---RPAMV-IPDL-RQVDVALAVDS ---DLLD----SA-PGHLRHARAFAGRRN-----PVQGPMNR----LYAVEPTPSLTGVAA -D----HRFITAPAACDEIIGRLAAAVLRNEAPSG-------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------GPDW--------------------LGAVVADLRAH----PGRALIHL -GPDH--------GAQAQAAVHAMNEALGGRGRAFDVFDAPDHR----------------- -----PARPTSTLPA---------------------------------------------- ------------------------------LMDDME--NG----------R----VRALLI -LDVNPVYQ-------------------------------VP---RFAA-ALP-----RVP -LSVALADRPHETAQA--ARWHVPL-AHGFE-EWGDARADD------------GTATI-LQ -PQAMPLY-G---G--------VSA------ATILHLCA-GDVARPAR------------- -------------DLVRQTWR--QHLP---------------------------------- -------------------------------------SERDWRAALAAGVVPGT------- --------------ASARLDTPLA------------------------------------- -------------------------------------------PVMPPAPPPAP-PV---- ------------DLTLLLRPDPHLWDGREANNP-----------WLQELPR-PLSKI---- ------VW-----GNPLLIPPDLARS-MGL-------------R-------------NGDE -VALS---VG-A--------------RR---A--V-LPIWVQPGQASGCVVGLLG-SGRR- ------------------------RAG---------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -- ->ACTB1_Opitutus_terrae_gb_ACB77208 -------------------MKRKSDHSAP---------ANSEPTGPKYWRSLDELAATPGF -QEQLHREFPEGASELN---G----------VD--RRHFLK-I-------MAASFA---LG -GV-GLAGC-RR-P----------EKYVLPY--GKSVEG------MIPGLPLYFATAMPLR -RTAIPVLAETH-QGR----PTKIEG--------NPTYQQHG------------------- ----------------GSASLLAQASVLDLYDPE-RATQ---------------------- -------------------HTREGR---KLNVA-DLNEQL----------AQIGTSHAANG -G--------------AGLA----------------------------------------- --------------------------FLAEESSSPT---------------RARLLAQLR- -A-----RLPRAI-WAEYE-PVADEAPVSAATAAFG---QPVRP-LYRF-ARARRIVSLDA ---DFL-----RPDGAGLYYAREFAKGRR-VVNREDAQQMNR----LYVAESAFTITGSMA -D----HRLRLASSHMLALAAALAVKITGSAAFAP-------------------------- ------------------------------------------------------------- --------------LSAGLD----------------------------------------- ------------------------------------------------------------- -------------IDPKW--------------------IDECAADLLAH----RGTSVFVA -GAHL--------PEQVHAIAYAINAALGNIGATVDFVAP--------------------- -----PTNDAASIQT---------------------------------------------- ------------------------------LATAIR--DGA--------------IDTLVI -LGGNPVYN-------------------------------APADLDWAA-LQK-----SVK -NVVRLGYHTDETTVASPAGAHLAA-AHYLE-SWGDARTAD------------GTIVP-IQ -PMILPLF-G---G--------LTE------LEVLARIV----GANNPDPY---------- -------------ALVLETIT--ALAG---------------------GD----------- -------------------------------------AEKAFQ-QFL----HDG------- --------------LLANSAYPTVAVS---------------------------------- -------------------------------------------YNAAGVARLLG-AG--AG -NP---AALSKDNLEVRFVTDYKMDDGRFANNG-----------WLQELPD-PITKI---- ------SW-----DNAILVSPRLARE-LGV------------YP-------------DGST -LQVARVEMA-GFHQGKEQAFIGELTVNGRTV--R-APIHIQPGLSNYTVVLPLG-YGRT- ------------------------QSGHVGR-------GMGH------DFYPLRTSAGL-- ------HFTVGGKLVPTQDVKAMPNTQEHWSMEGRDIIREANVDEFLENPRFVAAFGMESH -SPSI-------------------------------------------------------- -- ->ACTB1_Ralstonia_eutropha_YP_298623 ------------------------------------------------------------- ------------MTRARVIPLVPVDEPSDAPRSPARRHFLRTT-------MAASAALAGAA -CS-GPP-----------------AEMIVPY--VQMPEG------IVPGRPLFYATALTRH -GYGMGVLVETN-MGR----PTKIEG--------NPRHPASL------------------- ----------------GATHPFDQAAVLQLWDPD-RSQAPYR------------------- -------------------GGALSG------WA-AFDAAL--------ATQRVQWRDRDGE -G----------------LR----------------------------------------- --------------------------LLTGNVGSPT---------------LSAQIAQWL- -D-----RYPKAV-WHVHD-PLYDEDPS--PRMAFG---DDVDL-LIDP-KPATTIVTLDA ---DLVG----HG-PAAVRHAHDFMADRR----GVAPMLACR----LYAIESSPTLTGEIS -D----NRLALPPHEIERLAWSLARKLGVPDVPVD-------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------TP---EPASDTAR---------HWIAVLARRLREAP---PGSSLLIA -GGAL--------SGPTRALVWRLNARLGNLGKSVRPVAGT-------------------- -----PRRPLGE------------------------------------------------- ------------------------AHSIGALTEAMR--AGA--------------VSALLM -IDVNPAYD-------------------------------APCGLGFDA-ALR-----HVP -WSSHMGVYRDETARL--TTWHAPM-AHDLE-RWSDARAWD------------GTASI-VQ -PVIAPLN-G---G--------RSA------HELLS----AAVDEHQSGY----------- -------------DLVRAHWRARQRDD---------------------------------- -------------------------------------FDAFWE-QAL----RTG------- --------------VIADTAAPP-------------------------------------- -------------------------------------------ATTDMRQPITP------- ------PSFAAPPLVARFMPDPATDAGELANNA-----------WLQELPR-ALTRH---- ------TW-----DNAALIGPLTARA-RRL-------------S-------------TGDI -VVIRRTDRQ-G--------------NP---I--E-APVWVLPRHAEGVVSLPLG-YGRRH ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -- ->ACTB1_Salinibacter_ruber_emb_CBH25246 -------------------MIELDVIDSETAARDEESGARDGSSEPTFWRHWSESDADEDG -DDLT--EFVPGDSEPPS--G----------AS--RRQFLQ-L-------MGAAMA---MA ----GLAGC-RR-P----------EEKILPY--AREPET------VTPGIEDHYATSMPFR -GVLRPVVAQSN-EGR----PTKIKG--------NSDHPSGQ------------------- ----------------SGTSPYEQASVLNLYDPD-RSRS---------------------- -------------------VRQEGR---AASWS-DFVSFC---------RQLGNEADQHQV -A----------------------------------------------------------- --------------------------VLAEKTSSPT---------------VQAMRQRMA- -D-----RFPNLQ-WVPYA-PTGTDPRRLGMQQAFG---RPLRP-RFEL-GEAEVIVSLDA ---NFLD----GRTHDFGYHTQGFAEGRR---LDDAEDTMSR----LYTVESRYSTTGGSS -D----HRLAMRAGRIPALAAALAAELGVGEAPDV-------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------SWSERER-------------LHVREMARDLQAA----GEHGVVMA -GEAQ--------PPEVHALAMAVNQRLGGLGTTVTLFDPGDDEIQ--------------- -----PQ------------------------------------------------------ ------------------------DEALADLTASMR--AGE--------------VDTLFM -LGVNPVYD-------------------------------APSELGFEE-ALS-----NVR -DTVHLGRLRNETAQA--ARWHLPR-THYLE-QWGDGRAYD------------GTKSI-VQ -PLIRPLYDD---A--------HSL------IEVLNLAA-TGVDASGH------------- -------------DLVREQWR--AQLP---------------------------------- -----------------------------------APFQERWR-KAL----HDG------- --------------YLEGSGYETAS------------------------------------ -------------------------------------------VGTATVPSIDA-PA--SD -PD---------EIEVVFRTDSKLLAGRFSNNP-----------WMQELPD-PISKI---- ------VW-----DNVAVMSRATADE-LGV-------------EVQRREGSF-----YADR -VELT---LD-G--------------QS---V--K-LPVWVQPGYPDGSIGVSMG-YGRTI -ASTRESESTP-------------FWDTSDQTNIYNGSPIAGGVDSSGEPVDVVGGNVAPM -RPNGGRVATGANVTQVGSGYLLATTQEEGSMQGRPIVRWATLDEFKENPEFVNESQPPVP -DLGHESGGHGDGGHGDGGGHGGGDGHSGDGAAGNVSGQGLEAGPGADAHGADEMPEQAAH -G ->ACTB1_Rhodothermus_marinus_gb_ABV55245 -------------------MIELPVVNPD--------GAETPGSGKRLWRSTADLRRDPEW -VKLAHDEFMPGVAEPPS--G----------TS--RRQFLQ-I-------MGASMA---LA ----GLTAC-RR-P----------VEKILPY--VRQPEE------IIPGIPLYYATAMPFR -GSVRPLLVESH-EGR----PTKIEG--------NPDHPLSR------------------- ----------------GATGVFEQASLLNLYDPD-RSQQVL-------------------- -------------------RKGEPA-----SWG-DFVQF---------ARSL-----AAEA -G-------------TKRLA----------------------------------------- --------------------------VLCEPSSSPT---------------LAALRRELE- -R-----RYAQVR-WVTYR-PEGDDHEALGLQQAFG---RPVRA-RYRF-SEARVIVSLDA ---DFLG----PTDRNFVENTREFAASRR---MERPEDEISR----LYVIESTYTVTGGMA -D----HRLRLRAGDIPAFAAALAAELGVGELREA-------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------GARFAGHPY-----------VVEIARDLRAA----GARGVVLA -GETQ--------PPAVHALCAVINDLLGSLGRTVILHALDEP------------------ -----ATAQHAALAE---------------------------------------------- ------------------------------LVQAMQ--AGA--------------VDALLL -LNVNPVYD-------------------------------APAALGFAE-ALA-----QVP -EVIHLGLHMDETARR--STWHLPS-THYLE-AWGDGRAYD------------GTLSV-IQ -PLIAPLYEA---A--------HSP------LEVLALLA---TGEEQSAY----------- -------------DLVRNTWR--RLLA----------------------GRGA-------- -------------------------------------FEQAWQ-RVL----HDG------- --------------FLPDSGYPTVSLR---------------------------------- -------------------------------------------PNRQALADWPQ------- --------AAEGGLEVVFRLDPTVLDGSFANNA-----------WAQELPD-PITKI---- ------VW-----DNVAILSPKTAAA-LGV-------------KAEYHKGVY-----IADV -IELS---LD----------------GR---A--VELPVWVLPGHPDDSITVYLG-YGREI -TSTRPERKTPFFDLDE-------YTDMYGHGAIATGVGPRTWPRCGGPDNTWVAYGAQ-- ------VRKTG-------RTYKIVTTQDHGSMVGRPLVRLSTVEEFRKNPDFAKEAEPPLE -GLEP-------------------------------------------------------- -- ->ACTB1_Methylobacterium_sp_4_YP_001772545 ------------------------------------------------------------- ------------------------MPPLSGPRTVSRREALR-----------AFAAGITLA -AG-ACAKP---------------DEEIVPY--VVQPER------VTGGVPLVFASTLPLA -GYGRGCRVRSV-DGR----PIKVEG--------NPRHPGSL------------------- ----------------GATDVFAEAAVLSLYDPD-RSKTLR-------------------- -------------------QGGDIG-----TWS-ALQRAL--------VAKVAAWRETRGE -G----------------MR----------------------------------------- --------------------------LLTGRVTSPT---------------LQRQIARLL- -D-----AYPRAA-WHAHE-PTEDASARAGAALAFG---RPLWP-VPHL-DRAAVIVSLDA ---DPLG----PG-PDQIRNGRGFGSRRV----PAAGEGFSR----LYAVEAAPTLTGAKA -D----HRLALPPHRIGEVAVALARALGADL------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------RAPTLPEEAARLAA-------------RAAQDLRAR----RGAALVLA -GPTL--------PPEIHALAHWIN---GVLGAPLDWIEP--------------------- -----PDLIGGRAPGTLSD------------------------------------------ ------------------------------LARDLA--AGG--------------VQDLVM -LGVNPVYD-------------------------------APADLALAE-RLG-----RAP -FRLHLGPAVDETAVL--ATWHVPE-THPLE-AWGDLRAVD------------GTASL-VQ -PLIRPLY-A---T--------RTA------EEVVCALL----GEGDAASY---------- -------------DLVRETWR--PGRE---------------------------------- -----------------------------------AGFEEWWR-RAL----HEG------- --------------VVQDSAAA--------------------------------------- -------------------------------------------PVATGSPRLPD-PGPPAA -AQ---------DLTLVLRPDPGTWDGRMANNA-----------WLQECPA-PLTKQ---- ------VW-----GNALALAPDEAAR-RGL-------------A-------------QGDL -VRVA---AG-G--------------RS---I--E-VPVATVPGHAAGVASLTLG-HGRS- ------------------------RAGAIGN-------GIGA------SAYALRREDAL-- ------------------------------------------------------------- ------------------------------------------------------------- -- ->ACTB1_Nitrosococcus_oceani_YP_343269 ------------MAGSSIKPLDLAPIRAR---------LAEAQ-GRAFWKSLEELAGSEEF -ERFLYQEFPF----FRELSQ----------ASLSRRDFMR-L-------MGASLA---LA ----GLSAC-STPP----------PEEILPY--IRAPEG------LVPGESLFFATAMPLD -GFATGVLVESR-MGR----PTKVEG--------NPLHPASL------------------- ----------------GGTDIFAQASVLQLWDPD-RAQVIS-------------------- -------------------HRGEIS-----TWQ-TFLAAM--------GEKMRTFEGNQGK -G----------------LY----------------------------------------- --------------------------LLTPTVSSPT---------------LISQLRTLG- -K-----RFPHAH-WHQYQ-PINQDNSYEGARLAFG---ESLET-RYHL-ERAEVILSLDG ---DFLG----SL-PGHLRYARDFAKKRR---VDSAQSTMNR----LYVAESSPTITGTMA -D----HGVSLRASQIEVLALQLARALGI-------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------GVPRREETASDLPE---------QWVRAVAEDLRQH----RGTSLVIT -GEKQ--------PPFVHGLVHAVNQALGNVGTTLTYSAPRAFN----------------- -----PRNQNESLNH---------------------------------------------- ------------------------------LVAQMD--AGK--------------VDTLIM -LGGNPAYN-------------------------------APADLAFSK-QLA-----KVK -SSIYLGLYEDETAAH--SHWHIPE-THYLE-RWGDARAYE------------GTVSL-LQ -PLIAPLY-Q---G--------KSD------YELLAVLL----GQTDRSDY---------- -------------DWVRGYWQ--KQWP---------------------------------- ----------------------------------KSDFKSIWN-QAL----QAG------- --------------FIEGTALRS-------------------------------------- -------------------------------------------KSVKLRDDWVA-HLSRGQ -SK----SKETSGMEIIFMPDPTIWDGQFTNNG-----------WLQELPK-PLTKL---- ------TW-----DNAALISPRTAEN-LGL-------------A-------------NEEV -VALR---YQ-E--------------RQ---V--Q-APIWIMPGHPEGAVTVTLG-YGRA- ------------------------KTGQVGA-------GTGF------NAYALRSSRAP-- -------------------------WFGWGLE----------------------------- ------------------------------------------------------------- -- ->ACTB1_Chloroflexus_aggregans_YP_002464666 ---------------MTQHQSDLEAIRAQ---------LRDAR-GPQFWRSLDQLADSPAF -RELVEREFPRGASEMSD--G----------MS--RRTFLK-L-------MGASLA---LA ----GVTAC-TYQP----------RQYIAPF--DRQPEG------RIPGVPQYFASTLTLG -GYGTGVLVRAN-EGR----PTKVEG--------NPRHPASL------------------- ----------------GSTDLFAQAEILTMYDPD-RSTTVLRQ------------------ --------------------------GVPSTWA-EFTTTL--------ANALTAAQATQGA -G----------------VR----------------------------------------- --------------------------LLTTTVTSPS---------------LAAQIEQFL- -Q-----AYPQAR-WYQYE-PVNRDNVVEGARLAFG---RDVTT-RYDL-AAAQVIVSLDA ---DFLA----PG-PGFIAYARAFADGRK---VRKDSTGMNR----LYVIEASPSTTGTAA -D----HRLALRADAIAAFAGALAHELGIGGAPAT-------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------LAAKAE---------EFLKAIAKDLEEH----RGRSVVIA -GDQQ--------PPIVHALAHLINAELGNVGKTVFYHEPVEAR----------------- -----PTNQTNELVT---------------------------------------------- ------------------------------LVSEMA--AGR--------------VELLVM -IGGNPVYN-------------------------------APGDLRFAE-RMA-----TVP -LTVHLSQFVDETSVQ--ATWHIPQ-AHPLE-SWGDARAFD------------GTASI-VQ -PLIEPLY-G---G--------KTA------NELLAAML----GQPDAESY---------- -------------DLVRGYWE--ERIG---------------------------------- --------------------------------------NTNWNVALATGVIADT------- ------------------------------------------------------------- -------------------------------------------SAPVINPTLNE-AAIRAT -A----IPQPGDGVEIVFRPDPSVFDGFYANNG-----------WLQELPR-PLTKL---- ------VW-----DNAALMSPRTAIKLLGLPFSADRLVGNEADDRERQRYLEQLSKVNGTI -ARIE---YR-G--------------GV---V--E-LPIWLLPGHAEDSITLNLG-YGRT- ------------------------NAGRVGN-------GVGI------NVYP--------- ------------------------------------------------------------- ------------------------------------------------------------- -- ->ACTB1_Candidatus_Koribacter_versatilis_Ellin345_YP_592078 -MDNGSKKNGADVCPSKKGKLELADVKQQ---------LAAAKDGPQYWRSLDELSNTDEF -QEMLHREFPRQASEWVDDGG----------SS--RRDFLK-L-------MSASLA---LA ----GLTAC-TKQP----------IEPIVPY--VRQPEE------LTLGKPLFFATANTVG -GYAVPVLAESH-EGR----PTKLEG--------NPQHPATL------------------- ----------------GGTDVFTQASVLTMYDPD-RSQVVMLD------------------ --------------------------NEIRTWG-SFVGAV--------ANPLAAQKAVQGA -G----------------LR----------------------------------------- --------------------------LLTRSTTSPT---------------LGAQIKQLL- -Q-----TYPQAK-LVQYD-PAGRDNARAGSQLAFG---QYVET-QYNL-DKADIILSLDG ---DFLS----SGFPGFHKYARNFSQRRQ----PDLKEKMVR----FYMAESTPTNTGGKA -D----HRIPMRASDVEQFGRAIAAGIGVAGAGGS-------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------AKQEWQ-----------------NQVAAIVSDLNKH----KGAAVVVV -GEHQ--------PPAVHALAHSMNAALGAVGTTVTYTEPIEQI----------------- -----PADQTAGLKE---------------------------------------------- ------------------------------LVADMN--SGK--------------VDLLVV -MGANPVYE-------------------------------APADLAFLD-AFK-----KVA -VRIHHGLYVDETAVL--SHWHING-THFLE-QWGDVRAFD------------GTVTI-QQ -PLIAPLY-N---G--------KSQ------YEFVAALN----GQGSTSGY---------- -------------ELVKGTWQ--KQHT----------------------GAD--------- -------------------------------------FEAWWR-KAV----HDG------- --------------LIAGTAAPAKT------------------------------------ -------------------------------------------VSAKGAPAATN------- -------AASDSAMELIFRRDPMIYDGEYSNNG-----------WLQEAPK-PITQL---- ------TW-----DNPIEMNVTQAEQ-MGI-------------K-------------TEDE -LEIT---VD-G--------------RK---I--V-GGAWLTPGHPKNSVTVFLG-YGRT- ------------------------RAGRVGT-------GTGY------NAYQARTSDKQ-- -------------------------W----------------------------------- ------------------------------------------------------------- -- ->ACTB1_Candidatus_Solibacter_usitatus_YP_821785 -------------MSDPRNQLDLAAVQKR---------LEGAR-GRDYWRSLDDLAATPEF -QDLLEREFPRQAVGWADDED----------ANEGRRNFLK-V-------MGASLA---LA ----GMTAC-TRQP----------TEHIMPY--VRQPEE------LIPGRPLFFATAMTVN -GVANGLLAESH-MGR----PTKMEG--------NPEHPATL------------------- ----------------GACDPYSQASVLQLYDPD-RSQALT-------------------- -------------------FNGEIR-----SWG-RFTGEL--------REALALQKTKNGS -G----------------IR----------------------------------------- --------------------------ILTETVTSPT---------------MAAQLRAIQ- -Q-----VYPSSK-WHQWD-PAGPHMARAGSVQAFG---QPTNT-YYDF-THANVVVSLDS ---DFLA----SG-PGYLRYARQFSARRR---IHEPSDSMNR----LYVAEPMPTPTGTKA -D----HRLQLRAGDIEEFAWGLAISL------------------GIAEGPKN-------- ----------------------------------------------------------GEN -H----------------------------------------------------------- ------------------------------------------------------------- -------------DIYKW--------------------LGPMARDLQSN----KGASLVIA -GAHQ--------PPIVHALAAIMNEKLGNVGKTVFYTDPIEAN----------------- -----PGDQLASLMD---------------------------------------------- ------------------------------LVKDLD--AGA--------------VDVLLI -LGGNPAFN-------------------------------SPVELGMRD-RLK-----KAK -LRIRLGLYADETTEV--CQWQVPE-AHFLE-TWGDARAFD------------GTITI-QQ -PLIQPLY-N---G--------RSA------LQLLQNFT----DQPESSPY---------- -------------DVVKGYWR--TQHQ----------------------GAD--------- -------------------------------------FENWWR-RAV----HDG------- --------------FVANSALPTKT------------------------------------ -------------------------------------------PTVRGEALSAR-AGARHL -GG---------KLEVIFRPDPTIFDGRFANNG-----------WLQEMPK-PVTKL---- ------TW-----DNAAILSPYDANR-FGV-------------Q-------------NGDM -LKLT---YD----------------GR---S--LNAPVFIQPGHVNGATTLHLG-YGRW- ------------------------AGGRAAK-------GMGF------DPYGLRTSKAL-- -------------------------WQDVGMDA---------------------------- ------------------------------------------------------------- -- ->RBG1_1305 ----------------------MNNKENP---------------HKKYWSTLSEFHQDAEF -KKLKKEEFLSKPQSFFESNG-------NNDTTFSRRDILK-L-------AGAAAV---FT ----AAACA--RRP----------VEKIVPY--LDPSEE------VIPGKAVWYSST-SGT -SDGCGMLVKTR-EGR----PIKLEG--------NPDHPLNK------------------- ----------------GTLSAREQAAILDLYDPD-RLKHPA-------------------- -------------------KISAGQ-VLKSDWK-SADTEI--------ARSLKSA------ ---------------KGKMV----------------------------------------- --------------------------LLTGTIHGPA---------------RKRLIREFLF -------SFSNAE-HITFD-ALSEEEILEAQELCYG---NRVLP-RYRF-DKAEALVFLGA ---DPLA----SG-HSKTEFAYGFGHQRK-----INSNQMSK----VISFEPALSLTGQNA -D----LHYLVKPQDLIKVGLALAHQLIVAEKKSK-------------------------- ------------------------------------------------------------- --------------LASDLLVQNLLEN---------------------------------- ------------------------------------------------------------- -------------YSAKKVETEIGLPE---------GTIKSVAADLWLA----RGRGLVYT -GSLT---VRDNSALALHLVTNLLNSALENEGNTVDGVQSVSQQ----------------- -----SQGSYSELMN---------------------------------------------- ------------------------------LISDMK--SGK--------------VEAVLI -YGNNPAYG-------------------------------LPQSAGFEE-ALQ-----KVK -TKIYLGDRADETGSL--CDFVLPS-LHFLE-SWGDAEPQQ------------SLYSL-MQ -PTISPLH-D---N--------RGW------EDSLLALM-REIKGVALGKE---------- ----------------YASWH--DFLK-------------------DTWYKEIYLKNDLVA -S-----------------------------------FEDFWI-SVL----RQG------- --------------LFDTVNR---------------------------------------- -------------------------------------------SAEKSSPRQFRTTALSNI -GK---IKNVDSKFTLALYTPAMQFDGRTNNNS-----------WLLETPD-PVSKI---- ------AW-----DNYVNIAPRTSVE-LGL-------------Q-------------ESDV -VSLT---VN----------------GV---T--QEIPVHIQPGIHPEVFTVAVG-WGRE- ------------------------KVGRVGNNVGVNAFRWSKIQNRHLVSSSLPVEIKKTG -KQIKLANVQG-------HNY----INGRPVIYEATLAEYQKNPTAGRAGEEKLTSIWPSH -PYE--------------------------------------------------------- -- ->ACTB1_Leptospira_interrogans_serovar_NP_713447 --------------------MDQKNFQKE---------------KKAHWLSYDLKDKDEEV -KEMQKSEFFTSPDPLIARIK---------SGEFDRKSFLK-L-------MGAGVA---MT ----SLNCI--RKP----------VEKIVPYVDLNKTDENSQYDFVKHGHSYYYTSVVAG- ----TGVLIKAR-DGR----PLKLEG--------NPDHPVSQ------------------- ----------------GALSAAGQASIFDLYDPD-RAQNPA-------------------- --------------------TIEGGIEVKSDWA-TVDAKV--------KSALAAN------ ---------------KGKTV----------------------------------------- --------------------------VVTKLLDSPS---------------TQSIIGDFL- -R-----TVGGGK-HYEISLTSAEEVVSKGQAASYG---KAIVP-NYHF-DLANVILSIDC ---DFMG----NW-LSGEEHQKDFSKRRNLRPNGSLKQNNLADVNLFIAAESVPTMTGSNA -D----LRLAIRPGDQTKLALAIAAALGELGANTK----------DALNG----------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------ATLSALVSELGVSE---------ENIRKTAKALWSN----KGRSLVVA -GSLA---ATTKDAVDLQILVNLLNSVLENDGKTVDHSNP--------------------- -----KKEGLADSSGNLKS------------------------------------------ ------------------------------LAAELK--QGK--------------VGVLFV -NDVNLVYQ---------------------------------AGEEWKN-LLH-----QAA -LVVSLSDRADETALS--SNVLATT-THFLE-SWGDAEVTK------------GIFSI-QQ -PAIRPLF-N---S--------RSF------EDSLIAFAGGSLGGEASFY----------- -------------EYVKNSWI--KKLG---------------------------------- -------------------------------------SKRNWE-DLL----RTG------- --------------TTVTASERKKVAG---------------------------------- -------------------------------------------PSRNFNRSSIK-KIESSS -TG----------LKLSLFETIAIGDGKAANNA-----------HLQELPD-PVTKL---- ------TW-----DNCILLSPALAKE-KGI-------------S-------------SNDV -LVLK---TA-K--------------QT---I--E-LPAQIQPGMHKDAIAIAVG-YGRT- ------------------------AAGAVGT-------GVGK------NAY---------- ------------------------------------------------------------- ------------------------------------------------------------- -- ->ACTB1_Bdellovibrio_bacteriovorus_NP_96849 ------------------MKKALRPKVER---------------DTKYWNSLEQWSNDPEF -NKIASTEF-QSS-PLRESDD---------EGGWARREFLK-L-------MGASLA---MA ----SAGCI--RRP----------VQKIVPY--NKQPEE------VTLGMANYYTSAYFDG -SDALGVLVKTR-EGR----PIKIEA--------NPGHPFSI------------------- ----------------SGLSIRSQASLLSMYDPE-RLKGPQRNLFNE-------------- -------------------KKSNSQ-VIDVKWE-DLDKKV--------AEQLK-------- ---------------KGDVV----------------------------------------- --------------------------ILSGNVASPA---------------TRAVIGDF-- -------AQGFKAKHVVWE-ALSNDDVREGQKASYG---DDVVP-AFRF-DKAKMIVSIDA ---DFLG----TW-ISPTAFTNQFVEGRK------DIKNMNR----LVSFDSNYSLTGANA -D----IRMKIKPSQQLDVVMGLLHEIIVKKGASS-------------------------- ------------------------------------------------------------- ---------------HAGNSAVKAAL----------------------------------- ------------------------------------------------------------- -------------APFADVAKKLNVEP---------ALFAKVAADLWAN----QGTSLVVA -GGIT---TLTEKSKELQVAVNFLNSILGNDGKTVDHNGGNKG------------------ -----DKASQADMAA---------------------------------------------- ------------------------------LIKDMK--DGK--------------VKTLII -HRVNPGFV-------------------------------LGADMGFAE-AIK-----KVD -LVVYTGDRIDETGVF--ADYITPD-NHALE-SWSDMELAS------------GVYSI-CQ -PSIRPMY-D---T--------RSFQLSLMTWAYLANMGPSRLRDYETFY----------- -------------DYLRVFWK--SDIF-------------------PKYGKGQS------- -------------------------------------FEDFWQTALQKGYVGEI------- --------------NSGSSSRSFKVD----------------------------------- -------------------------------------------AFTSIKPAAAK------- -----------EGFELALYSTSQHGDGSLANVS-----------WLHELPD-PVTKA---- ------VW-----DNYVMVSLATAEK-HGL-------------K-------------QATV -VELT---VG-G--------------KT---L--E-LPVLIQPGLHDDVLAVAVG-FGRT- ------------------------RAGKVGN------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- -- ->ACTB1_Cytophaga_hutchinsonii_YP_678817 -------------------------MKDN---------------NKVFWKGVEELGNSPEF -VKNAQNEFPEFL-PLKNSSE--------ESNGTDRRDFLK-L-------LGFSVA---AV ----SLAAC--EAP----------VKKAIPY--LNKPEE------IEPGIANYYASTFVDG -GEYCSVLVKTR-EGR----PIKIEG--------NKLSSVTK------------------- ----------------GGTNGRVQASVLSLYDTA-RIQGPLIKGA---------------- ----------------------------AATWA-DLDKQV--------GVQLGAI--AATG -G---------------NIR----------------------------------------- --------------------------IVSPTILSPT---------------TKKAIAAFK- -A-----KYPSTE-HVQYD-ANSSYGILKANQTSFG---QAVIP-SYDF-SKAEVIVGFGA ---DFLG----TW-ISPIEFVSQYADTRR---LSKTKKTMSQ----HFQFETALSLTGSNA -D----YRQPIKPSQEGLFIAELYNKIVSSK------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------VSTTPVKN---------DVLDKAAAALLKASN--RGKSLVVS -GSND---------VNVQILVNEINLALGNYGTTISLAT---------------------- -----PSFQKQGND----------------------------------------------- ------------------------EAMNTFINDAVA--GK---------------VNAVIF -YGSNPVFD-------------------------------HARGAELAK-ALS-----SVS -LTVSFADRVDETAAL--TKFVAPD-HHYLE-AWGDAEPRA------------GFYSL-GQ -PSISPIF-K---T--------RAA------QESLLLWS----GNSGDYY----------- -------------EFLKSNWI--SSIL---------------------------------- -------------------------------------GGASWD-QAL----QDG------- --------------VFEPKNK---------------------------------------- -------------------------------------------SGVEVTASSFD-RSAVEA -GIIKNYPANTSGIELKLYEKIGLGTGSQANNP-----------WLQELPD-PISKA---- ------TW-----DNYVAVSASYAKA-NAL-------------E-------------QGDR -VAVK---SA-N--------------YS---V--E-LPVLIQPGQAGNTVSIAIG-YGRT- ------------------------HVGKCGD-------GVGK---NVYPFARFVDGSVL-- ------DFVTG--------------------------VSVTKLGGDKYPIAQTQTHH---- ------------------------------------------------------------- -- ->ACTB1_Flavobacterium_psychrophilum_YP_001295304 --------------------------MSS---------------NKKYWKSVEELNENSSI -VETLRNN--EFV-EEISTNEFLGDAVTLATSSTTRRDFLK-Y-------VGFTTA---AA ----SLAAC--EGP----------VHKSIPY--VVQPEE------IVPGVADYYATTIADG -FDFANVLVKTR-EGR----PIKIEN--------NKIAGANF------------------- -----------------HANARVHASVLSLYDSM-RMKTSKIA------------------ --------------------------GKDTIWE-QANAKI--------KASIADA--KAKG -G---------------KVV----------------------------------------- --------------------------LLTNTSASPS---------------TDKLIAQFL- -------VSNPNAKHVTYD-AVSSSEALDAFQTVYG---ERALA-EYDF-SKANVIVSIGA ---DFLG----DWQGGGFDAGYAQGRIPQ-------NGKMSR----HFQFESNMTLSGAAA -D----KRVPMTVANQKQALVQIYNVITG----------------SSIGSSKD-------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------EAVMKAAQQLKAA----GSKGVLVC -GIDD---------KNAQLLVLAINKVLSSEAFNTANTRQI-------------------- -----RKGNNADVKQ---------------------------------------------- ------------------------------LLADMK--SGA--------------VHTLIM -NGVNPVYS-------------------------------LPNGKEFAN-SLK-----KVK -LSVAFAMKEDETAAV--ANIAVAT-PHYLE-SWGDVSIVK------------GSYAL-TQ -PTIRPLF-D---T--------VQF------QDALLSWT----GNAQTYY----------- -------------DYLRSSWS---------------------------------------- -------------------------------------GAKSWN-QLV----HDG------- --------------VVFTEGISSSAGAG--------------------------------- -------------------------------------------ADYNGAASTLA-KA--SS -KG----------LELVLYTKTGLGDGQQANNP-----------WLQEFPD-PITRA---- ------SW-----DNYLTISQADATT-SGI----ENWNVANGGL-------------NGSY -VTLT---VD-G--------------VK---L--EKVPVIIQPGQAKGTVGLALG-YGRK- ------------------------AAMKEEM-------QVGVNAYTLYNNFSNVQNVSI-- ------AKEDG-------EHE----FA---------CVQLQRTLMGRGDIIK--------- ------------------------------------------------------------- -- ->PsrA_PhsA_Archaeoglobus_fulgidus_NP_071207 ------------------------------------------------------------- --------------------------------MVTRRDFLKAT-------ALTATAISAGI -KF-QPKSY---------------AEATAAS-----------------GEVKFVPNICAMC -PAACSIQVEVR-DGK----VHRIHG--------TPDHPINN------------------- ----------------GKICARGNAGVQRVYNPD-RLKKPLIRTG---------------- -------------------EKGTWS-FREASWE-EALSLI--------ASKVKEY--REMG -H-------------PEYIG----------------------------------------- --------------------------MLGGWLPCTY---------------YKPFFKAFL- -A-----ALGTPNGGGVPE-ALCFLSKALGWKSAYG--FGAHPELLTDY-ENARYVIMLRR -----------NV-AGSISVVHGWRLGQN--------RRKFK----LVVLDPRYSETAAKA -D----VWLPIKPGTDLAFLLAMMNVIINEKLYDS----------NFLAKYSN-------- ---------------------------APMLLKDGKPFKVWDENGKKKYLVFDLAKGAAVE -HDSAMLPALEGEYEVEGEKVIPAFEALKRRVAE--------------------------- ------------------------------------------------------------- -------------YTPEWAEGITDIEA---------KKIREIAREFALR------RGVIDS -GWHG---PKYRNSLLTWRAAAIVNALVGSVNNDGGLLFTGLAQFVT-------------- -----SKESTTEAPSQSVLRMWAEKR----------------------------------- ------------------------GIATAFLGHTVQ--AFYDAIVNEDPYP----IKMLFV -VGHNLLMN-------------------------------MPERQKWEE-ALK-----KLD -FMVAVDILPQDHLYY--ADVVLPE-STYIE-KDDPLFPIAYAPA--------FGFHT-RV -KAIEPIY-D---T--------KHV------IEMMVEIA-SRLGTEDTFFK---------- -------------ALSKGLGV--DAEK----------------------LKSYYHGEGVAG -IRRAQAEAKGVN------------------------YNELLSKGYVLKAGRDK------- --------------IVYNMPYK-----------------------------QPLPTPTGKV -EIFSFMLANF--------------------------------ASKASEPYWDA-LIKWVP -PKVSERKLGSNEFYLAYSRSPFTTHSSTSDNP-----------LLAKLID-DAELYYKG- ------IW----------INSERAAE-LGI-------------R-------------NGDR -VVVE---SVFT--------------GD---K--TEAIAFVNELVRKDTIFTVSG-FGQS- ------------------------------SERLTNIPQRGM------TMMRLIP-LQF-- ------DTLSG------------------TIMSQETIVRITKA------------------ ------------------------------------------------------------- -- ->PhsA_Wolinella_succinogenes_NP_906934 ------------------------------------------------------------- -----------------------------MEIEISRRRFLQGS-------VALTIVGASSG -AL-AVGGS---------------SGNKTES--------------QEKGERSVA-TLCEMC -VNKCAAIARVK-DGK----VIKLDP--------NPLFPKSR------------------- ----------------NMLCARGNAGIKALYDED-RLKYPLIRAG---------------- -------------------ERGDGK-FKRVTWD-EAYTYI--------QEKLVKIMDEEQD -N-------------RSAIG----------------------------------------- --------------------------FCAGEGMGEH------------------HFKEFN- -K-----VFGSSN-WLNHS-SVCLQSTVSGYTLTIG---TYGNP---DL-ANAKYVIMAGA ---NRAE-------AIVTPDTMDLFKRTL--------GRGCQ----LVVIDPRYSHTAHKA -D----LWLPIKAGTDLAFVLALTHVVLSEEIYNK----------KFVEEKFN-------- ----------------------------------------------------------GFE -E------------YKAHILQQN-------------------------------------- ------------------------------------------------------------- -------------YTPEWAEPITGISA---------SDIRKVARDFMAC----APQAIYYP -GRRT---TWAKNDFQLRRAMAIFTALGGGVDVKGGICYGKTL------------------ -----PIDEHSIPAPMYANAKSRIEQNK--------------------------------- ------------------------AAIVGGTGSWVA--WRDMVAAKETPYP----IRGMFI -YKQNPMHC-------------------------------VPNTAKTAQ-MFK-----NMD -LVVTIDTMPSDTAIM--SDVILPE-CTYLE-RTDPVKSFGGIE---------PAIAQ-RN -KVIEPLY-E---T--------KPV------LQILRELT-AKLSRPLFENSLKHDEDLQ-- -------------EMIEEKAS--ELAS-------------------SNPNKGEEELKKLAI -EEVFEDEMEGWDISQGYAHSEEEMNEH---------AVAKYAGAHEMLLKHGV------- --------------FYPGINEQFKQVSANEYVYYPES-------------KKAYSMRNGQF -NTPSKKVECVIPSLAS--------------------------KGIDTMPTWRE------- ---EYLPKTPAGQFRFVTGRHAQFTQSSTANNA-----------LLLDTMSENF------- ------IW----------INKRVAKE-RGI-------------K-------------FGDL -LEIS---SK-A--------------GK---T--R-IKAYPTEKIAPDTVFFVHG-FG--- ------------------------VQSKAMSRAYQNGGHDSM-----------IIEEHI-- ------EPVFG------------------AAAAHETLVEIRKV------------------ ------------------------------------------------------------- -- ->PsrA_Wolinella_succinogenes_NP_906381 ------------------------------------------------------------- ---------------------------------MTRRDFLKS--------AGAAGAAGLVW -SQ-TIPGT---------------LGALEKQ--------------EIKGSAKFVPSICEMC -TSSCTIEARVE-GDK----GVFIRG--------NPKDKSRG------------------- ----------------GKVCARGGSGFNQLYDPQ-RLVKPIMRVG---------------- -------------------ERGEGK-WKEVSWD-EAYTFI--------AKKLDEI--KQKH -G-------------AHTVA----------------------------------------- ---------------------------FTARSGW-----------------NKTWFHHLA- -Q-----AYGSPN-IFGHE-STCPLAYNMAGRDVFG-----GSM-NRDF-AKAKYIINMGH ---NVFE-------GIVISYVRQYMEAIE---------NGAK----VVTLEPRLSVMAQKA -S----EWHAIKPGHDLPFVLGFMHTLIFENLYDK----------KFVQKYCT-------- ----------------------------------------------------------GFE -E------------LKASIEP---------------------------------------- ------------------------------------------------------------- -------------CTPEKMALECDIPA---------DTIKRLAREFAKA----APKAIFDF -GHRV---TFTPQELELRRAMMMVNALVGNIERDGGMYFGKNASFYNQFLGEEDPKA---- -----KGLKKPKTPAYPKVEVPRIDRIGEKDGEFFL------------------------- ------------------------ANKGEGIVSLVP--KATLNELPGVPCK----IHGWFI -VRNNPVMT-------------------------------QTNADTVIK-ALK-----SMD -LVVCVDIQVSDTAWF--ADVVLPD-TTYLE-RDEEFTAGGGKN---------PSFGIGRQ -KVVEPLG-D---A--------KPG------WKIAKELS-EKMGLGEYFP----------- -------------------WK--DIED-------------------YRLQQVDGDLDLLAK -LKKDGSASFGVPLML---------------------QEKKSVAEFVKKFPGAA------- --------------SKVNEEGLIDFPK---------------------------------- -------------------------------------------KIQLFSPKLEEVSGKGGL -GYEPFKYKEEDELYFVQGKTPVRSNSHTGNVP-----------WLNNLME-YDA------ --------------IW--IHPKTASK-LGI-------------K-------------NGDA -IELY---NK-F--------------SS---Q--K-SKALITEGVREDTLFGYFG-FGHV- ------------------------SKDLKRAY------GKGV------NSNALMP-SFT-- ------SPNSG-------MD-----LH--VF-----GVKVKKA------------------ ------------------------------------------------------------- -- ->PsrA_PhsA_Thermosinus_carboxydivorans_ZP_01667237 ------------------------------------------------------------- ------------------------------MKKFSRRTFLKL--------SGAATAA-LAA -AP-TLPRM---------------ASLAANI--------------QLEGSAEFKASYCEMC -TSRCPIQAKVV-DGK----TVLING--------NPEWAATG------------------- ----------------GTVCARGGSGFSQLYDPQ-RLKKPLIRTG---------------- -------------------ERGEGK-WKEVSYE-EAYAYI--------AEKMQDI--KARY -G-------------PEAMA----------------------------------------- ----------------------------FACRKGPH---------------MGYLYTLAK- -------AYGSPN-TFNHE-STCPMAKTVALEATFG---TAAL--GIDY-ANVKYLVTFGR ---NFFE-------GIHVAQTRGVMTAVS---------KGAK----LVSFDPRFSLTSAKA -H----EWFAIRPGTDLAVVLAINHVLIRDGLYDR----------DFIDKYTE-------- ----------------------------------------------------------GFE -A------------VKASLTA---------------------------------------- ------------------------------------------------------------- -------------CTPAWAEQESGVRA---------ADIERIARELAAA----RPRAVVEF -GWRT---TSTPEEFELRRAIIITNLLLGNLEVPGGTFFVKSANFINSLVGKPVI------ -----QPIAGPKLPPFPQPGRPRIDGAGSKGQPYSL------------------------- ------------------------VPPIDGVVQTIP--EAALT---GKPYP----IRGWFI -YRYNPVLT-------------------------------IPDTNRVIE-GLK-----KMD -LVVVCDINMSDTAWY--ADVVLPE-STYLE-RDEGFNDYSGAV---------PVYTL-RQ -KVVEPLY-D---T--------RPH------WQIFKELA-EKLGLGAYFP----------- -------------------WK--DVEE-------------------LRLIQMGGKADLVRM -GKEKGFVNFGLKPLFL--------------------RDRASVAEFVAKFPEAK------- --------------ELVNTQGIIDKP------------------------LLNLKTKSKKI -ELLSTEAEE---------------------------------LFGRGVPVYRP-VKLAEA -GE----------AYFVQGKVAVHTNGHTHNVP-----------WLYNLMS---ENR---- ------LW----------LNPATAAK-LGL-------------K-------------DGDK -AILK---TR-T--------------GQ---Q--Q-VKVLVTEGVRPDTVFGYFG-FGRL- ------------------------SPGLGRAY------KKGI------NSNLALP------ ------------------LVT----ADVCGSTIQTTGVTISKV------------------ ------------------------------------------------------------- -- ->PsrA_PhsA_Moorella_thermoacetica_ATCC_YP_429324 ------------------------------------------------------------- ----------------------------MLEQKITRRTFLK---------GSLAAGALATF -GG-KLIPI---------------EPAKAAA--------------AGQAETRVVPTLCEMC -GVKCGVLAHVR-DGR----VWRLTG--------NPRDPQSG------------------- ----------------GRLCARGNAGTKTLYDPD-RLKGPMKRV----------------- ---------------------GEGQ-FQPISWE-QAFQEI--------GSKLKEL--KEQY -G-------------PQSL------------------------------------------ --------------------------VWLAHPEL-----------------ISPLEKHFM- -A-----AFGSPN-YTGHG-PTCYSSRNVAFEQMYG-----GVP-GVDY-RNVRYYIAFGR ---NLTG-------GIKNPDVQKIVAAKA---------EGAH----LVAVDPRLSDFAYFA -D----EWLPIRPGTDLAMVLAMINVLINENLYDA----------AFVAAYTT-------- ----------------------------------------------------------GFE -E------------LKKGVSG---------------------------------------- ------------------------------------------------------------- -------------YTPAWAAGITGIEA---------GTISRIARELAAA----KPAAAVDP -GWHAVTGSQYGNSVQAGRAIAALNALLGNLGARGGLSLPPTIKLGS-------------- -----PAGIMGPKPPAATAPRWDGAGSE--------------------------------- ------------------------KWPLNKDHGMIQ--TFPERVKQDQPYP----VKAVII -QHLNPVRS-------------------------------STDSLAFIE-ALK-----KLD -LVVAIDIQMNDTAYY--AHYILPE-ATYLE-RYDPLMTVG------------NKVLL-RQ -PAIKPLF-D---N--------KGA------EEIIAGIG-RAAGLSEYFNF---------- -----------------------TLEQ---------------------------------- -------------------------------------YNDALLGPLGLTQAQLA------- --------------LTGVAEVEASKPD-----------------------YSKLKTPSGKI -ELACPAFVK---------------------------------AGSTLTPAWEP-PLVEPR -DD---------SFRLIQGHVPMHTHTTTDNNS-----------YLHAIMP---ENE---- ------LW----------IHTSRAGK-LGI-------------K-------------TGDL -VEVA---SK-V--------------GK---V--R-VKARVTEAIHPEAVFLAHG-FGCR- ------------------------VPLRHLAY------NRGA------NGGDLIP-IMT-- ------APVSG------------------AAAQCETLVTVRKAG----------------- ------------------------------------------------------------- -- ->PsrA_Carboxydothermus_hydrogenoformans_YP_361367 ------------------------------------------------------------- -------------------------------MKLTRRSFLK---------ASAATGALAAL -SG-GVMSF-----------------ERWAA------------KAAETGEVKLIPSICEMC -GTKCGIIVKVK-NGR----VVKIEG--------NKEHPNGK------------------- ----------------GKICARGNAGMKLLYDPD-RLKQPLKK------------------ ----------------------EGDRFVPISWE-QAFREI--------GEKLKEI--KAKY -G-------------PEAL------------------------------------------ --------------------------VWSTHPE------------------LAYDYEVIFN -Q-----AFGSPN-LSAHA-PTCYSPRNVAYKTMYG-----EVP-TVDY-GNVKYYISCGR ---NLVE-------GINVSQVTGIMKAKE---------KGAK----LIALDPRYSNFAALA -S----EWVPIRPGTDLAFLLAMIHLIIKNEWYDK----------EFVKNYTI-------- ----------------------------------------------------------GFE -E------------VAAEVEK---------------------------------------- ------------------------------------------------------------- -------------YTPKWAEEITGIPA---------ATIERITEEFAKA----KPAAVVDP -GWHT---SRYMNSTEMVRAGAVINALMGNLGMKGGLKFPKYKFTKVEEREGLW------- -----PKLEKPKAKRFDGAG-------------------------GEKWP----------- ------------------------LAKGLGMIQMLP--EHILS---GQPYP----IKAYIV -NHHNPVRS-------------------------------AGNSQKWIE-ALK-----KLE -LLVVIDVQMSETAMM--AHYVLPE-STYLE-RFDPPQIAG------------NAVAL-RQ -PAVKPLH-N---T--------MGV------DDIIKELA-HEAGIGQYFNF---------- -----------------------TLEQ-------------------FSDQMLKP------- -------------------------------------FNVTFK-QLV----EKG------- --------------VIALDDGKTEYK------------------------VPEIKTESGKI -ELASSAFEK---------------------------------AGAKKVPTWVP-PGVTEG -NG---------KLRFLHGHTAVHTHTSTFNNE-----------YLHALMP---ENV---- ------LW----------INTRTAEK-LGI-------------K-------------NGDL -VEVK---SD-Y--------------GK---V--T-IKAKVTEAIHPDAVFMVHG-FGGF- ------------------------SPYQKKAY------KKGA------STSFIIP-CHV-- ------EPVSG------------------ASADCEVLVEVRKVGGGANA------------ ------------------------------------------------------------- -- ->PsrA_PhsA_Thermus_thermophilus_YP_004130 ------------------------------------------------------------- ---------------------------------MQRREFLK-L-------SALGVGAMALR -GS-GPAKA---------------LKAPWYA-----------------QEVKSVYQICEGC -FWRCGIVAHAV-GNR----VYKVEG--------YEANPKSR------------------- ----------------GRLCPRGQGAPQTTYDPD-RLKRPLIRVEGS-------------- -------------------QRGEGK-YRVATWE-EALDHI--------AKKMLEI--REKY -G-------------PEAIA----------------------------------------- ---------------------------FFGHGTGDY------------------WFVDFLP -A-----AWGSPN-AAKPSVSLCTAPREVASQWVFG-RPIGGHE-PIDW-ENARYIVLIGH ---HIGE-------DTHNTQLQDFALALK---------NGAK----VVVVDPRFSTAAAKA -H----RWLPIKPGTDTALLLAWIHVLIYEDLYDK----------EYVAKYTV-------- ----------------------------------------------------------GFE -E------------LKAHVKD---------------------------------------- ------------------------------------------------------------- -------------FTPEWAEKHTEIPA---------QVIREVAREMAAH----KPRAVLPP -TRHN---VWYGDDTYRVMALLYVNVLLGNYGRPGGFYIAQSPYL---------------- -----EKYPLPPLPLEPAAGGCSGPSGGDHEPEGFKPRAD--------------------- ------------------------KGKFFARSTAIQ--ELIEPMITGEPYP----IKGLFA -YGINLFHS-------------------------------IPNVPRTKE-ALK-----NLD -LYVAIDVLPQEHVMW--ADVILPE-ATYLE-RYDDFVLVAHKT---------PFIQL-RT -PAHEPLF-D---T--------KPG------WWIARELG-LRLGLEQYFP----------- -------------------WK--TIEE-------------------YLETRLQSLGLDLET -MKGMGTLVQRGKP-----------------------WLEDWE--------KEG------- --------------------------------------------------RLPFGTASGKI -ELYCQRFKE---------------------------------AGHQPLPVFTP-PEEPPE -GF----------YRLLYGRSPVHTFARTQNNW-----------VLMEMDP---ENE---- ------VW----------IHKEEAKR-LGL-------------K-------------EGDY -VMLV---NQ-D--------------GV---KEGP-VRVKPTARIRKDCVYIVHG-FGHK- ------------------------APLMRLAH------GRGA------SDNYLQTRYKL-- ------DPISG------------------GAGLRVNFVRLEKAERPRLPSLTGLAKRPFDE -RRM--------------------------------------------------------- -- ->PsrA_PhsA_Geobacter_lovleyi_ZP_01593406 ------------------------------------------------------------- ------------------------------MPIMSRRSFLK-T-------SGICTAGAIAA ----TYLPD---------------QFLLWAG-------------EKGLAKTEKITTYCEMC -FWKCGAIATVV-GGR----VVKLEG--------NPLSATAK------------------- ----------------GKLCGRGNGGIGLLYDPD-RLKHPLIRTG---------------- -------------------KRGEGQ-FRKASWD-EALTHI--------ADKLKKI--KEEH -G-------------PESLA----------------------------------------- --------------------------LFTHGSPTEH---------------FMPLLQ---- -------GFGSNN-FAMPSFAQCRGPRVVGYELTYG--DDIGSPERLDM-ANSKVVVLIGS ---HLGE-------NMHNSQVQEFTDAIG---------NGAK----IIVVDPRFSVAAGKA -H----HWLPIKPASDMALILAWINIIIREGWYDR----------EYVAKYTH-------- ----------------------------------------------------------GFD -K------------LAAAVQQ---------------------------------------- ------------------------------------------------------------- -------------YTPEWAEKETDIPA---------AQIMATAREMGLH----RPAVCIHP -GRHV---TWDGKDVQRSRAIAILGAILGTWGREGGAYLATRGSF---------------- -----PAVPPPSFPASNRPTLKKG------------------------------------- ------------------------GFPLGGAEGVTN--AIREATSIGEPYP----VKAWMV -TGTNLLAA-------------------------------MPGQKETIE-AIS-----KLD -LLVVVDVIPSDTSLY--ADVVLPE-CTYLE-RHDGLIIGKGRA---------LSASI-RQ -PAVAPMY-D---S--------KPA------WWIAKELS-KKLGLEDYFP----------- -------------------WE--NFED-------------------RLNELCLT------- -------------------------------------YNIDYD-ELK----QKG------- --------------VISFPDTAKPFITADN--------------------QPVFKTKSGKI -ELYSKELEE---------------------------------LGFEPIPAYEK-NEEPPQ -GF----------YRLLYGRSAVHTFSRTVNNP-----------ALNELYK---ENE---- ------LW----------LSSVQARK-MGL-------------T-------------DGQY -VALQ---NQ-E--------------GI---TSNR-VRLKVTERIREDCVYMVHG-FGQQ- ------------------------SKGLTKAF------RRGA------DDQQLISSYPV-- ------DPICG------------------GTGMRCTFVKLVKGA----------------- ------------------------------------------------------------- -- ->PsrA_PhsA_Acidiphilium_cryptum_YP_001233491 ------------------------------------------------------------- ---------------------------------MQRRDFIR---------MSSAVASAALL -GP-TLAGC--------------SRPAEWQR-------------MMTEAPATETPTVCNIC -FWACAAKVHTR-GER----LWKITG--------NPEDAHCE------------------- ----------------GRLCTRGTGGVGAYYDPN-RLVRPLVRMG---------------- -------------------KGADQR-FEVASWD-NALGLV--------AERMEKI--AREH -G-------------PDRLA----------------------------------------- --------------------------ALVHGPGAAH---------------FSHLVR---- -------AFGSDS-IAEPAFAQCRGPRDTGFFLTFG--QGFGSPEQTDM-AKARCIVLIGT ---HIGE-------NLHNSQVRTFTDGIR---------NDAT----IIVVDPRFSVAAGKA -N----HWLPIRPGTDIALLLAWMNVILAERRYDA----------GYVARNTV-------- ----------------------------------------------------------GLE -A------------LCAHVAP---------------------------------------- ------------------------------------------------------------- -------------FTPEWAYGETGIEP---------ALIRETARLMAAA----APATVVHP -GRHS---TWWGDDTQRARAMAILAGLLGIWGREGGYYLPESVAL---------------- -----PAYPVPAYPVPKTSWREIA------------------------------------- ------------------------LPVFPLAGAPVT--NVILDNAHGADAH----YKGLIV -YDTNLPMT-------------------------------MPGIRRTLEAAAQ-----SLE -LIVAVDVQPAEVTGY--ADVVLPE-CSYLE-RHDPLRNSGERY---------PALAL-RA -PALPPRG-E---S--------KPG------WWIAREIG-TRLGLGRYFP----------- -------------------WT--DYTE---------------------------------- --------------------------------------VIDWQLRQVGSSLKEL------- -----------------ETTGIRAFPRRTPAYFAPGE-------------TPRFATPSGKI -ELFSATLQQ---------------------------------AGFDPLPRYTR-PEAPPA -DH----------FHLNYGRAPQHSFSRTQNNP-----------VLYQLMP---ENL---- ------VW----------IHPTAARR-FGI-------------R-------------NGTY -VRLV---NQ-D--------------GV---VSNK-VRVRVTERTRPDSVWLVHG-FGHT- ------------------------APGLSLAR------GRGA------DDSALMTRVLY-- ------DPIMG------------------GTGMRGNFVTFRKENA---------------- ------------------------------------------------------------- -- ->B_Caldithrix_abyssi_ZP_09550397 ------------------------------------------------------------- -----------------------------MKTKMKRREFIK---------IAGAGAGSLVV -GS-KLYAS---------------FNSKDEQ------------NLLADGKIERTPTYCEMC -FWKCAGWVYKK-DGK----PWKIIG--------NPDDPNSR------------------- ----------------GRFCPRGTGGIGAYTDPD-RLKKPLLRVE---------------- -------------------KNGKQV-FKEVSWD-EALDFI--------AGRMKDI--AQKH -G-------------PECIA----------------------------------------- --------------------------LFSHGSGGSY---------------FKTLLH---- -------AFGSNN-VAAPSYAQCRGPREEAYMLTFG--EAVGSPERTDI-INAKCLVLLGS ---HIGE-------NMHNGQVQEFSEAVA---------HGAT----VITVDPRFSTAASKS -K----YWLPIKPGTDLALLLAWIHVIIYEELYDK----------EYVKKYTF-------- ----------------------------------------------------------GFE -Q------------LKEALKD---------------------------------------- ------------------------------------------------------------- -------------KTPEWAYPITTIKP---------HVIRQTAREMAKN----APATIVHP -GRHV---TWYGDDTQRVRAGAILNALLGSWGRRGGFYFPSKAHL---------------- -----PKMPIPKFPNVKRDWRKAF------------------------------------- ------------------------PNKYPVAHLALS--SGICDATIPSPERECS-FKGWIV -YGTNLPMT-------------------------------LPQPEKTLE-AIQ-----HLE -LLVAIDILPAEITGW--ADVVLPE-CTYLE-RYDNLRLSPGRV---------PSIAL-RA -PAFEPKY-E---S--------KPA------YWMARELA-KRLGLEDYFP----------- -------------AKTIEEYL--DYQL---------------------------------- -----------------------------------KAIGSSLE-EMK----KIG------- --------------VKLLPEEAQKLYLEDGE-------------------DFEFPTPTGKI -ELYSTILDE---------------------------------YGFDPIPQYTA-HEEPPE -GY----------YRLLYGRAPMHTFGRTTNNP-----------NLHDLME---ENT---- ------VW----------INSKVAKQ-WGI-------------K-------------NGEY -ITLE---NQ-D--------------GV---RSTP-VKAKVTERIRHDAVFMVHG-FGHS- ------------------------------DKRLRRAYGKGA------DDQRLITRVKI-- ------DPLMG------------------GTGMRVNFVTFRKEEA---------------- ------------------------------------------------------------- -- ->QrcB_Desulfomicrobium_baculatum_YP_003159879 ------------------------------------------------------------- -------------------------------MGLDRRSFIS-L-----VAGGVAGS---LF ----TPVIW-KTLD----------DVSIWTQ---NWPWI----PRLQYGEELTVPALCKLG -ADAYGLKVKTI-AGR----PVAAEG--------NPDHPLSL------------------- ----------------GGICPLGAASVHLLYSPS-RVKNPKLR------------------ --------------------DGS-S-FKDITWE-EAEELL--------AGKIKEA------ ---------------GASMA----------------------------------------- --------------------------MISGDETGS----------------VTDVLSGLV- -G-----KAGSDKSFFMPG----ESAPAAAALAMLG---GDGQV-GYDI-ENANYVLMLGA ---DALG----SW-GNVARNGKAFSASRE---------KGVK----FVYVGPAQNGTSAVA -D----SWIPCAAGTEPVLALGIAAVIAGTNR-DR----------SFWPGFAS-------- ------------------------------------------------------------- --------------FAKFVQTS--------------------------------------- ------------------------------------------------------------- -------------YPLDKVAEITGVSA---------ATITGLAQELVRA-----GRPLVLT -AAEA----GQGLGAFELAAGMSLNMLLQRVNTVGGVRILPWA------------------ -----PKVVEAA------------------------------------------------- ------------------------ADKKAMLANDLV--AYLSTVADGGAEA----PALLMV -YGANPAYA-------------------------------LPNLVKAQA-AID-----KAG -FVVSFSSFMDETAAM--ADLIMPD-SYAFE-RLDDAYSPYGSGQ--------PNYTV-AA -PVIKPVF-D---T--------RPA------GDVLLSVA-AKAELDLGFE----------- -----------------------TFED-----------------------VVKAKAEA--- -------------------------------------LGADFD-EMV----EGA------- --------------VWVSEEFPAQD------------------------------------ ------------------------------------------------LALWTT-PLQELA -VA----AQDGKTLALAPVLRLKIGSSKIAIPP-----------FNTNAIR-FDEML---- ------GN-----DMYVLINAATAKN-LGL-------------K-------------KDDA -VKLA---SS-G--------------GE---C--K-ARVRIFEGVMNDTVVAPLG-LGHT- ------------------------AWDAFSS-------GKGD------NVYKLLA-ADT-- ------ETETG-------LSR----FA--TV-----RVTVSKA------------------ ------------------------------------------------------------- -- ->QrcB_Desulfovibrio_magneticus_YP_002953179 ------------------------------------------------------------- -------------------------------MGLDRRAFLG-L-----VAGGTVGA---MF ----TPIPW-KLID----------DASIWTQ---NWPWI----PRVPKGQVDYVATTSKLC -PAGEGLKIMRV-AGN----PILAGG--------NPSHPLSC------------------- ----------------GGVSALARSEVYMLYSPA-RIKSPMKR------------------ --------------------NGK-T-FAPITWE-QALVEM--------AEKLGAA------ ---------------KGAVA----------------------------------------- --------------------------SISGDNTGT----------------INEVLTALT- -A-----KLGSAGSFMMPS----EATTAAKAMKLMG---AQGQA-GYDF-ENADTVLVLGA ---DIFE----TW-GTSSRNRKAFGANRP---------AGAKPANTYVYVGPSRNNTAAVC -D----QWVPAAAADLGVVALGIAWHLLKAGATSN-------------------------- --------------------------------------------------------APGFD -T------------FKAVVNGG--------------------------------------- ------------------------------------------------------------- -------------FGPEDVKRATGVAP---------ETLAAIAKALASA-----KAPLVVT -GSPF----GQGLGAAPVIAGMSLNMLLGRINKPGGVYMLPEL------------------ -----PSVVPGALTRAAM------------------------------------------- ------------------------------LDGDLP--AFLKGVESGKTPA----PKALLI -YDANPAYG-------------------------------LPEAATMAK-ALE-----KIP -FKVSFSSFMDETAAL--CDLVLPN-SLPLE-RYDDVATPYGSGF--------CVYSL-VR -PIQKPIC-D---T--------KTT------GDVLLGLA-RKLSIDLKFD----------- -----------------------NFQQ-------------------VIKEKVASLAKVSGG -FVAKDVMPWQVAAGKPAPALV---------------GGDLWK-ALE----AGY------- --------------AWTMVGQAAQ------------------------------------- -------------------------------------------TAMGFAAEVVAKAVKAGK -PA--------TATVLAPYAQLRTGTPVTGMPC-----------QDLTTVP-DTELL---- ------GD-----TTFIRVNSETAKT-LGL-------------K-------------KGQM -VKLS---GA-G--------------VD---C--Q-AKVHIFESVMPGMVSAPLG-FGHT- ------------------------AFDYYSQ-------GKGA------NYLSLAA-VVE-- ------EPGSG-------LSM----WI--AP-----EVKIA-------------------- ------------------------------------------------------------- -- ->QrcB_Desulfovibrio_vulgaris_YP_967712 ------------------------------------------------------------- -------------------------------MALDRRGFLK-F-----IGGATAGI---LA ----TPVVW-KGLD----------DVSIWSQ---NWSWI----PRNIKGANSYVPTVSKLC -PTGVGVRVRLV-DGR----PVRVIG--------NPEHPLSK------------------- ----------------GGVSSIAAAEVQMLYSPA-RMKRPLKRSP---------------- ----------------------DGA-YVMISWE-EAEAML-----------LDGLKAAKGG -D---------------ALA----------------------------------------- --------------------------CISGDDNGT----------------INELLSAFV- -Q-----QSGSKS-FFLMP---GEAQPAAKAWDLMG---GEGQI-GYDI-EKSDFVLAIGA ---NVLE----AW-GTAIRNRHAFGASHP-----HGAEPTAQ----FVYAGPVLNNTATGA -D----DWLPIRPGTESAFALGLAHLLIKAGASSS-----APDFDAFRSLAAS-------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------FSPEKVAAQTGVDA---------KALTALAQALAKA-----KHPLVIV -GSEF----SQGAGAAPVMAGIALNMLLGSVNRDGGLRALPVA------------------ -----RKVVPAGMDRKAM------------------------------------------- ------------------------------LQQDLT--LWASAIASGKAKA----PKAMLV -YEANPVYA-------------------------------LPQGSAFKD-TLA-----KVP -FKVAFTSFLDETAMQ--CDLVIPV-SMGLE-RLDDVCTPYGCGE--------VVYSL-AT -PVTAPLF-D---T--------KPA------GDALIALG-GKLGLDLGVA----------- -----------------------SFED-------------------MLKAKAAA------- -------------------------------------HGADFD-KLA----EGT------- --------------AFTSRATVG-------------------------------------- -------------------------------------------ANLSFRPDVLSKALDVKA -PA--------LPLALAPVMKLNMGTSKTAIPP-----------FNTKTIR---------- ------RWEVQGKEGYVMLNGATARK-LGL-------------A-------------QHDR -VVLS---NP-T--------------GK---V--T-VRVNIFEGVMNDTVAMPLG-FGHT- ------------------------AFDEFSK-------GKGE------NVMHLLA-PST-- ------EPVTG-------LAV----WTGAGV-------NIAKA------------------ ------------------------------------------------------------- -- ->ArrA_Chrysiogenes_arsenatis_gb_AAU11839 ------------------------------------------------------------- -------------------------------MRIKRREFLK---------ASAAVGAVAVA -SP-TLNAF---------------AQTGTGA------------SAMGEAEGKWIPSTCQGC -TTWCPVEFLFR-MAV----RSKYAA--------TQLSKANN------------------- ----------------GYCCVRGHLMLQQLYDPD-RIKTPMKRTNPVKG------------ -------------------RKEDPK-ICPYHMGMKQWDTI--------ADKIMEL--RKNN -E-------------THKYL----------------------------------------- --------------------------LMRGRYSDH----------------NSIFYGDLT- -K-----MIGSPN-NISHS-AICAEVEKMGSMATEG---FWGYR-DYDL-DNMKYLIAWAC ---DPLS----SN-RQIPNAIRKIQGVMD----------RGK----VVAVDPRMNNTASKA -Q----EWLPIKPSEDGALALAMAHVIITKGLWSK----------EFVGDFKD-------- ----------------------------------------------------------GKN -K------------FVAGKTVKEEDF----------------------------------- -------EEKLTNGIVKWWNLEV--KD---------------------------------- -------------RTPKWAAKVTGIDE---------ATIIRVATEFAQA----APACAIWY -GPNM-----QPRGSYAVMCIHALNGLVGASDSEGGLCTGMGS------------------ -----PSSSYPKIDAYQDDVAKAGA----------KNKKIDQRGTLKFPAMGSA------- ------------------------KPGTGVVTNNVA--DALLA---ADPYD----IKVAIG -YFCNFNFS-------------------------------GTDGARWDK-ALA-----KVP -FFVHCVPMFSEMTYF--ADIVLPAALHHTE-DWAVIRSKANLH---------GHTSI-QQ -PVVERMF-D---V--------KGVE-----TEITWLLA-EKLKAKGFENMY--------- -------------NWLYNEYK--DPET----------------------GKNPTNSLEFAL -YATKIRSKKCWDPKENAEYKGD--------------KLNGWA-DFM----EKG------- --------------IVNSPKFKFRQKW-----------------------EKGFPTETKKF -EFYSETLKKGLLAHAEKNKVTVDQVMEATNYEAR--------GELAFIPHYES-PKRHGD -VK-------EFPFSLIDMKSRLNREGRSTNAT-----------WYHAFKKCDPGDV---- ------NQ-----EDVLQINPADAKK-LGI-------------N-------------EGDM -VKVT---SV-I--------------GS---L--T-VKARLWEGVRPGCVAKCYG-QGHF- ------------------------AMGRVSAKDFGKAVARGA------NFNDIMP-ADY-- ------DRITG-------ATA----RNGGFT-----GVKIEKA------------------ ------------------------------------------------------------- -- ->ArrA_Wolinella_succinogenes_NP_906980 ------------------------------------------------------------- -------------------------------MEINRRDFLKAT-------ALTAGAVGIAQ -IP-EIEANTQVSG----------EVGKWVA------------------------STCQGC -TSWCSIQGYVV-DGR----LVKVRG--------NPNAKGNH------------------- ----------------GKICPRPHLAIQQVYDPD-RVKTPLKRTNPKKG------------ -------------------KGIDPQ-FVPISWD-EAIDTI--------ADKIMAL--IKSG -E-------------SHKFA----------------------------------------- --------------------------LFRGRYTHMN---------------EI-LYNTFP- -K-----LIGSPN-NISHS-SICAEAEKFGRYYTEA---LWDYA-DFDL-DNTRYVLGWGA ---DPLA----SN-RQVPHFINIWGKVRD----------QAR----IAIIDPRLSATAAKA -D----HWLPIIPGEDSALAVAMAHVILAGGAWNK----------GYVGDFVD-------- ----------------------------------------------------------GHN -Y------------FKPGELVPESIEVEGKIIPVEF------------------------- -------KEKHTYGVVKWWNLEL--FD---------------------------------- -------------KTPEWAEPITGIPA---------KQIRQVALEFAAA----GSRAISWV -SPGA---CMQIRGSYASMAAHALNGLVGSCDSVGGILQGTSV------------------ -----PSGKTPDIKPYLSEEIASALKQKKIDQRGTPKFPALNK------------------ ------------------------KTGGGVVTANVA--NAILD---EKPYD----LKMAIG -YWNNFVFS-------------------------------INGTHLWEK-AME-----KLP -FYAHITTHMAEMTMY--ADIVLPAKMHMFE-RYGFSKNKQNLH---------GYLSI-HQ -PMVKPLG-E---A--------KTDE-----TEIVFMIA-QALAKKGHDAPL--------- -------------RYYQENFK--DPET----------------------GKIPSTPEEFDL -FSVKYFTQPIWDGSSNDKGD----------------SINSWK-ELL----EKG------- --------------VWSTKRYSIGKK------------------------IDNFKTETKKF -EFYSETLKKVLEEHVEKNKLSSIDEAIEASNNTAR-------GERVFVPHYEP-SVRYGD -PK-------IYPLIFAEHRSRLNREGRSQNAP-----------WYYEHKDVDPGDE---- ------IE-----KDVAKINPETAKQ-FGI-------------K-------------TGDR -IRIV---GT-Q--------------AS---I--E-TEVKLWEGIRPGIVVKCYG-QGHW- ------------------------AYGSVASEKFGSK-PRGT------NNNDIHI-HEY-- ------DRLSG-------STA----RHGGTA-----RVKIEKI------------------ ------------------------------------------------------------- -- ->ArrA_Sulfurospirillum_barnesii_gb_AAU11840 ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -TSWCPIQGLVV-DGK----VVKVRG--------NPNSPSM-------------------- ----------------GRICPRPHLAIQQVYDPD-RVKTPLKRTNPKKG------------ -------------------KGIDPK-FVPISWD-EAINTI--------AEQILGL--IKAG -E-------------SHKFV----------------------------------------- --------------------------LMRGRYTH-----------------MNEILYNTFP -K-----LIGSPN-NISHA-SICAKTEKFGRYYTEG---FWDYA---DF-DLTIPVIFWDG -ERDM---------VSSNRQIPWFMNQQG------YVKDRAK----ITIIDPRLSATAAKA -D----RWAPIIPGTDSALAVAIAHVILSEGRWNK----------SFVGDFQD-------- ----------------------------------------------------------GKN -Y------------FIPGSTVPTEVIVDEKSLPVVF------------------------- -------EENHTYGVVAWWNLELKE------------------------------------ -------------RTPEWAEKITGISA---------KDIRTIAREFSDA----GSKAISWV -TTGA---SMQIRGAYASLAAHALNGLVGSVDAVGGTLQGSXA------------------ -----PSGKTPDIKPYLPAEFEAALKQKKIDQRGTLKLGAFNK------------------ ------------------------KTGGGVVTQQVA--DSILT---DKPYD----VKVAIG -YWNNFVFS-------------------------------INGANVWEK-AME-----KLP -FYAHITTHLAEMSMX--ADIVLPAKMHMFE-RYGFSKNKQNLQ---------GYLTI-HQ -PLVKSFA-D---A--------KTDE-----TEIPFLIA-QALAKKGFDGPL--------- -------------RYFQDNFK--DPES----------------------GKAPTNPRRVDL -YAVKQFTXPIWSGESNEKGD----------------TINSWN-ELL----DKG------- --------------VWKTKKYKIGKK------------------------VDNFATETKKF -EFYSETLKKVLIEHAEKNKVTVDEALEALNYTCR--------GELGFVPHYEE-AVRHGD -EK-------TYPFIFAEHRSRLNREGRSQNAP-----------WYYEIKDVDPGDV---- ------AG-----KDVTKINPLDGKK-LGL-------------K-------------DGDK -IKIT---SV-Q--------------GS---I--E-SEVKLWEGTRPGT------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -- ->ArrA_Bacillus_selenitireducens_gb_AAQ19491 ------------------------------------------------------------- ------------------------------------------------------------- ------------------------EQGEWIA------------------------SVCQGC -TAWCAVQVYRI-DGR----ATKVRG--------NPNAKANH------------------- ----------------GHSCVRSHIGLQQVYDPD-RVKQPMKRTNPNKG------------ -------------------RDEDPE-FVPISWE-EAMDTI--------ADKIIEL--RENN -E-------------THKFS----------------------------------------- --------------------------VWRGRYTSN----------------NGILYGNMP- -K-----IIGSPN-NISHS-SICAESEKFGRYYTER---YWGYA-DYDH-ENALYEIFWGG ---DPIA----TN-RXVPHTASIWGELSD----------RAT----LACVDPRFSTTAANQ -M----NGCRLIPGEDGAIASAIAHVILTEGVWYK----------PFVGDFKD-------- ----------------------------------------------------------GQN -R------------FVEGRDVNEDDF----------------------------------- -------EEIQTHGLVKWWNLEL--KD---------------------------------- -------------KTPEWAAERSGIDA---------DQIYRVARGFANA----APKAISFS -SPGS---SMTIRGGYTAMTQAALNGLVGSADNLGGVISNGISV----------------- -----PNNGFPDPSDYIDEIAANGL----------EQDRIDWGGRLEFPALKDS------- ------------------------KSGGVKVTNTVA--DAVLA---EDPYE----FKSRIE -LLDELQFL-------------------------------QPRNGSLGQ-SFG-----QDS -IHGAYDCQSGEQTHF--ADIVLPVPHSQFE-RQSPVAGSNGNLH--------RHLHL-QN -KVIESPF-D---I--------RVDE-----TEIPWMIG-ESLEKKGYSNLI--------- -------------DYFRNEFR--DPET----------------------GEAPTNAAEFDE -IATKHYTHPVWDPTFEKDGD----------------QIDGWE-EYK----RLG------- --------------TWNTNKYEFRQKW-----------------------DGNWGTETGQF -EFYSETLKVALQDHADKHNASIDDVMEATFNTAK--------GELAFVPHYEP-AMRVGD -ES-------EYPLIFMEHRSKLNREARSANTS-----------WYQEFKDIDLGDE---- ------AW-----DDVAKLNPKDAAE-LGI-------------Q-------------NGDM -VRLV---TP-E--------------GQ---I--E-VKAKLWEGTRPGVVAKCYG-QGHW- ------------------------AYGHIASLDRRRQIARGG------NNNIILA-PVH-- ------EALSG-------SGA----RHGGQT-----RVRVEKV------------------ ------------------------------------------------------------- -- ->ArrA_Halarsenatibacter_silvermanii_gb_ACF74513 ------------------------------------------------------------- -------------------------MSRNKTSGISRREFLK-V-------MGSTGAALGLG ----LSATS-GNKV----------LAEEDPY---EVLPE------GEHKSGEWVPTGCAGC -TSWCSLEANVV-DGR----VIKIRG--------NSRSKVNG------------------- ----------------ESSCPRSHLSLQQVYDPD-RIKRPMKRTNPEKG------------ -------------------RDVDPE-FVPISWE-EAFEEI--------ADKIIEL--RENG -E-------------SHKFV----------------------------------------- --------------------------LWRGRYTR-----------------LRDILYGILP -E-----FVGSPN-KISHS-SICAEAEKFGPYYTEG---YWAYR-DYDL-QNSDYILIWGT ---DPIQ----SN-RQVSLYSREWGNILE----------GAR----IATVDPRFSRTAAKS -N----EWLPVKPGEDGALALAMAHVILTEGLWHK----------EFVGDFVD-------- ----------------------------------------------------------GEN -K------------FTAGEEVDEDEF----------------------------------- -------EENYTHGVVKWWNEELKD------------------------------------ -------------RTPEWAADKTGIPA---------EQIVRVAAEFGEA----APHACVFM -GGGG---VMQTRGGYNSMAIHGLNGLVGSIDNEGGAV-RGASV----------------- -----PNQSFPDHSEFLDDISREGL----------DHEMIDRRGRLEFPAFKDG------- ------------------------ESGGGVVTNLSA--DGIIE---EDPYE----IKMGIG -YWNNFNFA-------------------------------APETERWDE-AMS-----KLD -FYVHLVTHQSEMTQY--ADIVIPSTHHMFE-QWGMLYQKGNLH---------THFWL-SR -PMINRHWEL---I--------EPE------AEFSWLLA-EKLAEKGYSNM---------- ----------------LDYFK--TIVD-------------------PETGEEPEDYREFAK -YATKHYMQPVWDPEMESHGD----------------QFDGWE-DFK----EAG------- --------------VWNSDEFEFQQYW------------------------GEFTNSTGDF -EFYSETLKEALEEHAEKHDVSIEEVLEACKYEAE--------GELAFLPHYEE-PYTVGD -DE-------EYPLLLVDSKSALNREGRSANAN-----------WYYDLKDIDPGDS---- ------TE-----ADVIKIHPRDAEE-LGL-------------E-------------DGDE -VVVS---SP-A--------------GE---I--T-CQLNVWEAVKPGTASKTFG-MGHW- ------------------------AYGRVAAEDFADGEPRGG------NNNEIIP-AEY-- ------ERLSG-------STS----FY-SHI-----KVNIERA------------------ ------------------------------------------------------------- -- ->QrcB_Syntrophobacter_fumaroxidans_YP_844744 ------------------------------------------------------------- -------------------------------MKVGRRAVLQFM-------AGAVGGTLL-- ----SPLPWKLTD-----------DAAIWSQ---NWFWR----PSPARGEITRKPTVCALC -EGGCGVQARLV-DGK---RAILLEG--------NPNHPVNQ------------------- ----------------GGICALGAAGLQFLYAPY-RIAQPLKQTK---------------- -------------------RRGDPTGFQPIAWN-EAVGEL--------AKKLGQM--RADG -K-------------PNGLA----------------------------------------- --------------------------GITRRRCSS----------------MDALLNQFF- -A-----AYGSPN-LFKMP-AHADSLKLAGAVTT-----GREAPFGCNI-EDAPYILSFGA ---GLVE----GW-GSPGRMQAAFRRWRQ------GGKSAAK----IVQVDSRCSTTAAMA -D----RWIAVPPGTEAALALGIAHLMVKDKLYDA----------EFMADRVF-------- ----------------------------------------------------------GFE -D------------WTDSQGKNHKGFKFLVQTDA--------------------------- ------------------------------------------------------------- -------------YTPEAISKLTGVDP---------AKIRELAKEFGTQ-----KGAVAVW -GQPQ---GSVPKDMYNELSFLALNALKGNI-KAGGAIGLA-------------------- -----PEVPLGALPELPGDPSALKGLKQLRLDLASSQK----------------------- ------------------------GPPPVLPGNNLH--GFLDAVSNGGKYP----IEVMLV -HEANPAYG-------------------------------LCENKLFQQ-ALT-----KIG -TLVSLSSYMDETAQQ--ADLILPI-HTAFE-GFDDVIGIPGAPY--------AYYGV-CA -PVLKPHL-N---T--------KAA------GDIVMSVA-KQLGGSIAAAL---------- ------------------PWA--SHEE-------------------YLKKRAEGLAASARG -ALADKKGVELWKLQPEEAVKPNYKD-----------GADLWK-KLA----GGA------- --------------CWYDAPVDP---------------------------LKDLKTESGKF -ELAAQLLLAKGQTGD---------------------------DDQVYLPHFSQVPPRGSD -KD--------YPLLLVTYQMSALADRDLANPP-----------FMTKTVF-DFILR---- ------QN-----DQFVEINPATASE-LGM-------------A-------------EGDS -AVLK---TP-Q--------------GE---V--P-VRVHLYAGARPKVVYLAQG-LGHK- ------------------------AYDEYIK-------DKGV------NANGVVE-VQL-- ------DRVTG-------LGT----VW--AA-----RAHLRRA------------------ ------------------------------------------------------------- -- ->QrcB_delta_proteobacterium_NaphS2_ZP_07200609 ------------------------------------------------------------- -----------------------------MTMKITRRNFIA-A-----VVGGVVGI---QV ----TPLPW-KFTD----------DAAIWTQ---NWPWV----PVPAEGAVTEENTVCNLC -PGGCGISVRKV-AER----AVKIEG--------RTDYPVNP------------------- ----------------GGICPVGMGGLQLLYDDDMRFPGPMKRAG---------------- -------------------ARGQGQ-FVNITWG-EAYDIL--------AGRIAKL--RKDG -T-------------PEALA----------------------------------------- --------------------------AIDGNYAGTT---------------TGLLVERFM- -R-----SVGSPN-YVKPN-AITDTYH-MGNLLMMG---KSVPM-AYDL-ENSDFILSFGC ---GLLE----GW-GAPGRVMNAWGMWHD----ANPKNRKTR----VVQVESRASNTASKA -D----FWVAPRPGTDGALALGIAHVLIKKGRVDE----------RFINGFTY-------- ----------------------------------------------------------GFD -D------------LTSSEGQSQPG------------------------------------ -------------------FKTIVSNK---------------------------------- -------------YSPVQVERITGVDA---------GTIVALANAFSKA-----KAPVAVY -GKGK---NNLNGSLYEFMAVQSLNAVKGRINRPGGVLVPDPL------------------ -----PLAPLPEFDPDEVAAKGLETPRIDGAG----------------------------- ------------------------TKAYPFTDSLIN--HFADAINQGARSP----VDTLLV -FSANPFFT-------------------------------VPDGPGFMN-ALE-----KIP -FIVSFSPYRDETANM--ADLILPD-HTYLE-KIEDIVWPVGLQY--------PLYGL-TK -PVVEPVN-D---T--------QHA------GDVIISLS-KAVGEATGSAF---------- ------------------PWE--NFEE-------------------ALQARAKGLFDAGGG -LVHYDASKPPWKFKPFGNGQKPSYKS----------FDDMWG-EMK----SGG------- --------------MWFQPVKLAGMDG-------------------------LFATSSGKF -EFVSQKLRQTINETAAQTSQKAALDQMGIRVA----------GAEAFMGHYAA-PKLG-- ------VDRSKYPLFMVPYEMINLSSGWIATPP-----------FLYKTIF-ASQLL---- ------KE-----ESFAAVNPETAAK-YKL-------------Q-------------QGDR -AIVK---SP-V--------------GE---L--R-VRIDLFEGAMPEMVYMPLG-FGHT- ------------------------AYDEYQK-------DKGV------NPNNIVK-ALN-- ------DPVSG-------YPL----WW--NT-----PVTLTKA------------------ ------------------------------------------------------------- -- ->QrcB_Desulfatibacillum_alkenivorans_YP_002430439 ------------------------------------------------------------- -------------------------------MKLNRRNFLL-VSTAG-AAGGAVGS---MF ----SPLSW-KLMD----------DSSIWTQ---NWPWT----PVPADGEVSFEETTCTLC -PGGCRVKVRKV-DER----PIKLEG--------VEGGPVND------------------- ----------------GGICILGLTALQLLFGPA-RVHTPMKRAG---------------- -------------------KRGEGK-WVEITWE-EAISEV--------SGKLAEI--RETG -R-------------AQDLG----------------------------------------- --------------------------CIAGGGKGV----------------INALFSRFM- -E-----AYGSPNFYWQATAWDCYEENI---LRTLG---LNGTA-GFDL-ENADYILSFGA ---GLLD----GW-GSPVHVFQAHSKWRE------NHDGHAT----LVQIDAQLSNTAAKA -D----KWLPIVPGTEGAVAMAMAHVIISKNLYNR----------GYVNWNTT-------- ----------------------------------------------------------GFR -D-----------FYRTVESEYAPAKVVKIACPVDN------------------------- -------------------------KE---------------------------------- -------------YQKKWL-----------------EELESRAIAFAKA-----DKPLAVA -GKGN---GDRPVSQAELNAVQALNALVGAINRKEGGMVVLPDE----------------- -----PKYPWKPVVMDAEARSYKPSLVSVRGRS---------------------------- ------------------------KYGHSNLVSVLP--QALNSSHEG--------LKVLLL -AGSNPLYT-------------------------------LADTEKTAE-ALQ-----KVE -YIVSFSSQFNDTTAY--ADIILPD-HIFLE-STVDAPTPPGFAK--------PVYGL-AE -PVIKPVY-K---T--------KAM------GDSIIEIA-KAMGGTIAQSF---------- ------------------PWA--DSAE-------------------AIEQA---------- -------------------------------------LGGKWP-LLK----RGG------- --------------VYVNEDFTPETEG---------------------------------- -------------------------------------------VRFRFFARSGMESRISIQ -GK-----AEQYPLIATPVDCIRLATGALADTP-----------FMVKTVS-DKKLK---- ------HK-----ELVVQVNAMTAQQ-YGF-------------K-------------EGSE -AVLE---TP-V--------------AK---A--K-VRVHCSEEIAPGLVGVPRG-LGHI- ------------------------AHDEFVG-------GKGT------NYNTLIS-PVQ-- ------DPATG-------FDV----AW--GI-----RAKLT-------------------- ------------------------------------------------------------- -- ->QrcB_Desulfococcus_oleovorans_YP_001530428 ------------------------------------------------------------- -------------------------------MKIDRRSFLT---------LLAGGAVGTAL ----SPMTI-KLTD----------DISIWSQNFRGTPIE---VPVPERGPASYVDSVCTLC -PGGCGISVRKI-GDR----AVKIEG--------KAGHPVNN------------------- ----------------DGVCALGLSGLQLLYGPW-RVTGPK-------------------- -------------------KKENGR-WKKISWD-RALSEI--------AEKLNEL--REAG -K-------------ADAIA----------------------------------------- --------------------------GISRTGRGT----------------VARLMQRLL- -A-----AAGSP--HFLPV-PTNENAYSDAVARMFG---KPGTV-GFDF-ENSGYVLSFAA ---GLLD----GW-GSPVHMFSAHSQWKT---------NGVK----MVQVESRLSSTAAKA -D----QWVAVKPGTEADLALGLAHVILRDNLNAG----------AAANSRAF-------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------DSFAALVKKD---------------------------------- -------------YTPARVAAATGIKE---------SVIVALAKEFAAA-----SHPVAVC -GRGD---GQTPCDSREVMAVTALNALVGSVNRQGGMIIGPEPDY---------------- -----IQWARPVLDDTAQKGL---------------------------------------- ------------------------AKGPKTLADLLA--GKTPD------------VQALFV -LEANPAYT-------------------------------LHDTTKVKA-ALE-----AVP -LVVSLSSFMDETSAL--ADYILPL-PTCLE-RTEDVVVTAGLKT--------PMIGL-TQ -PVVEPRL-D---T--------RHP------GDVILDLA-KAMGGTVAESF---------- ------------------AWS--DYQD-------------------CLEKT---------- -------------------------------------FGLVYG-KLA----TEG------- --------------YLQKSVLETLIDT---------------------------------- -------------------------------------------AVAVGRADFAP-VVEADK -K----VRQNTPALVLAAYDAMRVAGGAIATPP-----------YAMKIVP-DTILK---- ------KN-----DLYVEINPETAQK-AGL-------------A-------------DGKA -AVVE---TP-A--------------GT---A--Q-VRVRVTHEVAPGMVAMPRG-FGHT- ------------------------AYDDYVS-------GKGV------NVNDLIG-PVP-- ------DPVSG-------LDT----AW--GA-----PAKLIKA------------------ ------------------------------------------------------------- -- ->Gemmatimonas_aurantiaca_YP_002761548 ------------------------------------------------------------- ----------MIAPSATTDHRPSTTMTTEAGTGVKRREFLK-I-------LGATGATTAVV -GC-SSEK----------------VGKLIPY--VTSPDN------TVPGVSQYYATSCREC -AAACGVLAEVR-DGR----PIKLEG--------NPEHPLNR------------------- ----------------GAICATGLAGIQGVYNPD-RYRSPMVR------------------ ----------------------EGNALKPTTWD-KAYELL--------AQKLGEV--KSKG -Q-------------AGNVV----------------------------------------- --------------------------FVNQHETGT----------------FPGFLDQWL- -S-----AQGMPA-HLSVD-STAPIATIAANQKAYG----AAWP-ALNF-SAAKLVISFGA ---DFLD----GW-GHSVPQQLDWADARS------KLDVAPR----LVYIGARRSLTGLNA -D----QWIAAKAGSEMAICAALTGT----------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------GSAAAAAEAANVPV---------ATIEALVKAVADA----GNGIMALC -GVTG------NDAVECGVMVAEINKKGGAVGTTINTAK---------------------- -----AHGSYTGLASYAD------------------------------------------- ---------------------------LAAAVKNMD--AGT--------------VPLAFV -RGANPAHT-------------------------------MPKSAGFAA-AFA-----KVA -FKVSFSSMPDETAQL--ADLVLPD-NHWLE-SWGDAVGEN------------GQISL-QQ -PTLDPVF-D---T--------RAT------ADVLIDLA-KKDQTLAARY----------- -----------------------NVAN---------------------------------- -------------------------------------FRSWYISQF-----PGG------- -----------------ASAFATALTK---------------------------------- -------------------------------------------ASVSGAPLVAT-STRTLA -TTALPVAEGAGEFFVQVYPSSTLGDGAGANKP-----------WLQELPD-PVTKI---- ------AW-----QSWIEVHPSTAKK-LGI-------------K-------------EGSH -LTIE---TA-A--------------GK---V--T-APAYIYMGVRTDTVAIALG-QGHT- ------------------------AYGRFAQ-------NIGV------NAYDLVS-HGW-- ------DSA-G-------SLA----IG--SV-----KGKVTVSADSSPLVTTE-------- --GSARQHGRGIAQAMTLAA----------------------------------------- -- ->ArxA_Ectothiorhodospira_sp_PHS_1_ZP_09695308 ------------------------------------------------------------- --------------------------MKLLETLINRRRFLKAT-------GAVAGAGVVAG -GA-GVVP----------------GLTTLSHARSPAPSA----------DTTITKNICHQC -PARCGIDVYTT-GGR----VHAIYG--------TSDHPISN------------------- ----------------GKLCPKGPLGAYILYDPD-RFKGPMKRTNPNKG------------ -------------------RDQDPG-FVPISWN-EALDMV--------ADRLNGL--RERE -E-------------SHRFA----------------------------------------- --------------------------LLYGRGWGAS---------------CAGLLGNFG- -K-----LYGSPNVAIGHS-SMCSDGSIISKKAVDG---IGGYN-SYDY-KNANMLLMFGA ---GFLE----AF-RPYNNNMQVWGYIRG------VKVPKTR----ITAVDVHMNTTLAGS -D----RALLIKPGTDGALALAIAHVILVDGLWEK----------AFVGDFSD-------- ----------------------------------------------------------GVN -R------------FIPGETVDPDSF----------------------------------- -------EEKWVKGLVEWWNAEL--KD---------------------------------- -------------RSPRWAAQVTTLYE---------RDILATAREFGTT----RP-AIALY -ERGA---HAHSNGIFNGMAIHTLNALVGSLYAKGGLAYQVGPSYGPL------------- -----PVNADDYLDDWARTGGWK------------AQPRIDLKGH---------------- ------------------------PDGYLLANNMMQ--EIGPNSLQGKPYK----LDTIMF -YLNNAIWT-------------------------------APDVKAWEE-ALK-----EL- -FVIETSPFPSETAMF--ADVILPD-HTYLE-RLQDAPTYPFQGW--------PMTQL-RV -PAVKPLY-D---T--------KYF------GDVLIELG-KRIQGSMGEYY---------- --------------QALDNTE--NVIR-------------------HLAKGFESDPGDNGV -N-----------------------------------SFESWK--------EKG------- --------------VWYKRVYPYRQIDGEFYEWDGQDHTRL--MSADEVRGALFKTASGKF -EIRSGWLEAHADWIAAKTGRD---------------------PSRLMFPIWEE-PSHPGG -GD----------LYMVTPKVALHAEGRGANLP-----------VAIANMQ-PTLGG---- ------RN-----TIYIEINPKTARA-RGI-------------P-------------DGSR -VRIS---SD-L--------------GA---I--E-GYCKYYEGVRPDTLVFPME-HGHW- ------------------------AHGRWAK-------GRKP------GHSGEITVNQS-- ------DRITG-------QCS----YY--TT-----KVRIERA------------------ ------------------------------------------------------------- -- ->Halorhodospira_halophila_YP_001001949 ------------------------------------------------------------- --------------------------MSVLDHLVSRRRFLQ-A-------TGVGGGAVAAG -GV-GHLLS---------------FSAGGSHARADGPVG--------GGETQITKNVCHQC -PARCGIDVYTT-DGR----VHAIYG--------DPGNPIAN------------------- ----------------GRLCPKGHLGSYILYDPD-RFKGPMKRTNPNKG------------ -------------------RDEDPQ-FEAISWD-EALGIV--------AERLNRL--REQE -E-------------SHRFA----------------------------------------- --------------------------LMYGRGWGAS---------------CAGLLGPFA- -K-----LYGTPN-VIGHS-SMCSDGSMVAKGLTDG---NESYN-AYDY-RNTNYILNFGA ---GFLE----AF-RPYNYLMQVWGHMRT-------KSPKTR----VTAVDVHMNPTLAAA -D----RAVTIKPATDGAMALAIAHEMLVNGYWDR----------DFVGDFTD-------- ----------------------------------------------------------GAN -R------------FEAGTEIDPDDF----------------------------------- -------EEVWTQGLIRWWNDEL--KD---------------------------------- -------------RTPEWAESITTVPA---------ETIRRVAYEFGTT----RP-AMAIM -ERGP---TSHSNGTYNGMAIHALNALAGTLFTEGGLFYQMDVPYGDG------------- -----PADPDDYLDDYAGRMQERFDEGEIPRIDKLG------------------------- ------------------------TDRWPLARNMMQ--EVGPNHAAGEPYK----LDTILF -YLNNPIWT-------------------------------APDATAWEE-ALK-----DV- -FIIDTSPFPGETARY--ADLILPD-HTYLE-RLQDAPTYPFEGY--------PMTAL-RT -PAVEPLY-D---T--------KVF------GDILIEIG-KRLDGPAGEY----------- -------------------WQ--------------------------AVGDTENLLRHLAE -GFRDHPGDNGVE------------------------DFESWK--------AKG------- --------------VWYKKPYHWKQERGVFYEWVEDDGDYTHEMSAEEVADKLMPTPSGRF -EFFSEKLQEHADFVASEFGID---------------------HERAGLIQWVD-PDHPGG -GD----------LYFSTPKTALHAEGRGANIP-----------HAIAHVQ-PVMGG---- ------RT-----TVYLEIHPRTARE-RGI-------------R-------------SGDR -VRIV---SD-V--------------GE---I--E-AYARLFEGTRPDTVCLPME-HGHW- ------------------------AQGRWAE-------GRKP------GHSGEVTVNQS-- ------DRISG-------LAS----YY--TT-----KVRVERA------------------ ------------------------------------------------------------- -- ->Alkalilimnicola_ehrlichii_ABI55571 ------------------------------------------------------------- -------------------------MKMILDTLLNRRRFLKAT-------GATGAAAATTA -GVGKLAGF---------------TAASTTSTHVNARPG---------GETRVTKNICHQC -PARCGINVYTT-NGR----VHAIYG--------DPGNPIAN------------------- ----------------GKLCPKGHLGTQLLYDPD-RFKGPMKRTNPNKG------------ -------------------RDEDPE-FVPISWD-EAFDIV--------AERLNRL--RERG -E-------------SHRFA----------------------------------------- --------------------------HFYGRGWGSS---------------DAGLYGDFG- -K-----LYGTPNSAIGHA-SMCAEGSKRAKRATDG---NDSYN-SYDY-RNTNYILNFGA ---GFLE----AF-RPYNYLMQVWGHMRT-------KSPKTR----VTTIDVRMNPTMAAS -D----RALMIKPGTDGALALAIAHVILTEGLWDK----------EFVGDFED-------- ----------------------------------------------------------GRN -H------------FRTGETIIPDAF----------------------------------- -------QANWTHGLAEWWNGEL--KD---------------------------------- -------------RTPEWAEEITTIPA---------KHIYTVAREFATT----RP-AMAIM -ERGP---TAHFNGTYNGMAVHALNALVGSMFAEGGLFYQMGPSYGPL------------- -----PVSADDYMDDYAREMQGKHPRIDMAG------------------------------ ------------------------TEKWPMAGTMMQ--ECAKHHLAGDPYK----LDTAMF -FVTNPIWT-------------------------------APDPRLWEE-ALK-----DV- -FIIDTSPYPGETAMY--ADIIMPE-HTYLE-RLQDSPTYPFEGW--------PMAAL-RT -PAVDPVY-D---T--------KHF------GDMIIEIG-KRINSPMADYY---------- -----------------RELG--DVEN-------------------MLRHRAAGFANDPGD -N---GVN-----------------------------DFESWK--------EKG------- --------------VWYKKPYHWRYWRGTFYEWDGEGYNI--EMSEDEVKDKLMPTASGKF -EFKSSFLENNANYIARE--MGIA-------------------EDRVGLIQWVE-PRHTGD -GD----------LHFVTPKTPLHAEGRSANIP-----------QAQAYMQ-PIVGG---- ------RG-----TCYLEIHPKTAQE-RGI-------------N-------------DGDT -VRLS---AQ-VR-------------GETKSI--L-AVARYMPGHRPDTLVLPME-YGHW- ------------------------AQGRWAT-------AQGRDM-KPGHSGDLTE-NLS-- ------DPISG-------LAC----YY--TA-----KVRLEKA------------------ ------------------------------------------------------------- -- ->RBG1_855 ------------------------------------------------------------- -------------------------------MQVTRRDFLT------------------FA -GF-TLAGI---------------TLGEWGRSKILAREEYKDTLYSGIGKEEFRLSICGQC -PAGCGIVVRLM-DGN----PKKIDG--------NPLCPLSR------------------- ----------------GKLCPKGQNGLQVLYDPD-RLTGPVKRKG---------------- -------------------KRGEND-WEKISWE-EAINTV--------SQKLKEL--KEKQ -N-------------SYRLL----------------------------------------- --------------------------ILTQENKGL----------------SGKLWKQFA- -R-----AYGTPN-LVEGN-LLRDPGILWASYLMQG---IKDYP-AYDI-ENTKYILCFSP ----FLE----GW-YSPTWAQRMYGNFRR-----KRPEIRGK----LVQIEPRLSPTAANA -D----EWIQINTGTEAALVLGLAYLIIKEGRYDE----------NFIREHTF-------- ----------------------------------------------------------GFE -D------------WTDAQKRTHLG------------------------------------ -------------------FKNFVLQE---------------------------------- -------------YDTEKVSSLTGVPI---------VTIIRLAREFSEL----NPALAIAE -QRPA------SGGFYLQMAILALNALVSSLDVKGGVIIQREV------------------ -----PFKEFPEVSGSKKESILNQE------------------------------------ ------------------------RFSSQEVFPHLT--KAILE---EKPYP----IEIVLI -DKINPFSH-------------------------------CFPIINFKE-ALE-----KIP -FIVSFSPFLDETSLY--ADLILPD-HTFLE-KWQDVVPSATLGS--------PVLGI-SR -PAVDPFL-D---T--------KNT------ADVILEIA-HDRDILAYSTL---------- ------------------PWK--NYGE----------LLKDSLQGIYLSRRGMTYGTSFQG -AWMSQMEKGGWWSPTYTN------------------FEEFWN-QLL----EKG------- --------------GWWDPFYEHQKWD------------------------RVFKTPSGKF -EFYSQIFKNQLASIKPSKEN----------------------SDFKILPHWES-VVWEGD -EN-------SFPLYLNVFELLMFSAVLNSNQP-----------YLYEHIT-PHLSV---- ------QW-----ESWVEIHPEKAKA-LGI-------------E-------------ENDE -VWVE---SV-L--------------GK---I--K-TKAKLYFGTHPEVVSLPLG-LSGL- ------------------------SQSSWIK-------KEIS------NPNQLVT-GNS-- ------GNL---------ENK----YL---------RVKIYKA------------------ ------------------------------------------------------------- -- ->II_OP1_uncultured_candidate_division_UNIPROT_TREMBL_H5SSA4 ------------------------------------------------------------- ----------------------------MHLRRLSRRTFLK---------AAVATSAATA- ------------------------VLSHWPRSGRGIQEG------ATPAQERWVKSVCLQC -PAACGIMVRVV-KDSLGERAVKIEG--------NPNHPSNQ------------------- ----------------GGICPKGHIGLQILYDPD-RLQGPLRRVG---------------- -------------------PRGEGK-WEPISWE-EALQIV--------TERLKKL--RERG -E-------------PHKLV----------------------------------------- --------------------------IMSGRNRGQ----------------MGALIDRFL- -A-----AFGSPN-HVGHS-SICSDGAKLAHYLTQG---FKHYA-AYDW-DNCNYLLSFGA ---GFIE----AW-RPTVRLLRAFGHMRR------GRPIRAK----IVQIETRFSVTAAKA -D----EWLPINPGTDGALALAIAHVIVREGLYNK----------KFVEEHTF-------- ----------------------------------------------------------GFE -D------------WEDEQGHFHQGFKTLIRQ----------------------------- ------------------------------------------------------------- -------------YTPAWAAPITGVPE---------ETIVRIAREFATT-----PPQIAAG -QRGA---MMQTNGIYNYMAIHALNALVGSIDAPGGVL-VQIDP----------------- -----PLTPWPPLAQDEIAQTGV------------KQPRIDHAGTEEFPLA---------- ------------------------AN----VYAALP--DFIIN---EDPYA----IDTLML -YYTNPVFS-------------------------------SPDAPKYSQ-AFE-----KIP -FIVSFSPFLDDSSLF--ADLILPD-HTYLE-RWHDDVIYPSLGY--------PVYAV-RQ -PVIAPLY-N---T--------RNT------GDLLIELA-HRLGGTVKESF---------- ------------------PWK--DFLE-------------------LIQFRARGIYESGRG -NIQANS------------------------------FEEFWQ-QLL----EVG------- --------------FWTDPPYPFGQWE------------------------RVFKTPSKKF -EFFSQKLAHTLEDLAKKKAEHEGIPEEEALDKILTRLKITARGDAAFMPHYEE-PRFVGD -PK-------EYPLYLNTYKLMAHAEGRGANSP-----------WLQEILG-THVGR---- ------RW-----ETWVEINPTTAQK-LGI-------------T-------------EGDW -VWVE---SP-L--------------GK---I--K-VRAKLHPGAKPDVVNIPFE-RGHR- ------------------------SYGRWAV-------GFGA------NPNEVLA-REY-- ------DYLGG-------DAA----FF--ST-----RVKVYKAQEGE-------------- ------------------------------------------------------------- -- ->ACTB1_Geobacter_sp_M18_YP_004200644 ------------------------------------------------------------- ---------------------------------MKRRTFLQ-I-------SGMTAA---SA ----LISGC-QSA-----------NEKLIPY---LIPPD----EGITPGKAVYYASSCRSC -PAGCGILVRVS-EGR----AKKIEG--------NPEHPVNR------------------- ----------------GKLCARGQALLQELYHPD-RVPQPLKRSG---------------- -------------------PRGSGQ-FTRISWE-EGLNLL--------TGQLKGL--ERAG -A-------------AERLA----------------------------------------- --------------------------LMTPQLRGT----------------LATLAATFM- -S-----SFGSPH-HLSYE-LLAPDALRAANRASFG---QPSLP-WYDI-AQTRYLLSFGA ---EFVD----HH-LSPVHYGNAFGRMRQ-----ERDTVRGH----FTYVGGRLSLTAASA -D----RWMPARPGSEGALALGIARLILSESLHDR----------GALSANGL-------- ------------------------------------------------------------- ----------SATDLLAGLAS---------------------------------------- ------------------------------------------------------------- -------------YDLARVAELTGLSR---------EAIAEVAREFATT-----RPSLAMA -GEGV---AFLSNGPETLRAIGLLNLVTGNLNSPGGVYPDGSF------------------ -----PDGPENSFADLVS------------------------------------------- ------------------------------LVGAMA--GG---------------RIALAL -IQGDPLHR-------------------------------VPAATGFPE-ALA-----KVP -YIVSFSQIMDDTALQ--ADLILPD-HAQLE-SWGDVIPVAGGRF--------PLTGL-MQ -PVVTPVF-D---T--------RQF------PDVLLAAA-AALGGKTARAL---------- ------------------PFP--SYQE-------------------LVKKSVLQRAARVKG -EE----------------------------------AEEIWTSLLQ----KGG------- --------------DFREGPEQPKGYRW--------------------------------- -------------------------------------------APGASLPAPQA-PLFAGD -ER-------SFPLHLQLYPSTAFLDGRGAPLP-----------WLQQLPD-PMSTV---- ------VW-----DSWVEMNPKTAAG-LGI-------------A-------------HGDL -VEVS---SP-Q--------------GS---L--R-LPAVVYPGIRPDLVAIPIG-QGMR- ------------------------GGGRYAR-------GRGV------NPLSLLA-AKL-- ------KGTGP-------TPC----WS--AT-----RVKLVRISGDGGLVTNGNPQGSYRS -DLVGI------------------------------------------------------- -- ->ACTB1_Geobacter_metallireducens_GS_15_YP_384764 ------------------------------------------------------------- ---------------------------------MKRRTFLQ---------LGTVIAAGAVL -D--GCRSK---------------NEQLIPY--LIPPDE-----GITPGKGTYYASSCNAC -PAGCGILVRVS-EGR----AKKIEG--------NPEHPINR------------------- ----------------GKLCARGQAVVQELYHPD-RVPHPLKRNG---------------- -------------------PRGSGA-FTRISWQ-EGIGLL--------TDRLKAL--QREQ -S-------------TNGLA----------------------------------------- --------------------------LLTPHLRGT----------------LAELTGRFM- -R-----TFGSTN-HVSYE-LLTPDLLRIAARRSFG---QPTLP-YYDI-AETRYLLSFGA ---DFVD----SH-LSPVKYGSAFGEMRQ-----GRDTVRGH----FTYVGGRMSLTAASA -D----RWMPAKPGSEGTLALGIARLILAESLYDS----------GALAMNGL-------- ------------------------------------------------------------- ----------EAKKLLAALDR---------------------------------------- ------------------------------------------------------------- -------------YDLPRVAQLSGLPQ---------GAIAEVAREFAST-----RPALALA -GEMV---AFQSNGPESVRAVHLLNLLVGSLNRPGGIYPDAGS------------------ -----PSGPENSFAELIA------------------------------------------- ------------------------------LIETMR--GGH--------------VKVAMI -HG-DPLYS-------------------------------VPPATGFHD-ALA-----KVP -FIVSFSSLLDDTALH--ADLVLPD-HAALE-SWGDVIPVAGTRE--------PLVGL-MQ -PVVEPLF-D---T--------RQF------PEVLLATA-HELGGRMAA------------ -------------ALPDESYL--ELLK-------------------GAVRKQAGFGAGVD- -------------------------------------FEAAWVDLLQ----HGG------- --------------LFKTKSVQPTGYR---------------------------------- -------------------------------------------WSSDAPPPLPEDPDFAGD -QK-------TYPFHLIAYPATAFYDGRGAPYP-----------WLQQLPD-PMTTV---- ------VW-----GSWVEINPETAAE-HGI-------------G-------------FGDL -VEVS---SP-Q--------------GT---L--R-LPAVVYPGIRPDMVAIPLG-QGHR- ------------------------GMGRYAQ-------GQGV------NPLALVARQGT-- ------KQ----------QPA----WN--AT-----RVRITRISGNGELVTAGHPQGSLRS -ELVEI------------------------------------------------------- -- ->ACTB1_Geobacter_uraniireducens_Rf4_YP_001231524 ------------------------------------------------------------- ---------------------------------MKRRTFLQ-L-------SGMTAA---GT ----VLSGC-QSG-----------NEKLIPY---LVPPD----EGVTPGKADYYASSCRFC -PAGCGILVRVS-EGR----AKKIEG--------NPAHPVNR------------------- ----------------GKLCAMGQAVLQELYHPD-RVPQPLKRSG---------------- -------------------PRGSGA-FTRISWE-ESLELL--------AGQLRAL--QREK -A-------------TDRLA----------------------------------------- --------------------------LVTPQLNGT----------------LVELTTRFM- -R-----VFGSPH-HLSFD-LLGPDWLRTATRRSFG---QPGLP-WYDV-AETRYLLSFGA ---DFVE----HH-LSPVQYGYAFGRMRQ-----GRDTVRGH----FTYVGGRMSLTGASA -D----RWMPARPGSEGALALGMARLILAESLSDA----------GSLAVNGL-------- ------------------------------------------------------------- ----------QTEKLLRRLEA---------------------------------------- ------------------------------------------------------------- -------------YDLPRVAEQTGLPQ---------RIIAEVAREFATT-----RPALAMA -GETV---AFQSNGPDAVRAVQMLNLLVGNLNRPGGVYPDGGSRVG--------------- -----PENSFTELLS---------------------------------------------- ------------------------------LVAAMR--DGR--------------FRVAMI -HG-DPVHA-------------------------------IPPATGFQE-ALA-----RVP -FIVSFSSLMDDTALQ--ADLILPD-HAALE-SWGDVIPLAGTRD--------RVIGL-MQ -PVVTPLF-D---T--------RQF------PDVLMAMA-DKLGGKTAAF----------- ------------------PYQ--SYQE-------------------MLKGTMEKRVGRAAR -RD----------------------------------FETVWVELLR----QGG------- --------------LFETRQGQEKGYRR--------------------------------- -------------------------------------------APGSSLPNPAE-PRFAGD -EK-------RFPLHLLVYPSIAFYDGRGAPLP-----------WLQQLPD-PMTTV---- ------VW-----DSWVEINPRTAAE-MGI-------------G-------------FGDL -VEVT---SP-Q--------------GA---M--R-LPAVIYPGIRPDMVAIPLG-QGHR- ------------------------GMGRYAR-------GRGS------NPLVLLA-LIT-- ------DGTET-------RPA----WH--AT-----RVRLTRISEKGELVTAGHPQGSYRS -ELIEI------------------------------------------------------- -- ->ACTB1_Mariprofundus_ferrooxydans_ZP_01451016 ------------------------------------------------------------- ------------------------MSENKSSSNWTRRSFIK-A-------MGLGGAAGSAL ----VLSGC-GDTDIINEVDIEVRKEKVEPN--VDPQDY------VRPGIEMYYASTCRQC -PAGCGVHARIR-EGR----VLKLEG--------NPVSDVNH------------------- ----------------GRLCPMGQAGLQSHYNPD-RLTKPMLRKG---------------- -----------------------GK-LVEISWD-EAEDVL--------RKNLGRK------ ---------------NAKLA----------------------------------------- --------------------------WLSGATSGH----------------HRALVDAYL- -A-----AAGAKN-HFVFD-TLPPAVGHAANQEMFG----SYMP-RLDF-DKARLIVSFGA ---DFLG----TW-MSPVQFSTQYAEFRN--------APRGT----LVQIEPKMTLTGANA -D----RWIPARPGTEGHLALALASLLVQKSEYAD------RVPADVVASLKD-------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------VNVDEVAKLCDIPV---------ERIHHLHHLMTD-----RSPSLVLS -GASA---EGVQHGFETARAILMLNVLLGNVGETIL------------------------- -----PRSEDPFPALAPRMGGWS-------------------------------------- ------------------------------EVKAMV--DGLNKGS----------FDTVVV -FGSNPLYQ-------------------------------APGFMQADK-AFD-----KAK -FRISFSMFPDETTMA--CDLVLPV-HSYLE-EWNTTMPAYAATD--------GYLGL-QQ -PVMNPVF-GSHAT--------RSF------GDLMLDVL-KHMDPNFKQ------------ -------------------WD--SYQA-------------------YVMGALWTMRPALVK -QYKPSVPGQT--------------------------EEEAFKQGIL----SDG------- --------------FVQMKVAKAAKIE---------------------------------- -------------------------------------------AKVSAVTLPAE------- ------KANANYPFRLIPSARLGLWDGRHANVP-----------WLQELPD-QLTEV---- ------VW-----DSWIEIHPKTAEK-LGV-------------I-------------TGDV -VQVE---SS-A--------------GK---A--K-VKVVVFPGIHPDAVAIPLG-QGHT- ------------------------EYGRYAK-------GVGV------NPFSILA-ALF-- ------DGKTG-------ELA----TY--AT-----DVKVAKIESRGKLVTLANGDLVLES -NTSTQAG-RELVKTTTAENFDLTEKGA--------------------------------- -- ->ACTB1_Sideroxydans_lithotrophicus_ES_1_YP_003523268 ------------------------------------------------------------- ---------------------------MMTENDFNRRDFLK-V-------LGWGGT---AV ----ALSGC-GNTSIQDG------QETVTSY--VELPSY------VIPSISNYFNSTCAQC -DAGCNIMGRVR-EGR----VLKAEG--------NPNSPINR------------------- ----------------GKMCGLGQSGVQAHYNPD-RVRQPLL------------------- --------------------KGEA-----ITWD-KALGVI--------AQNLSAVK----- ---------------GAEVA----------------------------------------- --------------------------FLTGGMSGH----------------VQALLGNYM- -D-----ALGSKN-HFSYE-AISPAVLRAANKKAYG----VSMP-RYRI-DKAKVVVSFGA ---DFLG----AW-VSPVHFTQQYAQFRK----GNRPEGRGV----LVQIEPKMTLTGANA -D----RWIAVRPGTEGVLALGIINALGKAGLSIP----------ADIAAVSN-------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------AYTAERVSGETDVSA---------EQIGKLAALLKE-----RTPSLVLA -GGAV---EGYAHGSQNATAIALLNRVLGNVGKTVEAT----------------------- -----ASVPFPQIAPTVGN------------------------------------------ ------------------------RSSLIGLNDGLA--AGK--------------YKVVFS -YGVNPVFS-------------------------------APASLKFRD-NFA-----KAE -FKVAFAQYMDETALA--ADLVLPL-DSAME-DWGTVVPEYMAAPAEDHSAAYAQMSF-RQ -PLMQKVFPD---T--------RGV------GDILLALL-KQREADKYKEF---------- ----------------EDFYS--YLRS-------------------AVLKNKVALGGKATD -D-----------------------------------DETFWD-NTL----SQG------- ------------IVPFKGIANPVSAK----------------------------------- -------------------------------------------ASAAGLKLPSA-V----- ------TADSSYPLRLIPAVSASMRDGRNANEP-----------WLQESPD-PLTTI---- ------VW-----DSWVEINPKTAAK-LGI-------------V-------------EGDI -VEVA---SK-S--------------GS---I--R-TQAYLFPGIHPDAVSVPVG-YGHE- ------------------------AMGRYAK-------GVGA------NVFGMLD-TVF-- ------DKETG-------ELA----LNETSVKISKVGQRVIIVKEEGPVGGSQDGKKKIAV -QVSADKVDLSKEV----------------------------------------------- -- ->ACTB1_Gallionella_capsiferriformans_ES_2_YP_003846257 ------------------------------------------------------------- -------------------MIDSGSVKQMAGHPFDRRDFLK-V-------LGWSGA---AV ----ALSGC-GNTSVEDG------RETVVSY--VEANDY------MVPGIGVYFNSTCAQC -DAGCSVNGRVR-EGR----VLKLEG--------NPDSAINK------------------- ----------------GKLCGLGQAGVQHHYNPD-RVREPLLRNG---------------- -------------------NKGEA-----ISWD-KAYALI--------AEKLAGVQ----- ---------------GEEIA----------------------------------------- --------------------------FLSGGVSGH----------------LKVLLGNYL- -D-----SLGTKN-HFVYE-AIAPSVVRAANVKAFG----VEMP-RYRF-DKAQVVLSFGA ---DFLG----SW-VSPVHFSQQYAQFRK-----GVNGQRGV----LIQVESKMTLTGANA -D----RWLAVKPGTEGVLALGIINALGMATGDVA----------ELVKG----------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------YDKARVSRETGVST---------GQIDKIAALLKL-----RSPSLVLA -GSAA---EGYAHGSQNAAAINLLNQVLGNVGKTIEAP----------------------- -----VSVPFPQMAP---------------------------------------------- ------------------------SKGNTVALKNLN--DGLAAGK----------YKVVFN -FAANPVFT-------------------------------APGAFKFKD-NFA-----KAG -FKVAFAHYLDETALQ--ADLVLPL-DSALE-DWGTQVPEYLTEG--------AQINI-QQ -PLMERLHAD---T--------RGM------GDILLSLI-KQKKADEYKGF---------- ----------------EDYYA--YLRG-------------------AVLQNKGALGGGGVE -------------------------------------DDTFWNDTLTNGIVKLA------- --------------GTTTSLAAHAS------------------------------------ -------------------------------------------AAGLLLPAEAE------- -------ADEHFPLHLIPGVTASLRDGRHTNQP-----------WLQESPD-PLTTI---- ------VW-----DSWVEIHPKKAAE-LGI-------------V-------------EGDI -VEVT---SK-T--------------GS---V--K-AQVYLFPGIHPEAISIPVG-RGHD- ------------------------AMGRYAK-------GYGV------NPFQIMD-AVF-- ------EAATG-------ELA----MH--ET-----RVKISKTGQRVLVVKDEGAAGALQM -GRKIAARVSTDQVDLSKEV----------------------------------------- -- diff --git a/assets/trees/dmso/dmso.refpkg/dmso_phylo_model.json b/assets/trees/dmso/dmso.refpkg/dmso_phylo_model.json deleted file mode 100644 index 7d4156c1..00000000 --- a/assets/trees/dmso/dmso.refpkg/dmso_phylo_model.json +++ /dev/null @@ -1,11 +0,0 @@ -{ - "empirical_frequencies": true, - "datatype": "AA", - "subs_model": "LG", - "program": "RAxML version 8.2.9", - "ras_model": "gamma", - "gamma": { - "alpha": 2.776473, - "n_cats": 4 - } -} diff --git a/assets/trees/dmso/dmso.refpkg/dmso_refs.fasta b/assets/trees/dmso/dmso.refpkg/dmso_refs.fasta deleted file mode 100644 index f147286f..00000000 --- a/assets/trees/dmso/dmso.refpkg/dmso_refs.fasta +++ /dev/null @@ -1,917 +0,0 @@ - ->Acidovorax delafieldii_NARG -MSHFLDRLSYFSQPRENFAQGHGQTNGEDRTWEDAYRDRWAHDKIVRSTHGVNCTGSCSWKIYVKGGIVT -WETQQTDYPRTRPDLPNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLKHWRAAMALAKSPVDAWASIV -ENDASRSEWQKQRGLGGFVRSTWDEVNQMIAAANVYTIKKHGPDRIIGFSPIPAMSMISYAAGSRYLSLI -GGVCMSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSSYIIAWGSNVPQTRTPDAHFLTEVRYKGTKVVS -ITPDYSEVAKLGDLWMHPKQGTDAAVAMAMGHVILKEFYFKDGGKGRSAYFDDYARRYTDLPLLVVLKEK -TLPDGRTVMVPDRYVRASDFPGQLDQSNNPDWKTVGYDELGQVTLPNGSIGFRWGADGRADQGLWNLENK -EARTGNTVKLKLSVIEDGVQAHDVADVAFPYFGGVQTPNFTANEQGGDVIVRRVPVSHLELAGHEAQGRV -MVATVFDLLAGNYGIDRGLPGEEPGGSYDADRPYTPAWQEKITGVPRDQIITVARQFADNADKTHGKSMV -IIGAAMNHWYHCDMNYRGIINMLMLCGCIGQSGGGWAHYVGQEKLRPQTGWTALAFALDWIRPPRQMNST -SFFYAHTDQWRYEKLGMEEILSPLADKKSYSGSMIDYNVRAERMGWLPSAPQLKTSPLQVAKDAAAKGMD -AKDYVVQSLKNGSLTMSCEDPDHPDNWPRNMFVWRSNILGSSGKGHEYFLKHLLGTTHGVQGKDLGQDEA -KPEEVQWHAKAPEGKLDLLVTLDFRMSTTCLYSDIVLPTATWYEKNDLNTSDMHPFIHPLSTAVDPAWQA -KSDWEIYKGFAKAVSEVSVGHLGVEKDVVLTPIMHDTAGEMAQPYGVRDWKRGECELIPGKTAPQVTVVE -RDYPNLYKRFTALGPLMDKAGNGGKGIGWNTQTEVGQLGDLNGRVKEEGVTQGMPRIVTDIDATEVVMML -APETNGHVACKAWEALGKQTGRDHVHLALHREDEKIRFRDIQAQPRKIISSPTWSGLESEKVSYNAGYTN -VHEYIPWRTLTGRQQFYQDHPWMRDFGEGFVSYRPPVHLKALHEVEGKKPNGNREIALNFITPHQKWGIH -STYSDNLIMLTLNRGGSVVWLSEDDAARAGIVDNDWVELFNANGAIAARAVVSQRVNPGMVMMYHSQEKI -INTPGSEITGTRGGIHNSVTRVVLKPTHMIGGYAQYSYGFNYYGTIGTNRDEFVLVRKMDRVDWLDDDVS -DAPAHA - ->NxrA1_Nitrospira_defluvii_YP_003798853 -MMQLSRRQFLKVSAGTVAVAAVADKALALTALQPVVEVNNPLGEYPDRSWERVYHDQYRYDSSFTWVCSP -NDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGTFAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKG -WKQWMDDGSPELTSDVKRKYKFDSRFLDDMVRVSWDTAFTYVAKGLIVIGTRYSGEAGARRLREQGYAPE -MIEMMKGAGVRTFKHRAGMPILGMMGKHANTRFNNCVLPLLDSWIRKVNPDQAQGGRYWNNYTWHGDQDP -SQPWWNGTQNCDVDLSDMRFTKLNTSWGKNFVENKMPEAHWKLESMERGARLVIITPEYNPTASRADYWI -PVRPETDGALFLGASKIILDENYQDIDFIKGFTDMPLLVRTDTLQYLDPHEVLKDYQVPDFTKSYSGRVQ -GLSQDQVQRLGGMMVWDLAKGKAVPLHREQVGVHLAQSGIDPALTGTYRIKLLNGREVDVMPIYQLYTIH -LQDYDLDTVHQVNRAPKDLIVRWARDCGTVKPAAIHNGEGVCHYFHMTSMGRAAALVMMLTGNIGKFGTG -CHTWSGNYKVGIWQAAPWSGAGASVYLGEDPWNLNLRDDVHGKEIKYRKYYYGEEPGYWNHGDNALIVNT -PKYGRKVFTGKTHMPSPSKVRWVVNVNILNNAKHHYDMVKNVDPNIEMLVTQDIEMTSDVNHADVAFAVN -SWMEFTYPEMTATVSNPWVQIWKGGIRPLYDTRNDLDSFAGVAAKLKEMTGEQRMADTYKFVYHNRVDIY -VQRILDASTTFFGYSADVMLKSEKGWMVMCRTYPRHPLWEETNESKPHWTRSGRLETYRIEPEAIEYGEN -FISHREGPECTPYMPNAIMTTNPYVRPEDYGIPVTAQHHDDKTVRNIKLPWSEIKQHPNPLWEKGYQFYC -VTPKTRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYCYVDGNPVD -RPYRGWKPSDPFYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTAKSVKGHETRPDGRAIAVDTGYQSNFR -YGAQQSFTRSWLMPMHQTDSLPGKQANALKFKWGFEIDHHAVNTVPKECLIRITKAEDGGIGARGPWEPV -RTGFTPGQENEFMVKWLKGEHIKIKV - ->NxrA2_Nitrospira_defluvii_YP_003798871 -MQVSVSRRQFLKISAGTVAAVAVADKVLALTALQPVIEVGNPLGEYPDRSWERVYHDQYRYDSSFTWCCSPNDTHGCRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGTFAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQWMDDGSPELTPDVKRKYKFDSRFLDDLNRVSWDTAFTYVAKAAVLIATRYSGEAGARRLREQGYAPEMIEMMKGAGVRTFKHRAGMPVLGIVGKMMNTRFNGGCLPLLDSWIRKVDAEKAQGGKYYSNYTWHGDQDPSHPFWNGTQNCDVDLSDMRFSKLNTSWGKNFVENKMPEAHWKLESIERGARIVVITPEYNPTAYRADYWIPVRPETDGANFLGAAKIIFDENLQDIDYIKEFTDLPLLVRTDTLQYLDPRDVIADYKFPDFSKSYSGRIQSLKPEQVERLGGMMVWDLAKGKAVPLHREQVGFHFKESGIDPALTGTFRVKLLNSREIDVMPIYQMYQVHLQDYDLDTTHQITRAPKDLIVRWARDSGTIKPAAMHNGEGVCHYFHMTEMGRAAAFIMTITGNIGKFGTGCHTWSGNYKAGIWNAVPWSGAGLAVHTGEDPFNLTLDPNAHGKEIKTRSYYYGEEVGYWNHGDTALIVNTPKYGRKVFTGKTHMPSPSKVRWVTNVNILNNAKHHYDMVKNVDPNIEMIVTQDIEMTSDVNHADVAFACNSWMEFTYPEMTGTVSNPWIQIWKGGIRPLYDTRNDADTFAGVAAKLAEMTGDARFRGVFHFVYMNRVDVYPQRMLDASATCYGYSADVMLKSEKGWMVMGRTYPRHPLWEETNESKPQWTRSGRIETYRIEPEAIEYGENFISHREGPECTPYLPNAIFSNNPFIRPDDYGIPITAQHHDDKHVRNIKLPWAEIKRHPNPLWEKGYQFYCVTPKTRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVFVDGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRPDGRAIAVDTGYQSNFRYGAQQSFTRNWLMPMHQTDSLPGKHTIAWKFKWGYAIDHHGINTVPKECLIRITKAEDGGIGARGPWEPVRTGFTPGQENEFMIKWLKGEHIKIKV - ->NxrA_Candidatus_K_stuttgartiensis_CAJ72445 -MKLTRRAFLQVAGATGATLTLAKNAMAFRLLKPAVVVDNPLDTYPDRRWESVYRDQYQYDRTFTYCCSPNDTHACRIRAFVRNNVMMRVEQNYDHQNYSDLYGNKATRNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKRWADDGFPELTPENKTKYMFDNRGNDELLRASWDEAFTYASKGIIHITKKYSGPEGAQKLIDQGYPKEMVDRMQGAGTRTFKGRGGMGLLGVIGKYGMYRFNNCLAIVDAHNRGVGPDQALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLLIQTGKNLIENKMPEAHWVTEVMERGGKIVVITPEYSPSAQKADYWIPIRNNTDTALFLGITKILIDNKWYDADYVKKFTDFPLLIRTDTLKRVSPKDIIPNYKLQDISDGPSYHIQGLKDEQREIIGDFVVWDAKSKGPKAITRDDVGETLVKKGIDPVLEGSFKLKTIDGKEIEVMTLLEMYKIHLRDYDIDSVVSMTNSPKDLIERLAKDIATIKPVAIHYGEGVNHYFHATLMNRSYYLPVMLTGNVGYFGSGSHTWAGNYKAGNFQASKWSGPGFYGWVAEDVFKPNLDPYASAKDLNIKGRALDEEVAYWNHSERPLIVNTPKYGRKVFTGKTHMPSPTKVLWFTNVNLINNAKHVYQMLKNVNPNIEQIMSTDIEITGSIEYADFAFPANSWVEFQEFEITNSCSNPFIQIWGKTGITPVYESKDDVKILAGMASKLGELLRDKRFEDNWKFAIEGRASVYINRLLDGSTTMKGYTCEDILNGKYGEPGVAMLLFRTYPRHPFWEQVHESLPFYTPTGRLQAYNDEPEIIEYGENFIVHREGPEATPYLPNAIVSTNPYIRPDDYGIPENAEYWEDRTVRNIKKSWEETKKTKNFLWEKGYHFYCVTPKSRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHIHPQAARDLGIEDGDYVYVDANPADRPYEGWKPNDSFYKVSRLMLRAKYNPAYPYNCTMMKHSAWISSDKTVQAHETRPDGRALSPSGYQSSFRYGSQQSITRDWSMPMHQLDSLFHKAKIGMKFIFGFEADNHCINTVPKETLVKITKAENGGMGGKGVWDPVKTGYTAGNENDFMKKFLNGELIKVDA - ->I_OP1_uncultured_candidate_division_bacterium_BAL57377 -MAVSRRRFVKATAALTGAALVTDTLGLQGFKFVPEIKNPLEFYPNRDWEKIYRDQFRYDSSFTFLCAPNDTHNCLLRAYVRNGVIVRIGPTYGYNEARDLYGNKVSARWEPRCCQKGLALGRRFYGDRRVNGVWVRKGFFDWVRAGFPRDPHTGAPPKEYFNRGQDSWLKLSFDEAYGIVAQALFNIVQTYSGPEGAARLKAQNYDPTMLEAMHEAGTQTVKVRGGMPFLGATRIYGLARFANMLALLDAHIRNVSPDQALGGRVWDSYSWHTDLPPGHPMVTGQQTVEFDLFTAENAKLITLWGMNWICTKMPDAHWLTEARQRGAKVITIATEYQATANKADEVIIIRPGTDAAFALGVASVIINEKLYDEEYVKTFTDLPLLVRMDTLKLLRASDIIRDYQPAELTNYAKVLKPDEKPGPPLAQRVQYIPERARQAWGDFVVWDSTKNAPEVITRDHVGQFFAARGIDPALEGSFTVQTTDHQEITVRPVFDLIKEYLKEFTPPKVAEMSWAPSEAIVNLARQIAANKASTLLSHGMGPNHFFNADLKDRALFLIAALTKNIGHFGGSPGSYAGNYRVALFNGLPQYIAEDPFNIELDPTKPATVKSYAKSESAHYYNYGDRPLRVGKKLFTGKTHTPTPTKFMWFANSNSLLGNSKWGYDVIHNTLPKIEAIVVNEWWWTMSCEYADVVFGVDSWGELKYPDMCGSVTNPFVQVFPRTPLPRIFDTRSDIETYMGVAEKFAELTGDARFRDYWHFVRENRVDVYLQRICDASSSLRGYKFTDLEEQARQGTPMLKLLRTYPKIVGWEQTQESKPWYTKTGRLEFYREEDEFIEYGENLPVYREPVDATPHEPNVIVAPKTLSALKPAPPEQYGLKRDDLSTETRQVRNVIKTPEEVVRSQHPRTKDGLKFIFITPKYRHGAHTTPVDLDVLAVYFGPFGDIYRRDKRSPWVGEVYADINPQDAKELGIEDGDYIWIDADPEDRPYRGAKPSDPDYKIARLMGRARYYNGTPRGVVRMWFNMYQATHGTVNAHETRPDKLAKDPQTNYQAMFRYGGHQSCTRAWLRPTLMTDSLVRKDVFGQTIGQGFAPDIHCPVGAPKESFVKITRAEPGGADLKSLWRPAQLGYRPTYESDEMKQYLAGGFIEVT - ->RBG1_10 -MTLSRRRFLKISSLSAAGALVDLPELKFLQFLETVENPLEYYPNRDWEKIYRDQYRYDSSFTFVCTPNDTHACRLRAYVRNGIVIRVEQAYDVQNYTDLYGNKASVMWSPRGCNKGYNLPRRVYGPYRVKHPMVRKGWKEWAEAGFPDPTLPENQQKYFRRGEDSWVKVSWDEGFELVAKGLLHTMEKYSGEKGAEILRKQGYPEEMIEAMHGSGAQTIKIRGAMPLLGATRIFGFYRFANMLGLYDGKLGARGWSNFSWHGDLPPGHPMVTGVKCSDPELNDFRHSKLLVFLGKNMVESKMADAHWWIETIERGGKVVNISPEYSATSSKSDYWIPIRPGTDTALLLGVTQIIIQEKLYDQDFIKKHTDLPLLIRMDNLKLLRPTDIIKGYKNQILTGYSVKVQKIKPELREKWGDFVVWDLKTKKPQTVTREDLGEKIERKGLNPALEGNYKIKLVNGKEIEVKTVFQLYKELLSEYDLETVSQITGSPKNLIYQLAQDLATIKPASIHTGEGVNHFFHCDLVTRAVWLPLALTGNIGKPGANVGHWAGNYKGEVFDGLGVYLNEDPFNPNLDPSAKLEDIKLKKYYKGEEVCYWNYEDRPLIVKGKCFTGKTHMPTPTKAEWVGNGNLLNNAKWAHNMIANVEGKVEMIVYNEIEWTASCEYADVVFPVHSWMELTLPDMTASCSNPFLQVWKGGIKPIFDTKQDNEVLAGVAAKLSELTHDNRYKDYWKFVLEGNNEVYLQRILDACSTTKGYKIDELLKSDRGWLMNFRTYPRIPFWEQIQESKPFYTKTGRMEFYREEDEFIDYGENLIVHREPVEATPYLPNVILGTHKAIRPNSYGISPESINADERQVRNLKMSWKQVKLSKNPLWEKGFRFYCLTPKSRHTVHSSWSVLDWNMIWQSNFGDPYRMDNRTPGVGEHQMHMNPLDAKELGINDGDYAYVDANPEDRPYTGWKEEDPFYKVSRLMVRVKYNPAYPRGITMIKHASFIATHKSVKAHESRPDKRAVSEDTGYQSSFRYGSQQSITRGWLQPTMMTDSLVRKNYMGQEIGEGYEIDVNAPNTCPKETLVKIIKAEDGGMGGKGKWEPARTGYTPAGENKDMKKFLEGGFILKV - ->A_Nitrobacter_hamburgensis_YP_578638 -MSWILDLVNPRERKWEEFYRNRWSHDNVFRSTHGVNCTGGCSWAIYVKDGIITWEMQQTDYPLLERSLPP -YEPRGCQRGISASWYVYSPIRVKYPYIRGPLLDMWREAKASSADPVQAWGALIGDEQKRSRIQKARGKGG -FRRAKWEELVELIAAASLHTARKHGPDRIMGFSPIPAMSMLSFAAGTRFLSLMGGSLMSFYDWYADLPTS -FPEIWGDQTDVCESADWYNSKFIVSMASNMNMTRTPDVHFISEARTEGTKFVVLSPDFSQIAKYCDEWIP -IQAGQDTALWMAANHVILKEYYVDRQVPYFVDYIKRYTDLPFLVELESNGNTYKTGRLLRSNRVPRYKDV -ENGDWKMLLLDANSGELRAPKGQVGDRWGSVHGKWNLSGEDTLDNSPLDPVLSFIDRSDDVVQVGFDDFA -NGRIVSRGVPVKRVATDKGEILCATGFDIMMSQFGISRGLEGAFATSYDDEDAPYTPAWQERHTGIGRET -AIRFAREFATNAELTNGKSMVIVGASANHWYYNNLCYRSATVALILCGCCGVNGGGINHYVGQEKLAPVA -PWATVALALDWAKPPRLVQSSTWHYAHSCQWRYEQEFTEYGLTAPNPKWAKGHAIDLEAKAVHNGWMPFT -PHFNRNPIEVAAEAERSGAKNVQDIETYVVDQVVSKKLQMAIDDPDAAENWPRMWFIWRGNAIQSSAKGH -EFFLRHYLGAHDNAIAEDRAKGKAQVVKYHETAPRGKYDLVIDLNFRMNTTSLYSDIVLPTAFWYEKNDL -NTTDLHSFLHVLGQAVPPVWESKTDWEIFKLIGKKVSELAPLAFSKPVRDVVLQPLMHDTPDELAQPEIL -DWSLGECKAVPGKSFPHVRVVERDYANLYNKFISFGPKAREDGISAVGVQIPIKKQYDQMLDNPIMPMPD -PRHMRCVEWGGKRYPSLEDVLDACNTVLLCAPEANGEVCYQAFHNEEHHVGLPLVDLAEPNRNVAATFYD -LTRQPRRIITSPCWTGMVNDGRAYSAWCMNVERLVPWRTLTGRQSLYLDHQWYLDFGEHIPTYKPRLNPR -KTGDIVKSRVDDRSLVLNYITPHGKWNIHSTYKDNHRMLMLSRGMDPVWINDRDAEKVGIEDNDWVEVYN -DNGVVVTRANVSRRIQPGTCMYYHAVERTVYIPKSQERKWRGGGHNSLTRTRINPLFLAGGYAQFTYGWN -YWGPTGILTRDTHVVVRKMEKLEW - ->B_Nitrobacter_hamburgensis_YP_578186 -MTTGLAAGQRTEETQMSWILDLVNPRERKWEEFYRNRWSHDNVFRSTHGVNCTGGCSWAIYVKDGIITWE -MQQTDYPLLERSLPPYEPRGCQRGISASWYVYSPIRIKYPYVRGPLLDMWREAKASSADPVQAWGALVGD -EQKRARMQKARGKGGYRRAKWEELVELIAAASLHTARKHGPDRIMGFSPIPAMSMLSFAAGTRFLSLMGG -SLLSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMASNLNMTRTPDVHFIAEARTEGTKFVVLS -PDFSQIAKYCDEWIPIQAGQDTALWMAANHVILKEYYVDRQVPYFIDYVKRYTDLPFLVELEPNGTTYKT -GRLLRARHVPRYKDVENGDWKMLLLDANSGELRAPKGQVGDRWGSVHGKWNLSGEDTLDNSPLDPVLSFI -DRSDDVVQVGFDDFANGRIVSRGVPVRRIATDKGEILCATGFDIMMSQFGISRGLEGAFATSYDDEDAPY -TPAWQERHTGIGRETAIRFAREFATTAEYTNGKSMVIVGASANHWYYNNLCYRSATVALILCGCCGVNGG -GINHYVGQEKLAPVAPWASIALALDWSKPPRVVQSSTWHYAHSCQWRYEQEFTEYGLTAPNPRWAKGHAI -DLEAKAVRSGWMPFTPHFNRNPIEVAAEAERAGAKSTEDIATHVIDQVASKKLNLAIEDPDAAENWPRLW -FIWRGNAIQSSAKGHEFFLRHYLGTHDNAIAEDRAKGKTHTVKYHDTAPRGKYDLVVDLNFRMDTSSLYS -DIVLPTAFWYEKNDLNTTDLHSFLHVLGQAVPPVWESKTDWDIFKLIAKKVSELAPLAFSKPVRDVVLQP -LMHDTPDELAQPEILDWAEGECKPVPGKSFPHVRVVERDYANLYNKFISFGPKAREDGVSAVGVNVPIKK -QYDQMLDNPIMPMPDPRHMRCVEWGGKRYPSLEDVLDGCNTVLLCAPEANGEVCYQAFHNEEHHVGLPLV -DLAEPTRNVATTFYDLTRQPRRLLTSPCWTGMMNDGRAYSAWCMNVERLVPWRTLTGRQTLYIDHQWYLD -FGEHIPTYKPRLNPRKTGDIVKSRVDDRSLVLNYITPHGKWNIHSTYKDNHRMLMLSRGMDPVWINDRDA -EKVGIEDNDWVEVYNDNGVVVTRANVSRRIQPGTCMYYHAVERTVYIPKSQERKWRGGGHNSLTRTRINP -LFLAGGYAQFTYGWNYWGPTGILTRDTHVVVRKMEKLEW - ->Nitrobacter_winogradskyi_gb_ABA05326 -MSWILDLVNPRERKWEEFYRNRWSHDNVFRSTHGVNCTGGCSWAIYVKDGIITWEMQQTDYPLLERSLPP -YEPRGCQRGISASWYVYSPIRVKYPYIRGPLADLWHEAKASYPDPVQAWASLVEDEEKRNRIQKARGKGG -FRRAKWEELIELIAASCLYTARKHGPDRVMGFSPIPAMSMLSFAAGTRFLSLFGGGLMSFYDWYADLPTS -FPEIWGDQTDVCESADWYNSKFIVSMASNMNMTRTPDVHFISEARTEGTKFVVLSPDFSQIAKYCDEWIP -IQAGQDTALWMAANHVILKEYYIDRQVPYFIDYVKRYTDLPFLVELEPNGNTYKTGRLLRSNRVARYKDV -ENGEWKMLVLDTATGEPRAFKGQVGDRWGSTHGKWNLSAEDTLDNSPIDPVLSFIDQSDGVVQVGFDDFV -NGSVVSRGVPVKRIATDKGEVLVTTGFDIMMSQFGHSRGLEGSFATSYDDEDAPYTPAWQERHTGIGRET -AIRFAREFATNAELTNGKSMVIVGASANHWYYNNLCYRSATVALILCGCCGVNGGGINHYVGQEKLAPVA -PWSTVAMALDWNKPPRVVQSSTWHYAHSCQWRYEQEFTEYGLTAPNPRWAKGHAIDLEAKSVRCGWMPFT -PNFHRNPIEVVAEAERAGAKSTADIATYVADQVASKKLDLAINDPDAEENWPRVWFIWRANAIQSSAKGH -EFFLRHYLGAHDNVIAEERAKGKTTTVKYRDTAPQGKYDLVVDINFRMNTTGLYSDIILPTAFWYEKNDL -NTTDLHSFLHVLGQAVPPVWESKTDWEIFKLIAKKVSELSPLAFSKPVRDIVLQPLMHDTPDELAQPEIL -DWAEGECKLVPGKSFPHVRVVERDYANLYNKFISFGPKAREDGISAVGVNIPIKKQYDQMLENPIMPMPD -SRHMRCVEWGGKRYPSLEDVLDACNVVLLCAPVANGEVSYQGFVNEEQHVGLPLADIAEPTRGVSSTFYD -LTRQPRRILTSPCWTGLVNDGRAYSAWCMNIERLVPWRTLTGRQSLYLDHQWYLDFGEHIPTYKPRLNPR -KTGDIVKSRVDDRSLVLNYITPHGKWNIHSTYKDNHRLLMLSRGMDPVWINDRDAEKVGIEDNDWVEVYN -DNGVVVTRANVSRRIQPGTCMYYHAVERTVYIPKSQERKWRGGGHNSLTRIRINPLFLAGGYAQFTYGWN -YWGPTGIFTRDTHVVVRKMEKVEW - ->Nitrobacter_sp_Nb_311A_ZP_01048070 -MSWILDLVNPRERKWEEFYRNRWSHDNVFRSTHGVNCTGGCSWAIYVKDGIITWEMQQTDYPLLERSLPP -YEPRGCQRGISASWYVYSPIRVKYPYIRGPLYDLWREAKASHPDPVQAWASLVGDEQKRLRMQKARGKGG -FRRAKWEELVELIAAAALYTARKWGPDRVMGFSPIPAMSMLSYAAGSRFLQLFGGVNMSFYDWYADLPTS -FPEIWGDQTDVCESADWYNSKFIVSMAANMNMTRTPDVHFIAEARTEGTKFVVLSPDFSQIAKYCDEWIP -IQAGQDTALWMAANHVILKEYYIDRQVPYFIDYVKRYTDLPFLVELEPNGNTYKTGRLLRAKRVARYQDV -ENGDWKMLVLDSKTGEPRAFKGQVGDRWGSTHGKWNLSAEDTLDNSPIDPVLSFIDQSDGVVQVGFDDFV -NGSVVSRGVPVKRIATDKGEVLVTTGFDIMMSQFGHSRGLEGSFATSYDDENAPYTPAWQERHTGIGRET -AIRFAREFATNAELTNGKSMVIVGASANHWYYNNLCYRSATVALILCGCCGVNGGGINHYVGQEKLAPVA -PWNTIAMALDWTKPPRVVQSSTWHYAHSCQWRYEQEFTEYGLTAPNPRWAKGHAIDLQAKAVRSGWMPFT -PHFNRNPIELAAEAERAGAKSTDDIVTHVVDQVASKKVNFAIDDPDAEESWPRMWFIWRGNAIQSSAKGH -EFFLRHYLGAHDNSIAEDRAKGKTQRVKYRDTAPRGKYDLVVDLNFRMNTTSLYSDIVLPTAFWYEKNDL -NTTDLHSFLHVLGQAVPPVWESKTDWEIFKLIAKKVSELSPLAFSKPVRDVVVQPLMHDTPDELAQPEIL -DWAEGECKPVPGKSFPHVRVVERDYANLYNKFISFGPKAREDGVSAVGVQIPIKKQYDQMLDNPIMPMPD -PRHMRCVEWGGKRYPSLEDVLDACNTLLMCAPEANGEVCYQGFHNEEHHVGLPLVDIAEPTRGVSSTFYD -LTRQPRRILTSPCWTGMTNDGRAYSAWCMNVERLVPWRTLTGRQTLYIDSQWYLDFGEHIPTYKPRLNPR -KTGDIVKSRVDDRSLVLNYITPHGKWNIHSTYKDNHRMLMLSRGMDPVWINDRDAEKVGIEDNDWVEVYN -DNGVVVTRANVSRRIQPGTCMYYHAVERTVYIPKSQERKWRGGGHNSLTRTRINPLFLAGGYAQFTYGFN -YWGPTGIFTRDTHVVVRKMEKLEW - ->Nitrococcus_mobi_EAR23355 -MGWIQDLINPKTRRWEEFYRNRWQHDNIFRSTHGVNCTGGCSWAIYVKDGIITWEMQQTDYPLLGRGEGGRGIPPYEPRGCQRGISASWYVYSPIRVKYPYGKGVLLDFWREARSSHNNPVEAWSSIVTDENKRKRWQKARGKGGYRRTTWDELLELIASACLYTAQKYGPDRVMGFSPIPAMSMLSYAAGSRFLQLFGGVNMSFYDWYADLPNSFPEIWGDQTDVCESADWYNSKFIVSMASNLNMTRTPDVHFISEARHEGAKFVVLAPDFSQVSKYADWWIPVKKGEDLGLWMAAGHVIYTEFYVKRQVPYFIDYVTRYTDMPFLVKLEKDGDGYRPGRYLTSEEVKKYKKQENAAWKQLVFDRKSNEARCPKGQIGHRHGKHGQWNLKMEDGLDNSPIEPVLSFLGESDDVAMVQFYEFASQTVYKRGVPAKKIDTGSGSVLVATVYDLNMGQYAVNRGLPGDYPESYDDLKPYTPAWQEQFSGIGRQTVIRFAREFAGTAEKTKGRSMVIVGASANHWYHNNHIYRAAINCLIACGCCGRNGGGMNHYVGQEKLAIVAPWNALALAGDWGIKPRLQQSPVWHYVNSDSWRYEGSFEEYAPSPPNAKWAKGHSVDLVAKSVRMGWMPHYPQFNRSPLEVAREAEKAGAKDDKGMADYVVQALKKKNLSFSVDDPDAPENWPRVWFIWRGNAMQSSAKGAEFFLRHYLGTHDNAVAEERAKPHVKHVKFREPAPRGKFDLVVDINFRMDSTALYSDIVLPTAFWYEKNDLNSTDLHSFIHPLGQAVPPVWESKSDWDIFKAFAKKISEMAPSVFSEPFKDVVAAPLTHDTPDEIAQRDVKDWLEGECEPIPGKTMPHFRVVERDYSLLYNKYISLGSAIRENGISGNGCSFPITKQYDELTNQPVGGSPDPRHRRAVEWGGKRYPCVEDALDAANVLLYLAPETNGEVAYQAFKSEQEHCGVPLTDLAEPYRGHQVTFYDLTRQPRRLLCSPVWTGNCGDGRAYSAWTLQIDRLVPFRTLTGRQHIYIDHPWYMDFGEHLCTYRPKLDYKKIHDLDNSPIDDKTLILNYITPHGKWNIHSTYKDNHRMLTLSRGMDPVWINDKDAARVGLKDNDWVEVYNDNGVIVTRANVSRRVQSGMCLYYHAVERTIYIPKSQIRGGRRAGGHNSVTRTRINPVYLAGGNAQFTYLFNYWGPTGIMTRDTHVAVRKLEKLEW - ->Beggiatoa_sp_PS_ZP_02000390 -MAVTGAGAAVISQQAISATQLLTPVAIDNPLSNYPNRDWEKTYRDLYHYDSSFTFLCAPNDTHNCLLRGY -VKNGVVTRIAPTYGYQKAKDLDGNQSTQRWDPRCCQKGLALVRRFYGDRRCKRPMIRKGFKDWVEAGFPR -LPETGAVDQKYLQRGRDSWVGASWDEAFELAGKALTNIAQTYTGEEGQKKLLAQGYDPLMVEATEGAGTQ -VLKFRGGMPPLGMTRVFAQYREANAMALLDDKIRGKGTDSLGGRGFDNYSWHTDLPPGHPMVTGQQTVDF -DLCNVERTNLLIVWGMNWITTKMPDSHWMTEARMKGTKVVVIAAEYSATSSKADEVFVVRPGTTPALALG -IAQVLISENLYDAPYVKANTDLPLLVRMDTAEMLRAGDVFKDYQLAKLENNTLVVPTGEKGPPMHQQKGP -ILDEKQRADWGDFVYWDASESKPVAMNHDQVGKHFSGNPQLTGEFAVPLASGETVQCRTVFDVTKEMLDG -SYTPEDVAKLTWTSADGIRGLARQIAANQSNTLFTVGMGPNQFFNSDLKDRNIFLVAALTQNIGKIGGNV -GSYAGNYRASFFNGLAQFIGEDPFNPELDPTKPAKLRKRWKAESVHYFNHGDTILRMGKAVLTGKTHIPT -PTKAFHVSNSNSLIGNVKGHYDFVINTLSRVEFIAQNEWWWTASCEYADIVFAVDSWAELKYPDMTISVT -NPFLYTFPATPLPRIHDTRSDLEVAAGICGAIGKVTNDSRHKDYWHFINKGEVRPHIQRVLDHSNATRGY -KIEDLEKLANEGIPAILQTRTYPKVGAWEQGNENKPWYTKTGRLEFYREEPEFRDSGENIVVHREPIDST -RFEPNVIVAKSHPLLRPKTPEDYGVPSSDMSGDTRQARHVVKTVDEVLNSEHPLHKEGYDFVFHTPKYRH -GAHTTAVDTDIVAAWFGPFGDMLRRDRRMPFVAEAYVDINPDDAKGLGIEDGDYVYIDADPHDRPFKGWQ -KYPEGYKVARLLVRARYYPGTPRGVTRMWHNMFGATFSSVRGQETNPTGLAKSPETGYQSLYRGGSHQSC -TRGWLKPTWMTDSLYVKGLMGQKITQGFVPDVHCPTGAPREALVRIIKAENGGIDGKGLWSPAARGLRPT -YENDILKQFMAGKFVELA - ->Hydrogenobaculum_sp_Y04AAS1_YP_002121006 -MISRRDFLKNGSVFLAALSTPGFGKKLFEPLVIVGNPLASYPNRGWEKIYRDIYKPDETTVILCNPNDTHGCYLNAYVKNGIITRLEPTYKYGDATDIYGIKASHRWEPRCCNKGLALVRRFYGDRRIRGPFVRKGYYEWYKADFPRDENGKPPSKYFINRGKDEWLKVSWEEVSDIIAKSLINIAKTYSGEKGKAYLKAQGYPEEMIDTMAGAGTRTLKFRGSMPWLAVLRYVGQYRMSNMMALLDSNIRKVEPDKALGGVGWDNYSEHTDLPPAHTLVTGQQTVDFDLVTWEHAKLIVLWGMNPYGTKMPDSHWLTEAQIKGIKVIVISNDFMATARTADKVVITRTATDGALALSMAYVIMKEKLYDENFVKSFTDLPLLVRMDNAKLLRASDIIPNYIPKALNQAVVYNPSKQMPPPPMKQEKQYIPIQLRDQDINDFVVWDVKTNSPKVVTRDEVGKYFDMSSLDPALTGEYEVELVNGEKVKVKPNFQAYIELLEENYTPETVEEITGVPANVIRELALEIANHKGTTKITTGMGVNQYFHGDLIVRAIFLVAALTGNVGRESGNIGSYAGNYRLAVFNGVGQWNAEDPFNIELDPSKLAKVKFYWKGESQHYFADGDRPLKVGDKMLTGKTHMPVPTKFMWMADNNSGLGNQKWAYNVMFNVLPNVECVVTNDWWWSLSCEYSDIILGVDAWDENRFWDISGSCTNPFFLVWPRTKQKRLFDTKNDIETYALVAKRLSELTGDKRFKEYWHFVFEEKPEVYIQRIINASSNLKGYKIEEVAAKAEQGIPSLVMTRFYPKFIGYDQTVDGKPWYTKTGRLEFYREEDTFINVGENLIVHREAIDSTPYEPNTIVIAKKHPLLRPLDPKSYGLSSEEMLKDTELRQARAVFISPAKLKDTKHPLRVSFGATHIVHTPKFRHTTHSATGDVDIVALLFGPYGDMYRHDKRTPYVVDAFIEINTHDLQKLGINDGDYVWVDADPQDRPFIGWQNKPEEYEVARLLLRVRGSFSTPPGLAKIWFNMYGSSHGSVKGTKVNKNGLAENPVTGYQSFYRRGSQQSVTRGWLNPTLMGDTLVRKDLFGQTLNKGFMLDVYCPTGAPREGFAKITKAENGGIGNVGLWRPLSIGFRPQNPNKYFKKYLEAGYVIFV - ->Hydrogenobacter_thermophilus_YP_003433365 -MSDLTRRDLLKMGGLSLTAMLSPSFAFRVMEPVVRVENPLAYYPNRDWERFYRDIFKSEATFTFLCAPNDTHNCLLTAHVKNGVITRIEPTYKFGEATDIYGLKASHRWDPRCCNKGLALMRRFYGDRRVKGPMVRRGFYEWYKAGFPRDPITGKPLEKYFQRGKDKFIKVTWDEVADIIAKTLINIATTYSGEEGRKRLEAQGHYPKPMLDAMEGAGTRVLKFRGSMPFLAVVRYTSPYRFANMMALLDSHIRGVGPDKALGGRGWDNYAFHTDLAPGHPMVSGQQNVEFDLCMWEHSKLIILWGMNPFTTKMPDCHWLTEARIKGSKVIVISNDYSPTARASDELIVVRTGTDTALALSIAYVIMKEKLYQERFVKSFTDMPLLVRMDNGKVLRARDIIPNYQPQPLQKAVVFKPGETLPPFYKQDKQYIPEPIRKGDMDDFVVWDTKSNSPKVITRDHVGEDFWKLGIDPALYGTYRVKTVEGKEVEVKPLFQVYLEFFEKSYTPKQAEVITGVPAKKIEKLAREIASHPRNMKLAQGMGVNQYQHADLKDRAMYMICALTDNIGHATGNIGSYAGNFRLALFNGAPQYLAEDPFNIELDPEKPAKVKFYWKPESAHYYSHDDHPQYMGEHLITGKTHMPTPTKFVWFVDANSALGNAKWQYNIIMNTLPKIECIVTNEWWWSMTCEYSDIVLGVDAWNENKYWDIAGSVTNPFVYVWPKTGHRRFFDTKNDAEAFAIVANRLSELTGDERFRNYWKFVLEGKQDVVYVQRVINASSNLRGYRLEEIAKKAHEGIPSLIMTRSYPKYVGEDQTKEGMPWYTKSGRLEFYREEPEFMDAGENLPVYREPIDSTHHEPNVIVARPHPLLRPKKPEDYGLSAKDALLSTEWRQARNVLVSPEKLPNTKHPLMVTVGATHIVHTPKYRHSAHTTTGDTDIIVLLFGPFGDIYRHDKRMPFVSEAYIDINPKDLKKMGIQDGDYVWVDADPQDRPFAGWQKRPEDYEVGRLLLRARASNNTPPGCAKIWFNMYGSSHGSVRGTKENPNGLAKNPNTGYQSLYRRGSHQSITRGWFKPTYQTDTLVRKNLMGQIIGKGFELDVHGLIGAPREGFCKIAKAEDGGIGGKGVWRPVRLGYRPMTANEMLKKYLKGEYVK - ->Natrinema_pellirubrum_YP_007282293 -MANRDRSVDSANERSAEGTSVSRRTLLGGAGAAGVAGFAGCLRLFTDDGEGNGNGTSTASKLNPLTEYPNREWESHYRDVWDVDDTYYLACRPNDTHNCYLEANVKNGVVTRLGPSMNYGEAEDLYGNQASDRWDPRVCQKGLSMVERFYGERRVTSPMIRQGFKDWVDEGFPREEDGSMPEEYAKRGEDSWYEASWDEAYEYAAKTFLELADHYSGADAQELLLEQGYDDRVVEEMQGVGTRTMKFRGGMPMLSTIGLFGEYRFANSMALVDHHVRDVGEDEALGGVGGDNYTFHTDLPPGHPMVTGQQTVDFDLANVEYADNIVLAGINWMCTKMADSHWLTEARMNGANVTGIFTDYNATSSKCDELVIIRPATDSALFLGVAQQIIATDGYDAEFVRSNTDLPLLVRMDTGDHLRASDVFEDYDPADLERTQVAPADEHPAPTTVDTADQWITPDQREDWDDFVVYDDAAGGVRAVDREAVGEEFDVDAALEGSWELELADGDIVEVRPVFDLVKEYLDTTWDPESTAEVTGTEPEAVTNLAEQFADNKESTLLLTGMGPNQYFNGDLKDRAAFLVASLTSNVGTHSGNVGSYAGNYRAAMLNGIPHYHLEDPFDPELDPDADSRVDSRITMESMHFYSNLDKPLKIEGEYHMGDSHMNTPTKSLWVAGSNSILGNAKGSYKIIEGLLRTGKLEAFFCNEWWWTMTCEYSDIVFPADSWAEQNVHDLTASVTNPFLMVFPETGIDRVYDTRHDCQIYQGVAEKLAEKLDEPRLEQMWEFIDEDEYRGKPYVQRILDNSNMTKGYDAETLIEKAERGEPALMMSTTYPKKIGTRQANDDEPWYTKTGRLEFLREEETWTEVGETLPVHREAVDGTIYKPNVIVDDGDHPLIDPETPDDLGWDDDNIEDASARQVRNEVVSTDALVNSSHPLQDVDPGFKYSFMTPKYRHGAHTFCNALPNIAVWWGPFGDRDRKDDRKPYFGEGYVEMNPEDAKEEGFEDGDYVWVDADPNDRPYPSANGDPDEYSRALMRVRYQPAMPRGVTRSWHNLNQASHGTTEATPDRTGMAKNEETDYVSLYRRGGHQSMTRSWLRPTILTDEMNRKGLMGQSIGKGFAPDVHCANGAPRESFVKFEKEGDAGEDGEGLWRPAEMGLRPGYETETMQRYLDGDFTSTEGD - ->NxrA_planctomycete_KSU_1_ZP_10101005 -MKLTRRTFLQVTGATGATFTLANKAMAFRLLKPAVEVGNPLDAYPDRAWESVYREQYRYDRTFTYCCSPNDTHACRVRAF -VRNEVLMRVEQNYDHQNYADLYGNKATRNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQWADDGFPELTPENKSKYM -FDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGARKLLDQGYPKEMVDAMKGAGTRTFKGRGGMGLLGVIGKYGMY -RFNNSLALVDSHNRGVGPDKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLVIQTGKNLIENKMPEAHWL -TQVFERGGKLVVITPEYSPSAQKADYWIPIKCNTDTALFLGITRILMDEKLYDADYVKKFTDFPLLVRTDTLKRLQAKDI -FPDYKLEDISHGASYKIHGLHDDQREIIGDFVVWDAKTKSPKAITRDDVGDKLVAKGIDPALDGTFKVKTVDGKEIEVMP -LFEMYKIHLKDYDIDSVVEMTNSPKELIVRLAHDIATIKPVAIHYGEGINHWFHATLFNRSTYLPLMLTGNIGYPGSGSH -TWSGNYKAGNFQASKWSGPGFYGWVAEDVFNPNLDPDAPAMDLKVKGRAYDEEVAYWNHNDRPLIVDTPKYGRKCFTGKT -HMPTPTKIMWFTNVNLVNNAKHVYQMLKNVNPNIEQIMSNDIEMTGSIEYADFAFPANSWAEFETHEITTSCSNPFIQIW -KGGIKPVNDSKDDVMILAGMAAKLGELLRDMRFHDVWKFALEGRPEVYIQRLLDGSTTTKGYSFVDIINGKYGEPGVALL -LYRTYPRHPFWEQVHESIPFYTPTGRLQGYNDESEIIEYGENFIVHREGPEATQYLPNVIVSTNPYIRPDDYGIPEDAEH -WDERTVRNIKKSWAETKKTKNFLWEKGYKFYCVTPKSRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHMNP -EAAKDLGINDGDYVYVDANPADRPYEGWKPSDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHETRPDGRA -LSAGTGYQSSFRYGSQQSITRNWSMPMHQLDNLFHKSKTSMKFVFGYEADNHGINTTPKETLVKITKAEDGGIGGKGLWD -PAKTGYTAGNENDFMKKYLNGELIKVEKA - ->ACTB1_Sideroxydans_lithotrophicus_ES_1_YP_003523268 -MMTENDFNRRDFLKVLGWGGTAVALSGCGNTSIQDGQETVTSYVELPSYVIPSISNYFNSTCAQCDAGCN -IMGRVREGRVLKAEGNPNSPINRGKMCGLGQSGVQAHYNPDRVRQPLLKGEAITWDKALGVIAQNLSAVK -GAEVAFLTGGMSGHVQALLGNYMDALGSKNHFSYEAISPAVLRAANKKAYGVSMPRYRIDKAKVVVSFGA -DFLGAWVSPVHFTQQYAQFRKGNRPEGRGVLVQIEPKMTLTGANADRWIAVRPGTEGVLALGIINALGKA -GLSIPADIAAVSNAYTAERVSGETDVSAEQIGKLAALLKERTPSLVLAGGAVEGYAHGSQNATAIALLNR -VLGNVGKTVEATASVPFPQIAPTVGNRSSLIGLNDGLAAGKYKVVFSYGVNPVFSAPASLKFRDNFAKAE -FKVAFAQYMDETALAADLVLPLDSAMEDWGTVVPEYMAAPAEDHSAAYAQMSFRQPLMQKVFPDTRGVGD -ILLALLKQREADKYKEFEDFYSYLRSAVLKNKVALGGKATDDDETFWDNTLSQGIVPFKGIANPVSAKAS -AAGLKLPSAVTADSSYPLRLIPAVSASMRDGRNANEPWLQESPDPLTTIVWDSWVEINPKTAAKLGIVEG -DIVEVASKSGSIRTQAYLFPGIHPDAVSVPVGYGHEAMGRYAKGVGANVFGMLDTVFDKETGELALNETS -VKISKVGQRVIIVKEEGPVGGSQDGKKKIAVQVSADKVDLSKEV - ->ACTB1_Gallionella_capsiferriformans_ES_2_YP_003846257 -MIDSGSVKQMAGHPFDRRDFLKVLGWSGAAVALSGCGNTSVEDGRETVVSYVEANDYMVPGIGVYFNSTC -AQCDAGCSVNGRVREGRVLKLEGNPDSAINKGKLCGLGQAGVQHHYNPDRVREPLLRNGNKGEAISWDKA -YALIAEKLAGVQGEEIAFLSGGVSGHLKVLLGNYLDSLGTKNHFVYEAIAPSVVRAANVKAFGVEMPRYR -FDKAQVVLSFGADFLGSWVSPVHFSQQYAQFRKGVNGQRGVLIQVESKMTLTGANADRWLAVKPGTEGVL -ALGIINALGMATGDVAELVKGYDKARVSRETGVSTGQIDKIAALLKLRSPSLVLAGSAAEGYAHGSQNAA -AINLLNQVLGNVGKTIEAPVSVPFPQMAPSKGNTVALKNLNDGLAAGKYKVVFNFAANPVFTAPGAFKFK -DNFAKAGFKVAFAHYLDETALQADLVLPLDSALEDWGTQVPEYLTEGAQINIQQPLMERLHADTRGMGDI -LLSLIKQKKADEYKGFEDYYAYLRGAVLQNKGALGGGGVEDDTFWNDTLTNGIVKLAGTTTSLAAHASAA -GLLLPAEAEADEHFPLHLIPGVTASLRDGRHTNQPWLQESPDPLTTIVWDSWVEIHPKKAAELGIVEGDI -VEVTSKTGSVKAQVYLFPGIHPEAISIPVGRGHDAMGRYAKGYGVNPFQIMDAVFEAATGELAMHETRVK -ISKTGQRVLVVKDEGAAGALQMGRKIAARVSTDQVDLSKEV - ->QrcB_Desulfatibacillum_alkenivorans_YP_002430439 -MKLNRRNFLLVSTAGAAGGAVGSMFSPLSWKLMDDSSIWTQNWPWTPVPADGEVSFEETTCTLCPGGCRV -KVRKVDERPIKLEGVEGGPVNDGGICILGLTALQLLFGPARVHTPMKRAGKRGEGKWVEITWEEAISEVS -GKLAEIRETGRAQDLGCIAGGGKGVINALFSRFMEAYGSPNFYWQATAWDCYEENILRTLGLNGTAGFDL -ENADYILSFGAGLLDGWGSPVHVFQAHSKWRENHDGHATLVQIDAQLSNTAAKADKWLPIVPGTEGAVAM -AMAHVIISKNLYNRGYVNWNTTGFRDFYRTVESEYAPAKVVKIACPVDNKEYQKKWLEELESRAIAFAKA -DKPLAVAGKGNGDRPVSQAELNAVQALNALVGAINRKEGGMVVLPDEPKYPWKPVVMDAEARSYKPSLVS -VRGRSKYGHSNLVSVLPQALNSSHEGLKVLLLAGSNPLYTLADTEKTAEALQKVEYIVSFSSQFNDTTAY -ADIILPDHIFLESTVDAPTPPGFAKPVYGLAEPVIKPVYKTKAMGDSIIEIAKAMGGTIAQSFPWADSAE -AIEQALGGKWPLLKRGGVYVNEDFTPETEGVRFRFFARSGMESRISIQGKAEQYPLIATPVDCIRLATGA -LADTPFMVKTVSDKKLKHKELVVQVNAMTAQQYGFKEGSEAVLETPVAKAKVRVHCSEEIAPGLVGVPRG -LGHIAHDEFVGGKGTNYNTLISPVQDPATGFDVAWGIRAKLT - ->Gemmatimonas_aurantiaca_YP_002761548 -MIAPSATTDHRPSTTMTTEAGTGVKRREFLKILGATGATTAVVGCSSEKVGKLIPYVTSPDNTVPGVSQY -YATSCRECAAACGVLAEVRDGRPIKLEGNPEHPLNRGAICATGLAGIQGVYNPDRYRSPMVREGNALKPT -TWDKAYELLAQKLGEVKSKGQAGNVVFVNQHETGTFPGFLDQWLSAQGMPAHLSVDSTAPIATIAANQKA -YGAAWPALNFSAAKLVISFGADFLDGWGHSVPQQLDWADARSKLDVAPRLVYIGARRSLTGLNADQWIAA -KAGSEMAICAALTGTGSAAAAAEAANVPVATIEALVKAVADAGNGIMALCGVTGNDAVECGVMVAEINKK -GGAVGTTINTAKAHGSYTGLASYADLAAAVKNMDAGTVPLAFVRGANPAHTMPKSAGFAAAFAKVAFKVS -FSSMPDETAQLADLVLPDNHWLESWGDAVGENGQISLQQPTLDPVFDTRATADVLIDLAKKDQTLAARYN -VANFRSWYISQFPGGASAFATALTKASVSGAPLVATSTRTLATTALPVAEGAGEFFVQVYPSSTLGDGAG -ANKPWLQELPDPVTKIAWQSWIEVHPSTAKKLGIKEGSHLTIETAAGKVTAPAYIYMGVRTDTVAIALGQ -GHTAYGRFAQNIGVNAYDLVSHGWDSAGSLAIGSVKGKVTVSADSSPLVTTEGSARQHGRGIAQAMTLAA - ->ACTB1_Cytophaga_hutchinsonii_YP_678817 -MKDNNKVFWKGVEELGNSPEFVKNAQNEFPEFLPLKNSSEESNGTDRRDFLKLLGFSVAAVSLAACEAPV -KKAIPYLNKPEEIEPGIANYYASTFVDGGEYCSVLVKTREGRPIKIEGNKLSSVTKGGTNGRVQASVLSL -YDTARIQGPLIKGAAATWADLDKQVGVQLGAIAATGGNIRIVSPTILSPTTKKAIAAFKAKYPSTEHVQY -DANSSYGILKANQTSFGQAVIPSYDFSKAEVIVGFGADFLGTWISPIEFVSQYADTRRLSKTKKTMSQHF -QFETALSLTGSNADYRQPIKPSQEGLFIAELYNKIVSSKVSTTPVKNDVLDKAAAALLKASNRGKSLVVS -GSNDVNVQILVNEINLALGNYGTTISLATPSFQKQGNDEAMNTFINDAVAGKVNAVIFYGSNPVFDHARG -AELAKALSSVSLTVSFADRVDETAALTKFVAPDHHYLEAWGDAEPRAGFYSLGQPSISPIFKTRAAQESL -LLWSGNSGDYYEFLKSNWISSILGGASWDQALQDGVFEPKNKSGVEVTASSFDRSAVEAGIIKNYPANTS -GIELKLYEKIGLGTGSQANNPWLQELPDPISKATWDNYVAVSASYAKANALEQGDRVAVKSANYSVELPV -LIQPGQAGNTVSIAIGYGRTHVGKCGDGVGKNVYPFARFVDGSVLDFVTGVSVTKLGGDKYPIAQTQTHH - ->ACTB1_Leptospira_interrogans_serovar_NP_713447 -MDQKNFQKEKKAHWLSYDLKDKDEEVKEMQKSEFFTSPDPLIARIKSGEFDRKSFLKLMGAGVAMTSLNC -IRKPVEKIVPYVDLNKTDENSQYDFVKHGHSYYYTSVVAGTGVLIKARDGRPLKLEGNPDHPVSQGALSA -AGQASIFDLYDPDRAQNPATIEGGIEVKSDWATVDAKVKSALAANKGKTVVVTKLLDSPSTQSIIGDFLR -TVGGGKHYEISLTSAEEVVSKGQAASYGKAIVPNYHFDLANVILSIDCDFMGNWLSGEEHQKDFSKRRNL -RPNGSLKQNNLADVNLFIAAESVPTMTGSNADLRLAIRPGDQTKLALAIAAALGELGANTKDALNGATLS -ALVSELGVSEENIRKTAKALWSNKGRSLVVAGSLAATTKDAVDLQILVNLLNSVLENDGKTVDHSNPKKE -GLADSSGNLKSLAAELKQGKVGVLFVNDVNLVYQAGEEWKNLLHQAALVVSLSDRADETALSSNVLATTT -HFLESWGDAEVTKGIFSIQQPAIRPLFNSRSFEDSLIAFAGGSLGGEASFYEYVKNSWIKKLGSKRNWED -LLRTGTTVTASERKKVAGPSRNFNRSSIKKIESSSTGLKLSLFETIAIGDGKAANNAHLQELPDPVTKLT -WDNCILLSPALAKEKGISSNDVLVLKTAKQTIELPAQIQPGMHKDAIAIAVGYGRTAAGAVGTGVGKNAY - ->ACTB1_Bdellovibrio_bacteriovorus_NP_96849 -MKKALRPKVERDTKYWNSLEQWSNDPEFNKIASTEFQSSPLRESDDEGGWARREFLKLMGASLAMASAGC -IRRPVQKIVPYNKQPEEVTLGMANYYTSAYFDGSDALGVLVKTREGRPIKIEANPGHPFSISGLSIRSQA -SLLSMYDPERLKGPQRNLFNEKKSNSQVIDVKWEDLDKKVAEQLKKGDVVILSGNVASPATRAVIGDFAQ -GFKAKHVVWEALSNDDVREGQKASYGDDVVPAFRFDKAKMIVSIDADFLGTWISPTAFTNQFVEGRKDIK -NMNRLVSFDSNYSLTGANADIRMKIKPSQQLDVVMGLLHEIIVKKGASSHAGNSAVKAALAPFADVAKKL -NVEPALFAKVAADLWANQGTSLVVAGGITTLTEKSKELQVAVNFLNSILGNDGKTVDHNGGNKGDKASQA -DMAALIKDMKDGKVKTLIIHRVNPGFVLGADMGFAEAIKKVDLVVYTGDRIDETGVFADYITPDNHALES -WSDMELASGVYSICQPSIRPMYDTRSFQLSLMTWAYLANMGPSRLRDYETFYDYLRVFWKSDIFPKYGKG -QSFEDFWQTALQKGYVGEINSGSSSRSFKVDAFTSIKPAAAKEGFELALYSTSQHGDGSLANVSWLHELP -DPVTKAVWDNYVMVSLATAEKHGLKQATVVELTVGGKTLELPVLIQPGLHDDVLAVAVGFGRTRAGKVGN - ->ACTB1_Gluconacetobacter_diazotrophicus_YP_001602862 -MPSLDGLPGDEREWIGRFPHLEQALAHPLDRRRTLKLMALALAGGGLAGCDPGTPDRGFVSAVRAAPGVI -PGVPNVYASAHVRDGYANGILVTHQMGRPTKVEGNPGHPSSLGATDVFAQAAIQDFYDPDRASGPLHDGM -PAAWQEVTTALQVLRAAPNGGVPQGASGLRILTGTVTSPTLGAAIDALLAAYPGAIWHRWDAIGRDTVRQ -GAELAYGRPAMVIPDLRQVDVALAVDSDLLDSAPGHLRHARAFAGRRNPVQGPMNRLYAVEPTPSLTGVA -ADHRFITAPAACDEIIGRLAAAVLRNEAPSGGPDWLGAVVADLRAHPGRALIHLGPDHGAQAQAAVHAMN -EALGGRGRAFDVFDAPDHRPARPTSTLPALMDDMENGRVRALLILDVNPVYQVPRFAAALPRVPLSVALA -DRPHETAQAARWHVPLAHGFEEWGDARADDGTATILQPQAMPLYGGVSAATILHLCAGDVARPARDLVRQ -TWRQHLPSERDWRAALAAGVVPGTASARLDTPLAPVMPPAPPPAPPVDLTLLLRPDPHLWDGREANNPWL -QELPRPLSKIVWGNPLLIPPDLARSMGLRNGDEVALSVGARRAVLPIWVQPGQASGCVVGLLGSGRRRAG - ->ACTB1_Methylobacterium_sp_4_YP_001772545 -MPPLSGPRTVSRREALRAFAAGITLAAGACAKPDEEIVPYVVQPERVTGGVPLVFASTLPLAGYGRGCRV -RSVDGRPIKVEGNPRHPGSLGATDVFAEAAVLSLYDPDRSKTLRQGGDIGTWSALQRALVAKVAAWRETR -GEGMRLLTGRVTSPTLQRQIARLLDAYPRAAWHAHEPTEDASARAGAALAFGRPLWPVPHLDRAAVIVSL -DADPLGPGPDQIRNGRGFGSRRVPAAGEGFSRLYAVEAAPTLTGAKADHRLALPPHRIGEVAVALARALG -ADLRAPTLPEEAARLAARAAQDLRARRGAALVLAGPTLPPEIHALAHWINGVLGAPLDWIEPPDLIGGRA -PGTLSDLARDLAAGGVQDLVMLGVNPVYDAPADLALAERLGRAPFRLHLGPAVDETAVLATWHVPETHPL -EAWGDLRAVDGTASLVQPLIRPLYATRTAEEVVCALLGEGDAASYDLVRETWRPGREAGFEEWWRRALHE -GVVQDSAAAPVATGSPRLPDPGPPAAAQDLTLVLRPDPGTWDGRMANNAWLQECPAPLTKQVWGNALALA -PDEAARRGLAQGDLVRVAAGGRSIEVPVATVPGHAAGVASLTLGHGRSRAGAIGNGIGASAYALRREDAL - ->ACTB1_Ralstonia_eutropha_YP_298623 -MTRARVIPLVPVDEPSDAPRSPARRHFLRTTMAASAALAGAACSGPPAEMIVPYVQMPEGIVPGRPLFYA -TALTRHGYGMGVLVETNMGRPTKIEGNPRHPASLGATHPFDQAAVLQLWDPDRSQAPYRGGALSGWAAFD -AALATQRVQWRDRDGEGLRLLTGNVGSPTLSAQIAQWLDRYPKAVWHVHDPLYDEDPSPRMAFGDDVDLL -IDPKPATTIVTLDADLVGHGPAAVRHAHDFMADRRGVAPMLACRLYAIESSPTLTGEISDNRLALPPHEI -ERLAWSLARKLGVPDVPVDTPEPASDTARHWIAVLARRLREAPPGSSLLIAGGALSGPTRALVWRLNARL -GNLGKSVRPVAGTPRRPLGEAHSIGALTEAMRAGAVSALLMIDVNPAYDAPCGLGFDAALRHVPWSSHMG -VYRDETARLTTWHAPMAHDLERWSDARAWDGTASIVQPVIAPLNGGRSAHELLSAAVDEHQSGYDLVRAH -WRARQRDDFDAFWEQALRTGVIADTAAPPATTDMRQPITPPSFAAPPLVARFMPDPATDAGELANNAWLQ -ELPRALTRHTWDNAALIGPLTARARRLSTGDIVVIRRTDRQGNPIEAPVWVLPRHAEGVVSLPLGYGRRH - ->ACTB1_Chloroflexus_aggregans_YP_002464666 -MTQHQSDLEAIRAQLRDARGPQFWRSLDQLADSPAFRELVEREFPRGASEMSDGMSRRTFLKLMGASLAL -AGVTACTYQPRQYIAPFDRQPEGRIPGVPQYFASTLTLGGYGTGVLVRANEGRPTKVEGNPRHPASLGST -DLFAQAEILTMYDPDRSTTVLRQGVPSTWAEFTTTLANALTAAQATQGAGVRLLTTTVTSPSLAAQIEQF -LQAYPQARWYQYEPVNRDNVVEGARLAFGRDVTTRYDLAAAQVIVSLDADFLAPGPGFIAYARAFADGRK -VRKDSTGMNRLYVIEASPSTTGTAADHRLALRADAIAAFAGALAHELGIGGAPATLAAKAEEFLKAIAKD -LEEHRGRSVVIAGDQQPPIVHALAHLINAELGNVGKTVFYHEPVEARPTNQTNELVTLVSEMAAGRVELL -VMIGGNPVYNAPGDLRFAERMATVPLTVHLSQFVDETSVQATWHIPQAHPLESWGDARAFDGTASIVQPL -IEPLYGGKTANELLAAMLGQPDAESYDLVRGYWEERIGNTNWNVALATGVIADTSAPVINPTLNEAAIRA -TAIPQPGDGVEIVFRPDPSVFDGFYANNGWLQELPRPLTKLVWDNAALMSPRTAIKLLGLPFSADRLVGN -EADDRERQRYLEQLSKVNGTIARIEYRGGVVELPIWLLPGHAEDSITLNLGYGRTNAGRVGNGVGINVYP - ->ACTB1_Nitrosococcus_oceani_YP_343269 -MAGSSIKPLDLAPIRARLAEAQGRAFWKSLEELAGSEEFERFLYQEFPFFRELSQASLSRRDFMRLMGAS -LALAGLSACSTPPPEEILPYIRAPEGLVPGESLFFATAMPLDGFATGVLVESRMGRPTKVEGNPLHPASL -GGTDIFAQASVLQLWDPDRAQVISHRGEISTWQTFLAAMGEKMRTFEGNQGKGLYLLTPTVSSPTLISQL -RTLGKRFPHAHWHQYQPINQDNSYEGARLAFGESLETRYHLERAEVILSLDGDFLGSLPGHLRYARDFAK -KRRVDSAQSTMNRLYVAESSPTITGTMADHGVSLRASQIEVLALQLARALGIGVPRREETASDLPEQWVR -AVAEDLRQHRGTSLVITGEKQPPFVHGLVHAVNQALGNVGTTLTYSAPRAFNPRNQNESLNHLVAQMDAG -KVDTLIMLGGNPAYNAPADLAFSKQLAKVKSSIYLGLYEDETAAHSHWHIPETHYLERWGDARAYEGTVS -LLQPLIAPLYQGKSDYELLAVLLGQTDRSDYDWVRGYWQKQWPKSDFKSIWNQALQAGFIEGTALRSKSV -KLRDDWVAHLSRGQSKSKETSGMEIIFMPDPTIWDGQFTNNGWLQELPKPLTKLTWDNAALISPRTAENL -GLANEEVVALRYQERQVQAPIWIMPGHPEGAVTVTLGYGRAKTGQVGAGTGFNAYALRSSRAPWFGWGLE - ->ACTB1_Candidatus_Solibacter_usitatus_YP_821785 -MSDPRNQLDLAAVQKRLEGARGRDYWRSLDDLAATPEFQDLLEREFPRQAVGWADDEDANEGRRNFLKVM -GASLALAGMTACTRQPTEHIMPYVRQPEELIPGRPLFFATAMTVNGVANGLLAESHMGRPTKMEGNPEHP -ATLGACDPYSQASVLQLYDPDRSQALTFNGEIRSWGRFTGELREALALQKTKNGSGIRILTETVTSPTMA -AQLRAIQQVYPSSKWHQWDPAGPHMARAGSVQAFGQPTNTYYDFTHANVVVSLDSDFLASGPGYLRYARQ -FSARRRIHEPSDSMNRLYVAEPMPTPTGTKADHRLQLRAGDIEEFAWGLAISLGIAEGPKNGENHDIYKW -LGPMARDLQSNKGASLVIAGAHQPPIVHALAAIMNEKLGNVGKTVFYTDPIEANPGDQLASLMDLVKDLD -AGAVDVLLILGGNPAFNSPVELGMRDRLKKAKLRIRLGLYADETTEVCQWQVPEAHFLETWGDARAFDGT -ITIQQPLIQPLYNGRSALQLLQNFTDQPESSPYDVVKGYWRTQHQGADFENWWRRAVHDGFVANSALPTK -TPTVRGEALSARAGARHLGGKLEVIFRPDPTIFDGRFANNGWLQEMPKPVTKLTWDNAAILSPYDANRFG -VQNGDMLKLTYDGRSLNAPVFIQPGHVNGATTLHLGYGRWAGGRAAKGMGFDPYGLRTSKALWQDVGMDA - ->ACTB1_Candidatus_Koribacter_versatilis_Ellin345_YP_592078 -MDNGSKKNGADVCPSKKGKLELADVKQQLAAAKDGPQYWRSLDELSNTDEFQEMLHREFPRQASEWVDDG -GSSRRDFLKLMSASLALAGLTACTKQPIEPIVPYVRQPEELTLGKPLFFATANTVGGYAVPVLAESHEGR -PTKLEGNPQHPATLGGTDVFTQASVLTMYDPDRSQVVMLDNEIRTWGSFVGAVANPLAAQKAVQGAGLRL -LTRSTTSPTLGAQIKQLLQTYPQAKLVQYDPAGRDNARAGSQLAFGQYVETQYNLDKADIILSLDGDFLS -SGFPGFHKYARNFSQRRQPDLKEKMVRFYMAESTPTNTGGKADHRIPMRASDVEQFGRAIAAGIGVAGAG -GSAKQEWQNQVAAIVSDLNKHKGAAVVVVGEHQPPAVHALAHSMNAALGAVGTTVTYTEPIEQIPADQTA -GLKELVADMNSGKVDLLVVMGANPVYEAPADLAFLDAFKKVAVRIHHGLYVDETAVLSHWHINGTHFLEQ -WGDVRAFDGTVTIQQPLIAPLYNGKSQYEFVAALNGQGSTSGYELVKGTWQKQHTGADFEAWWRKAVHDG -LIAGTAAPAKTVSAKGAPAATNAASDSAMELIFRRDPMIYDGEYSNNGWLQEAPKPITQLTWDNPIEMNV -TQAEQMGIKTEDELEITVDGRKIVGGAWLTPGHPKNSVTVFLGYGRTRAGRVGTGTGYNAYQARTSDKQW - ->ACTB1_Anaeromyxobacter_dehalogenans_YP_002491266 -MPSLGLPIYGQKQGAGLDARRWRSVEEAAEAREVPPGEFPDDAAAVPEGFTRRGFLQVLGASVALAGLEA -CKPPRENVVSYVRPPAGVTPSLPSAYATVASRGGYAVGVVVTSHEGRPTKIEGNREHPSSRGGSDAMLQA -SILDLYDPRRLKGFTRAGRPLGFATLLREVSALARSHAQDGGARLRFLVEPTSSPAVADLRRRILERFPR -ARFDAWAPVGADAGRAGAAIAFGKPLDAAASLADADVILSLESDFLALEGDSLRLAREFGARRTAERMNR -LYVAESAYTVTGGAADHRFRMRSADVLGFGRAVAAELAAKHGLAQLAPLGAPAGGERAKAAAAVAADLAR -ARGRSAVLAGDRQPAAVHALAAALNGALGNAGKTVAYRPTALLDPAAGPDRLRALAGELEAGKVDALVVT -AWNPAHTAPADVPLRKLLPKAKDTIALALREDDTVRLATWKIAATHPLEAWGDLRAADGTASIQQPLIAP -LHESLSELELLAAFLDEGDHGTWRIVREGWRRRAGEAGFDGRWDGWLAAGVVAGSAVPPEPAQADLARVA -EAVRAVAAPGASLELGFAADYKVLDGRFLENAWLQEYPHPITKLTWDNAAQLSAATAKQLGVESGDLVEL -SWRGRTLTAPALVVPGHADGSVLLTLGYGQALSGPVGKGVGHDAYALRTSDAPWFGAGVEVRKTGKRHPL - ->QrcB_Desulfococcus_oleovorans_YP_001530428 -MKIDRRSFLTLLAGGAVGTALSPMTIKLTDDISIWSQNFRGTPIEVPVPERGPASYVDSVCTLCPGGCGI -SVRKIGDRAVKIEGKAGHPVNNDGVCALGLSGLQLLYGPWRVTGPKKKENGRWKKISWDRALSEIAEKLN -ELREAGKADAIAGISRTGRGTVARLMQRLLAAAGSPHFLPVPTNENAYSDAVARMFGKPGTVGFDFENSG -YVLSFAAGLLDGWGSPVHMFSAHSQWKTNGVKMVQVESRLSSTAAKADQWVAVKPGTEADLALGLAHVIL -RDNLNAGAAANSRAFDSFAALVKKDYTPARVAAATGIKESVIVALAKEFAAASHPVAVCGRGDGQTPCDS -REVMAVTALNALVGSVNRQGGMIIGPEPDYIQWARPVLDDTAQKGLAKGPKTLADLLAGKTPDVQALFVL -EANPAYTLHDTTKVKAALEAVPLVVSLSSFMDETSALADYILPLPTCLERTEDVVVTAGLKTPMIGLTQP -VVEPRLDTRHPGDVILDLAKAMGGTVAESFAWSDYQDCLEKTFGLVYGKLATEGYLQKSVLETLIDTAVA -VGRADFAPVVEADKKVRQNTPALVLAAYDAMRVAGGAIATPPYAMKIVPDTILKKNDLYVEINPETAQKA -GLADGKAAVVETPAGTAQVRVRVTHEVAPGMVAMPRGFGHTAYDDYVSGKGVNVNDLIGPVPDPVSGLDT -AWGAPAKLIKA - ->QrcB_Desulfomicrobium_baculatum_YP_003159879 -MGLDRRSFISLVAGGVAGSLFTPVIWKTLDDVSIWTQNWPWIPRLQYGEELTVPALCKLGADAYGLKVKT -IAGRPVAAEGNPDHPLSLGGICPLGAASVHLLYSPSRVKNPKLRDGSSFKDITWEEAEELLAGKIKEAGA -SMAMISGDETGSVTDVLSGLVGKAGSDKSFFMPGESAPAAAALAMLGGDGQVGYDIENANYVLMLGADAL -GSWGNVARNGKAFSASREKGVKFVYVGPAQNGTSAVADSWIPCAAGTEPVLALGIAAVIAGTNRDRSFWP -GFASFAKFVQTSYPLDKVAEITGVSAATITGLAQELVRAGRPLVLTAAEAGQGLGAFELAAGMSLNMLLQ -RVNTVGGVRILPWAPKVVEAAADKKAMLANDLVAYLSTVADGGAEAPALLMVYGANPAYALPNLVKAQAA -IDKAGFVVSFSSFMDETAAMADLIMPDSYAFERLDDAYSPYGSGQPNYTVAAPVIKPVFDTRPAGDVLLS -VAAKAELDLGFETFEDVVKAKAEALGADFDEMVEGAVWVSEEFPAQDLALWTTPLQELAVAAQDGKTLAL -APVLRLKIGSSKIAIPPFNTNAIRFDEMLGNDMYVLINAATAKNLGLKKDDAVKLASSGGECKARVRIFE -GVMNDTVVAPLGLGHTAWDAFSSGKGDNVYKLLAADTETETGLSRFATVRVTVSKA - ->QrcB_Desulfovibrio_magneticus_YP_002953179 -MGLDRRAFLGLVAGGTVGAMFTPIPWKLIDDASIWTQNWPWIPRVPKGQVDYVATTSKLCPAGEGLKIMR -VAGNPILAGGNPSHPLSCGGVSALARSEVYMLYSPARIKSPMKRNGKTFAPITWEQALVEMAEKLGAAKG -AVASISGDNTGTINEVLTALTAKLGSAGSFMMPSEATTAAKAMKLMGAQGQAGYDFENADTVLVLGADIF -ETWGTSSRNRKAFGANRPAGAKPANTYVYVGPSRNNTAAVCDQWVPAAAADLGVVALGIAWHLLKAGATS -NAPGFDTFKAVVNGGFGPEDVKRATGVAPETLAAIAKALASAKAPLVVTGSPFGQGLGAAPVIAGMSLNM -LLGRINKPGGVYMLPELPSVVPGALTRAAMLDGDLPAFLKGVESGKTPAPKALLIYDANPAYGLPEAATM -AKALEKIPFKVSFSSFMDETAALCDLVLPNSLPLERYDDVATPYGSGFCVYSLVRPIQKPICDTKTTGDV -LLGLARKLSIDLKFDNFQQVIKEKVASLAKVSGGFVAKDVMPWQVAAGKPAPALVGGDLWKALEAGYAWT -MVGQAAQTAMGFAAEVVAKAVKAGKPATATVLAPYAQLRTGTPVTGMPCQDLTTVPDTELLGDTTFIRVN -SETAKTLGLKKGQMVKLSGAGVDCQAKVHIFESVMPGMVSAPLGFGHTAFDYYSQGKGANYLSLAAVVEE -PGSGLSMWIAPEVKIA - ->QrcB_Desulfovibrio_vulgaris_YP_967712 -MALDRRGFLKFIGGATAGILATPVVWKGLDDVSIWSQNWSWIPRNIKGANSYVPTVSKLCPTGVGVRVRL -VDGRPVRVIGNPEHPLSKGGVSSIAAAEVQMLYSPARMKRPLKRSPDGAYVMISWEEAEAMLLDGLKAAK -GGDALACISGDDNGTINELLSAFVQQSGSKSFFLMPGEAQPAAKAWDLMGGEGQIGYDIEKSDFVLAIGA -NVLEAWGTAIRNRHAFGASHPHGAEPTAQFVYAGPVLNNTATGADDWLPIRPGTESAFALGLAHLLIKAG -ASSSAPDFDAFRSLAASFSPEKVAAQTGVDAKALTALAQALAKAKHPLVIVGSEFSQGAGAAPVMAGIAL -NMLLGSVNRDGGLRALPVARKVVPAGMDRKAMLQQDLTLWASAIASGKAKAPKAMLVYEANPVYALPQGS -AFKDTLAKVPFKVAFTSFLDETAMQCDLVIPVSMGLERLDDVCTPYGCGEVVYSLATPVTAPLFDTKPAG -DALIALGGKLGLDLGVASFEDMLKAKAAAHGADFDKLAEGTAFTSRATVGANLSFRPDVLSKALDVKAPA -LPLALAPVMKLNMGTSKTAIPPFNTKTIRRWEVQGKEGYVMLNGATARKLGLAQHDRVVLSNPTGKVTVR -VNIFEGVMNDTVAMPLGFGHTAFDEFSKGKGENVMHLLAPSTEPVTGLAVWTGAGVNIAKA - ->ACTB1_Mariprofundus_ferrooxydans_ZP_01451016 -MSENKSSSNWTRRSFIKAMGLGGAAGSALVLSGCGDTDIINEVDIEVRKEKVEPNVDPQDYVRPGIEMYY -ASTCRQCPAGCGVHARIREGRVLKLEGNPVSDVNHGRLCPMGQAGLQSHYNPDRLTKPMLRKGGKLVEIS -WDEAEDVLRKNLGRKNAKLAWLSGATSGHHRALVDAYLAAAGAKNHFVFDTLPPAVGHAANQEMFGSYMP -RLDFDKARLIVSFGADFLGTWMSPVQFSTQYAEFRNAPRGTLVQIEPKMTLTGANADRWIPARPGTEGHL -ALALASLLVQKSEYADRVPADVVASLKDVNVDEVAKLCDIPVERIHHLHHLMTDRSPSLVLSGASAEGVQ -HGFETARAILMLNVLLGNVGETILPRSEDPFPALAPRMGGWSEVKAMVDGLNKGSFDTVVVFGSNPLYQA -PGFMQADKAFDKAKFRISFSMFPDETTMACDLVLPVHSYLEEWNTTMPAYAATDGYLGLQQPVMNPVFGS -HATRSFGDLMLDVLKHMDPNFKQWDSYQAYVMGALWTMRPALVKQYKPSVPGQTEEEAFKQGILSDGFVQ -MKVAKAAKIEAKVSAVTLPAEKANANYPFRLIPSARLGLWDGRHANVPWLQELPDQLTEVVWDSWIEIHP -KTAEKLGVITGDVVQVESSAGKAKVKVVVFPGIHPDAVAIPLGQGHTEYGRYAKGVGVNPFSILAALFDG -KTGELATYATDVKVAKIESRGKLVTLANGDLVLESNTSTQAGRELVKTTTAENFDLTEKGA - ->RBG1_1305 -MNNKENPHKKYWSTLSEFHQDAEFKKLKKEEFLSKPQSFFESNGNNDTTFSRRDILKLAGAAAVFTAAACARRPVEKIVPYLDPSEEVIPGKAVWYSSTSGTSDGCGMLVKTREGRPIKLEGNPDHPLNKGTLSAREQAAILDLYDPDRLKHPAKISAGQVLKSDWKSADTEIARSLKSAKGKMVLLTGTIHGPARKRLIREFLFSFSNAEHITFDALSEEEILEAQELCYGNRVLPRYRFDKAEALVFLGADPLASGHSKTEFAYGFGHQRKINSNQMSKVISFEPALSLTGQNADLHYLVKPQDLIKVGLALAHQLIVAEKKSKLASDLLVQNLLENYSAKKVETEIGLPEGTIKSVAADLWLARGRGLVYTGSLTVRDNSALALHLVTNLLNSALENEGNTVDGVQSVSQQSQGSYSELMNLISDMKSGKVEAVLIYGNNPAYGLPQSAGFEEALQKVKTKIYLGDRADETGSLCDFVLPSLHFLESWGDAEPQQSLYSLMQPTISPLHDNRGWEDSLLALMREIKGVALGKEYASWHDFLKDTWYKEIYLKNDLVASFEDFWISVLRQGLFDTVNRSAEKSSPRQFRTTALSNIGKIKNVDSKFTLALYTPAMQFDGRTNNNSWLLETPDPVSKIAWDNYVNIAPRTSVELGLQESDVVSLTVNGVTQEIPVHIQPGIHPEVFTVAVGWGREKVGRVGNNVGVNAFRWSKIQNRHLVSSSLPVEIKKTGKQIKLANVQGHNYINGRPVIYEATLAEYQKNPTAGRAGEEKLTSIWPSHPYE - ->B_Caldithrix_abyssi_ZP_09550397 -MKTKMKRREFIKIAGAGAGSLVVGSKLYASFNSKDEQNLLADGKIERTPTYCEMCFWKCAGWVYKKDGKP -WKIIGNPDDPNSRGRFCPRGTGGIGAYTDPDRLKKPLLRVEKNGKQVFKEVSWDEALDFIAGRMKDIAQK -HGPECIALFSHGSGGSYFKTLLHAFGSNNVAAPSYAQCRGPREEAYMLTFGEAVGSPERTDIINAKCLVL -LGSHIGENMHNGQVQEFSEAVAHGATVITVDPRFSTAASKSKYWLPIKPGTDLALLLAWIHVIIYEELYD -KEYVKKYTFGFEQLKEALKDKTPEWAYPITTIKPHVIRQTAREMAKNAPATIVHPGRHVTWYGDDTQRVR -AGAILNALLGSWGRRGGFYFPSKAHLPKMPIPKFPNVKRDWRKAFPNKYPVAHLALSSGICDATIPSPER -ECSFKGWIVYGTNLPMTLPQPEKTLEAIQHLELLVAIDILPAEITGWADVVLPECTYLERYDNLRLSPGR -VPSIALRAPAFEPKYESKPAYWMARELAKRLGLEDYFPAKTIEEYLDYQLKAIGSSLEEMKKIGVKLLPE -EAQKLYLEDGEDFEFPTPTGKIELYSTILDEYGFDPIPQYTAHEEPPEGYYRLLYGRAPMHTFGRTTNNP -NLHDLMEENTVWINSKVAKQWGIKNGEYITLENQDGVRSTPVKAKVTERIRHDAVFMVHGFGHSDKRLRR -AYGKGADDQRLITRVKIDPLMGGTGMRVNFVTFRKEEA - ->ACTB1_Opitutus_terrae_gb_ACB77208 -MKRKSDHSAPANSEPTGPKYWRSLDELAATPGFQEQLHREFPEGASELNGVDRRHFLKIMAASFALGGVG -LAGCRRPEKYVLPYGKSVEGMIPGLPLYFATAMPLRRTAIPVLAETHQGRPTKIEGNPTYQQHGGSASLL -AQASVLDLYDPERATQHTREGRKLNVADLNEQLAQIGTSHAANGGAGLAFLAEESSSPTRARLLAQLRAR -LPRAIWAEYEPVADEAPVSAATAAFGQPVRPLYRFARARRIVSLDADFLRPDGAGLYYAREFAKGRRVVN -REDAQQMNRLYVAESAFTITGSMADHRLRLASSHMLALAAALAVKITGSAAFAPLSAGLDIDPKWIDECA -ADLLAHRGTSVFVAGAHLPEQVHAIAYAINAALGNIGATVDFVAPPTNDAASIQTLATAIRDGAIDTLVI -LGGNPVYNAPADLDWAALQKSVKNVVRLGYHTDETTVASPAGAHLAAAHYLESWGDARTADGTIVPIQPM -ILPLFGGLTELEVLARIVGANNPDPYALVLETITALAGGDAEKAFQQFLHDGLLANSAYPTVAVSYNAAG -VARLLGAGAGNPAALSKDNLEVRFVTDYKMDDGRFANNGWLQELPDPITKISWDNAILVSPRLARELGVY -PDGSTLQVARVEMAGFHQGKEQAFIGELTVNGRTVRAPIHIQPGLSNYTVVLPLGYGRTQSGHVGRGMGH -DFYPLRTSAGLHFTVGGKLVPTQDVKAMPNTQEHWSMEGRDIIREANVDEFLENPRFVAAFGMESHSPSI - - ->ACTB1_Flavobacterium_psychrophilum_YP_001295304 -MSSNKKYWKSVEELNENSSIVETLRNNEFVEEISTNEFLGDAVTLATSSTTRRDFLKYVGFTTAAASLAA -CEGPVHKSIPYVVQPEEIVPGVADYYATTIADGFDFANVLVKTREGRPIKIENNKIAGANFHANARVHAS -VLSLYDSMRMKTSKIAGKDTIWEQANAKIKASIADAKAKGGKVVLLTNTSASPSTDKLIAQFLVSNPNAK -HVTYDAVSSSEALDAFQTVYGERALAEYDFSKANVIVSIGADFLGDWQGGGFDAGYAQGRIPQNGKMSRH -FQFESNMTLSGAAADKRVPMTVANQKQALVQIYNVITGSSIGSSKDEAVMKAAQQLKAAGSKGVLVCGID -DKNAQLLVLAINKVLSSEAFNTANTRQIRKGNNADVKQLLADMKSGAVHTLIMNGVNPVYSLPNGKEFAN -SLKKVKLSVAFAMKEDETAAVANIAVATPHYLESWGDVSIVKGSYALTQPTIRPLFDTVQFQDALLSWTG -NAQTYYDYLRSSWSGAKSWNQLVHDGVVFTEGISSSAGAGADYNGAASTLAKASSKGLELVLYTKTGLGD -GQQANNPWLQEFPDPITRASWDNYLTISQADATTSGIENWNVANGGLNGSYVTLTVDGVKLEKVPVIIQP -GQAKGTVGLALGYGRKAAMKEEMQVGVNAYTLYNNFSNVQNVSIAKEDGEHEFACVQLQRTLMGRGDIIK - ->ACTB1_Salinibacter_ruber_emb_CBH25246 -MIELDVIDSETAARDEESGARDGSSEPTFWRHWSESDADEDGDDLTEFVPGDSEPPSGASRRQFLQLMGA -AMAMAGLAGCRRPEEKILPYAREPETVTPGIEDHYATSMPFRGVLRPVVAQSNEGRPTKIKGNSDHPSGQ -SGTSPYEQASVLNLYDPDRSRSVRQEGRAASWSDFVSFCRQLGNEADQHQVAVLAEKTSSPTVQAMRQRM -ADRFPNLQWVPYAPTGTDPRRLGMQQAFGRPLRPRFELGEAEVIVSLDANFLDGRTHDFGYHTQGFAEGR -RLDDAEDTMSRLYTVESRYSTTGGSSDHRLAMRAGRIPALAAALAAELGVGEAPDVSWSERERLHVREMA -RDLQAAGEHGVVMAGEAQPPEVHALAMAVNQRLGGLGTTVTLFDPGDDEIQPQDEALADLTASMRAGEVD -TLFMLGVNPVYDAPSELGFEEALSNVRDTVHLGRLRNETAQAARWHLPRTHYLEQWGDGRAYDGTKSIVQ -PLIRPLYDDAHSLIEVLNLAATGVDASGHDLVREQWRAQLPAPFQERWRKALHDGYLEGSGYETASVGTA -TVPSIDAPASDPDEIEVVFRTDSKLLAGRFSNNPWMQELPDPISKIVWDNVAVMSRATADELGVEVQRRE -GSFYADRVELTLDGQSVKLPVWVQPGYPDGSIGVSMGYGRTIASTRESESTPFWDTSDQTNIYNGSPIAG -GVDSSGEPVDVVGGNVAPMRPNGGRVATGANVTQVGSGYLLATTQEEGSMQGRPIVRWATLDEFKENPEF -VNESQPPVPDLGHESGGHGDGGHGDGGGHGGGDGHSGDGAAGNVSGQGLEAGPGADAHGADEMPEQAAHG - - ->ACTB1_Rhodothermus_marinus_gb_ABV55245 -MIELPVVNPDGAETPGSGKRLWRSTADLRRDPEWVKLAHDEFMPGVAEPPSGTSRRQFLQIMGASMALAG -LTACRRPVEKILPYVRQPEEIIPGIPLYYATAMPFRGSVRPLLVESHEGRPTKIEGNPDHPLSRGATGVF -EQASLLNLYDPDRSQQVLRKGEPASWGDFVQFARSLAAEAGTKRLAVLCEPSSSPTLAALRRELERRYAQ -VRWVTYRPEGDDHEALGLQQAFGRPVRARYRFSEARVIVSLDADFLGPTDRNFVENTREFAASRRMERPE -DEISRLYVIESTYTVTGGMADHRLRLRAGDIPAFAAALAAELGVGELREAGARFAGHPYVVEIARDLRAA -GARGVVLAGETQPPAVHALCAVINDLLGSLGRTVILHALDEPATAQHAALAELVQAMQAGAVDALLLLNV -NPVYDAPAALGFAEALAQVPEVIHLGLHMDETARRSTWHLPSTHYLEAWGDGRAYDGTLSVIQPLIAPLY -EAAHSPLEVLALLATGEEQSAYDLVRNTWRRLLAGRGAFEQAWQRVLHDGFLPDSGYPTVSLRPNRQALA -DWPQAAEGGLEVVFRLDPTVLDGSFANNAWAQELPDPITKIVWDNVAILSPKTAAALGVKAEYHKGVYIA -DVIELSLDGRAVELPVWVLPGHPDDSITVYLGYGREITSTRPERKTPFFDLDEYTDMYGHGAIATGVGPR -TWPRCGGPDNTWVAYGAQVRKTGRTYKIVTTQDHGSMVGRPLVRLSTVEEFRKNPDFAKEAEPPLEGLEP - ->TMAO_Photobacterium_profundum_YP_129680 -MNMSVSRRSFLKGLATTSAVSVIGPSLLASSKAMAAETTGTWKTSGSHWGAFRAHVYAGKVQEIKPLEMD -KYPTDMLNGIKGIIYSPSRVRYPMVRLDWLKKHKYSGETRGNNRFIRMTWDDALDLFYRELERVQKDYGP -WALHAGQTGWRQTGQFHSCTSHMQRAVGMHGNFITKVGDYSTGAGQTILPYVLGSTEVYAQGTSWSEILD -HSKNIVLWATDPVKNLQVGWNCETHESFAYLEQLKEKVAKGEINVLSVDPVKNKTQRFLGNDHMYINPQT -DVAFMLAVAHTLYTEDLYDKEFIKMYCLGFDEFVPYFMGKSKDNIEKTPEWAAEICGLPADEIRDFARML -VAERTQILFGWCIQRQEHGEQPYWMGAVIAAMVGQIGLPGGGVSYGHHYSSIGVPSTGFAAPGGFPRNVD -EGQKPKWDNNDFNGYSRTIPVARWVDCLLEPGKEIKYNGSKVILPDYKMMIISGNNPWHHHQDRNRMKQA -FQKLQTVVTIDFAWTATCRFSDIVLPACTQFERNDIDVYGSYSGRGLVAMHKLVDPLYQSKTDFDIFTEL -SRRFGRHKEYTRGMDEMEWVRSLYSDCRDANKAKFDMPEFDEFWAKGVLDFGEGTPWVRHADFREDPEIN -ALGTPSGFIEISSRKIDRFGYEHCQGHPMWFEKSERSHGGPGSKKHPFWMQSCHPDKRLHSQMCESEEMR -ATYAVKGREPVYINPKDAAEKGIKDGDIVRVFNDRGQLLAGAVLSDSYARGVIRIEEGAWYGPLNEKVGA -IDTYGDPNTLTQDIPSSELAQATSANTCLVDFEKFKGEVPPVTSFGGPIEVS - ->TMAO_Vibrio_vulnificus_YP_004189064 -MAITRRSFLKGVATTSAASVIGPSLLASASANAVETTGTWKVSGSHWGAFRAHIYAGKVQEIKPIELDQN -PTEMLNGIKGIIYSPSRVRYPMVRLDWLKKHKYSADTRGNNRFVRVTWDEALDLFYRELERVQKEYGPWA -LHAGQTGWNQTGSFNNCTAHMQRAVGMHGNYITKVGDYSTGAGQTILPYVLGSTEVYAQGTSWSEILENA -DNIILWANDPVKNLQVGWNCETHESYAYLAQLKEKVAKGEINVISVDPVKNKTQRYLENDHLYVNPMTDV -PFMLAIAHVLYTENLYDKKFIETYCLGFEEFINYVQGKTKDKVEKTPEWAAPICGVKADKIREFARMLVK -GRTQILMGWCIQRQEHGEQPYWAAAVVAAMIGQIGLPGGGISYGHHYSSIGVPSTGFAGPGGFPRNLDAG -MKPKWDNNDFNGYSRTIPVARWIDCLLEPGKEINYNGGKVKLPDFKMMVISGCNPWHHHQDRNRMKQAFQ -KLQTVVTIDFAWTATCRFSDIVLPACTQWERNDIDVYGSYSSRGLIAMHRLVDPLFQSKPDFQIMKELTE -RFGRSEEYSRGMSEMDWIRSLYNDCKKSNEGKFEMPEFDEFWEKSVLDFGQGQPWVRHADFRQDPEINPL -GTPSGFIEITSRKIGRYGYEHCQEHPMWFEKSERSHGGPGSDKHPFWLQSCHPDKRLHSQMCESEEFRAT -YAVKGREPVYINPLDAKAKGIKEGDLVRVFNDRGQLLAGAVLTDSYPRGVIRIEEGAWYGPLSEKVGAIC -TYGDPNTLTQDIGSSELAQATSANTCIVDFEKFTGKVPPVTSFGGPIEVA - ->TMAO_Citrobacter_youngae_ZP_06352135 -MLAVGAASALAPNPLISKVWAAGENPEQWIQSGSHFGAFEAKVVNGEWLETRPFKHDKYPCDMLNAVREV -VYNPSRVRYPMVRLDWLRKREKSDRSQRGDNRFVRVSWDQALDLFYEELERVQKTYGSSGVFTGLADWQM -VGKYHKAGGAMDRGLGLHGSYVTTVGDYSAAAAQVILPHVIGSLEVYEQQTSLPLVIQNSNTIVLWGCDP -IKNLQIEFLVPDHDAFGYWQQIKEAVAQGKMRVISVDPVRSKSQNYLGCEQLALRPQTDVALMLALAHTL -YEEKLYDTAFINDYTVGFEQFLPYLLGESDKQPKNAEWAAEICGLTAEQIRDFARLLVKGRTQFMGGWCA -QRMHHGEQYPWMLVVLASMVGQIGLPGGGVGFGWHYNGGGTVTSAGPVLSGLGGIANPPPAKYKADFRGA -SEHIPTSRIVDCLLEPGKKVAFNGETLTWPDIKMAIYSAANPFHAQQDRNRMIEAWKKLETVVVLDHQWT -ASCRFADIVLPVTTRFERNDIEQFGTHSNKGLMALHQVVKPQYEARHDFDVFAGLCKRFDKEAVYRENRD -EMQWIQALYDEGVKMGASLGVSLPDFTTFWQGEGYIEYPAGQPWVRHGEFRDQPDLNPLGTPSGLIEIYS -KTIAGFAYEDCPGHPVWMEPFERNHSAKKNKYPLHLQSCHPDKRLHSQLCSSDAFRNTYAVAGREPLYIS -AQDAAARGLKAGDIARVFNDRGQVLAGVVISPDFTPGVIRIHEGAWYSPQEGGKAGTLCTYGDPNVLSAD -IGTSQLAQGPSAHTVLVEVERYQQKAPQVTAFGGPETVKEEGGSAA - ->TMAO_Salmonella_enterica_gb_AEZ47489 -MKNKDSLHVSRRRFLAQLGGLTVAGMLGPSLLTPRSARAADAVAPGAATKEGILTGSHWGAIRATVVDGR -FVAAKPFEQDKYPSKMIAGLPDHVHNAARIRYPMVRVDWMRKGHQSDTSQRGDNRFVRVSWDEALDLFYQ -ELERVQKTYGPSALLTASGWQSTGMFHNASGMLARAIALHGNSVSTGGDYSTGAAQVILPRVVGSMEVYE -QQTSWPLVLQNSKTIVLWGSDMVKNQQANWWCPDHDVYQYYEQLKEKVASGAISVISIDPVVTSTHDYLG -RDKVKHIAINPQTDVPLQLALAHTLYSEKLYDKNFLDNYCVGFDQFLPYLLGEKDGQPKDAAWAEKLCGI -DADTIRALARQMAGDRTQIIAGWCVQRMQHGEQWSWMVVVLAAMLGQIGLPGGGFGFGWHYNGAGTPGRK -GIILSGFSGSTTVPPVHDSTDYKGYSSTIPIARFMDAILEPGKIINWNGKSVKLPPLKMCVFAGTNPFHR -HQQINRIIEGWRKLETVIAIDNQWTSTCRFADIVLPATTQFERNDLDQFGNHSNRGIIAMKQVVSPQFEA -RNDFDIFRDLCRRFNREAAFTEGLDEMGWLKRIWQEGSQQGKGRGIHLPTFEVFWNQQEYIEFDHPQMFV -RHQAFREDPDLEPLGTPSGLIEIYSKTIADMQYDDCQGHPMWFEKIERSHGGPGSQRWPLHLQSVHPDFR -LHSQLCESETLRQQYAVGGKEPVFINPQDASARGIRNGDIVRVFNARGQVLAGAVVSDRYAPGVARIHEG -AWYDPDKGGDLNALCKYGNPNVLTLDTGTSQLAQATSAHTTLVEIEKYTGPMDNVTAFNGPAEMVAQCEY -VPASQGNPHD - ->TMAO_E_coli_CAA52095 -MNNNDLFQASRRRFLAQLGGLTVAGMLGPSLLTPRRATAAQAATDAVISKEGILTGSHWGAIRATVKDGR -FVAAKPFELDKYPSKMIAGLPDHVHNAARIRYPMVRVDWLRKRHLSDTSQRGDNRFVRVSWDEALDMFYE -ELERVQKTHGPSALLTASGWQSTGMFHNASGMRAKRIALHGNSVGTGGDYSTGAAQVILPRVVGSMEVYE -QQTSWPLVLQNSKTIVLWGSDLLKNQQANWWCPDHDVYEYYAQLKRKSAAGEIEVISIDPVVTSTHEYLG -GEHVKHIAVNPQTDVPLQLALAHTLYSENLYDKNFLANYCVGFEEFLPYLLGEKDGQPKDAAWAEKLSGI -DAETIRGLARQMAANRTQIIAGWCVQRMQHGEQWAWMIVVLAAMLGQIGLPGGGFGFGWHYNGAGTPGRK -GVILSGFSGSTSIPPVHDNSDYKGYSSTIPIARFIDAILEPGKVINWNGKSVKLPPLKMCIFAGTNPFHR -HQQINRIIEGLRNVETVIAIDNQWTSTCRFADIVLPATTQFERNDLDQYGNHSNRGIIAMKQVVPPQFEA -RNDFDIFRELCRRFNREEAFTEGLDEMGWLKRIWQEGVQQGKGRGVHLPAFDDFWNNKEYVEFDHPQMFV -RHQAFREDPDLEPLGTPSGLIEIYSKTIADMNYDDCQGHPMWFEKIERSHGGPGSQKYPLHLQSVHPDFR -LHSQLCESETLRHEYTVAGKEPVFINPQDASARGIRNGDVVRVFNARGQVMAGAVVSDRYAPGVARIHEG -AWYDPDKGGELGALCKYGNPNVLTIDIGTSQLAQATSAHTTLVEIEKYNGTVEQVTAFNGPVEMVAQCEY -VPASQVKS - ->TMAO_Shewanella_massilia_CAA06851 -MNRRDFLKGIASSSFVVLGGSSVLTPLNALAKAGINEDEWLTTGSHFGAFKMKRKNGVIAEVKPFDLDKY -PTDMINGIRGMVYNPSRVRYPMVRLDFLLKGHKSNTHQRGDFRFVRVTWDKALTLFKHSLDEVQTQYGPS -GLHAGQTGWRATGQLHSSTSHMQRAVGMHGNYVKKIGDYSTGAGQTILPYVLGSTEVYAQGTSWPLILEH -SDTIVLWSNDPYKNLQVGWNAETHESFAYLAQLKEKVKQGKIRVISIDPVVTKTQAYLGCEQLYVNPQTD -VTLMLAIAHEMISKKLYDDKFIQGYSLGFEEFVPYVMGTKDGVAKTPEWAAPICGVEAHVIRDLAKTLVK -GRTQFMMGWCIQRQQHGEQPYWMAAVLATMIGQIGLPGGGISYGHHYSSIGVPSSGAAAPGAFPRNLDEN -QKPLFDSSDFKGASSTIPVARWIDAILEPGKTIDANGSKVVYPDIKMMIFSGNNPWNHHQDRNRMKQAFH -KLECVVTVDVNWTATCRFSDIVLPACTTYERNDIDVYGAYANRGILAMQKMVEPLFDSLSDFEIFTRFAA -VLGKEKEYTRNMGEMEWLETLYNECKAANAGKFEMPDFATFWKQGYVHFGDGEVWTRHADFRNDPEINPL -GTPSGLIEIFSRKIDQFGYDDCKGHPTWMEKTERSHGGPGSDKHPIWLQSCHPDKRLHSQMCESREYRET -YAVNGREPVYISPVDAKARGIKDGDIVRVFNDRGQLLAGAVVSDNFPKGIVRIHEGAWYGPVGKDGSTEG -GAEVGALCSYGDPNTLTLDIGTSKLAQACSAYTCLVEFEKYQGKVPKVSSFDGPIEVEI - ->DmsA_Actinobacillus_succinogenes_130Z gi|75429943|ref|ZP_00732527.1| -MNHLDLNSNTTRRRFIKTTGLTAFAASAGISIPFATKAGNQSITSTAGADEKVVWSACTVNCGSRCPLRM -HVKDDQIIYVETDNTGSETYNLDHQVRACLRGRSMRRRVYNPDRLKYPMKRIGKRGEGKFKRISWDEALT -EIAQSLQKNIAQYGNESIYLNYGTGTLGGTVTKSWPPGSTLIARLMNCIGGYLNHYGDYSTAQISVGLDY -TYGGGWVLGNGMADIENTKLVVLFGNNPAETRMSGGGLTYCIQQAKAKSNAKLIVIDPRYTDTGVGKEDE -WIPIRPGTDAALVSALAYVMITEELVDQPFLDKYCVGYDENTLPADAPQNGHYKAYILGQGEDGIAKTPE -WAAKITGIPAERIIRLAREIGSTKPAYISQGWGPQRRSNGEIISRAIAMLPILTGNVGISGGNTGARESS -YGVPFVMMPTLTNPVKASIPMFLWTDAITRATEMTAKTDGIRGVERLTAPIKFIWNYAGNCLTNQHADIN -RTHEILQDESLCEMIVTIDNHMTSTAKYSDIVLPDCMTSEQMDFCLDGYVANMSYVIFADQAVKPSFECR -NIYDMLSDLSEKLGVKQQFTEDRTQEEWLRYIYRQSREQLPELPVFDEFRTQGIFKKVDPKGFYIPYKEF -RDDPQANPLKTPSGKIEIYSSRLAEIARSWKLDEDEVIHPLPIHVDSFEHYGDPLMEKYPLQLTGFHYKA -RTHSTYGNVDILKSANPQEIWINPFDAEKRGIKNGDMLRMFNDRGEVRIHAKVTPRIIPGVVALGEGAWH -APDNQGIDHSGCINVLTTQRPSPLAKGNPQHSNLVQVEKL - ->DmsA_Haemophilus_influenza_sp_P45004 -MSNFNQISRRDFVKASSAGAALAVSNLTLPFNVMAKETQRLNENNQERIVWSACTVNCGSRCPLRMHVKD -NRITYVETDNTGTETYNLDHQVRACLRGRSMRRRVYNPDRLKYPMKRIGKRGEGKFKRISWDEALTEIAD -ALKRNIKKYGNESIYLNYGTGTLGGTMAKSWPPASTMIARFMNCIGGYLNHYGDYSTAQIAVGLDYTYGG -GWALGNGMADIENTKLIVLFGNNPAETRMSGGGLTYCIEQAKARSNAKMIIIDPRYNDTGAGREDEWIPI -RPGTDAALVAALAYVMIQENLVDQPFLDKYCVGYDEKTLPTDAPKNGHYKAYILGYGNDGIAKTPEWAAK -ITGIPAERIIKLAREIGSTKPAFISQGWGPQRRSNGELISRAIAMLPILTGNVGIHGGNTGARESAYSIP -FVRMPTLKNPVKASIPMFLWTDAIIRGTEMTALTDGIRGVDKLSSPIKVIWNYASNCLINQHAQINRTHD -ILQDDTQCEMIITIDNHMTSTAKYSDILLPDCTTSEQMDFALDAFVSNMAYVIFADQVIKPSFECRPIYD -MLSDLAEKMGVKEKFTEGRTQEEWLRHIYEQSREKLPELPTFEEFRQQGIFKKVDPNGFKVAYKDFRDNP -EAHPLKTPSGKIEIYSSRLAEIAKTWKLAEDDVIHPLPIHAQSFEHYGDPLMEKYPLQLSGFHYKARTHS -TYGNVDVLKAANPQEVWMNPIDAEPRNIKNGDMIRIFNDRGEVHINVKITPRIIPGVVALSEGAWYAPDK -DRIDHSGCINVLTTQRPSPLAKGNPQHSNLVQVERL - ->DmsA_E_coli_sp_P18775 - -MKTKIPDAVLAAEVSRRGLVKTTAIGGLAMASSALTLPFSRIAHAVDSAIPTKSDEKVIWSACTVNCGSR -CPLRMHVVDGEIKYVETDNTGDDNYDGLHQVRACLRGRSMRRRVYNPDRLKYPMKRVGARGEGKFERISW -EEAYDIIATNMQRLIKEYGNESIYLNYGTGTLGGTMTRSWPPGNTLVARLMNCCGGYLNHYGDYSSAQIA -EGLNYTYGGWADGNSPSDIENSKLVVLFGNNPGETRMSGGGVTYYLEQARQKSNARMIIIDPRYTDTGAG -REDEWIPIRPGTDAALVNGLAYVMITENLVDQAFLDKYCVGYDEKTLPASAPKNGHYKAYILGEGPDGVA -KTPEWASQITGVPADKIIKLAREIGSTKPAFISQGWGPQRHANGEIATRAISMLAILTGNVGINGGNSGA -REGSYSLPFVRMPTLENPIQTSISMFMWTDAIERGPEMTALRDGVRGKDKLDVPIKMIWNYAGNCLINQH -SEINRTHEILQDDKKCELIVVIDCHMTSSAKYADILLPDCTASEQMDFALDASCGNMSYVIFNDQVIKPR -FECKTIYEMTSELAKRLGVEQQFTEGRTQEEWMRHLYAQSREAIPELPTFEEFRKQGIFKKRDPQGHHVA -YKAFREDPQANPLTTPSGKIEIYSQALADIAATWELPEGDVIDPLPIYTPGFESYQDPLNKQYPLQLTGF -HYKSRVHSTYGNVDVLKAACRQEMWINPLDAQKRGIHNGDKVRIFNDRGEVHIEAKVTPRMMPGVVALGE -GAWYDPDAKRVDKGGCINVLTTQRPSPLAKGNPSHTNLVQVEKV - ->TtrA_Wolinella_succinogenes_NP_907142 -MEEGRRRFLLGSGVVAGSAAVVGYKETLGAVALLKDKGERAKDSIYGEAAEPEVRFESGRTLINPKYSIRPSVCNGCTTHCGIRVKINQESGAVERVFGNPYSLLSSDPWLPYNTPLKESLEVLSAQKESGLHHRSTACARGNAVYDKLNDSFRVTKPLKRVGKRGENAWVEISPEQLIQEILEGGNLFGEGEVEGLRSIRQLDKLIDEENPEYGSSANRLCVLGTADEGRQVVMVQRFVQSFGTVNFMGHTSICGLSMRAGEAAYLNDFVGYPHLKPDFKNCKFLLNIGTAPAHAGNPFKRQAKLLAQARTTGECRYVTVTPILANSDNIAVGERSRWLPVAPSGDLALVMGMIRLIIEEKRYLADYLAIPSLESQKALEEVSFTNATHLIIQKGEKEGQILKDSQGSPWVIDVKEGVLRDSKSVLRGELDFAGEVTLEGVSYEVKSAFLLLKESALAYTLEEYASFSGIDSKEIVHLAREFTSYGRSVGVDCHGGTMHTTGFYATYAVMMLGALVGNLNHKGGMSMGGGKFEDFNGEAYNLIAYPNKPKPQGARIDRARMAYEKTSEFKRKVAQGENPYPAKAPWYGLANALESDVITNSEEGYPYKLGALISWCANFIYGQSGSEHLLESLKDPKRAIPLFIAIDPFINETSRWADYIVPDSVMYETWGVVSPWGASLTKASHLRYPILPSPNAKWSNGEPVSMDSFIIELGKALGLPGFGKNGIVAKSGEKFPFDRPEELYLRAFENIALSGKAVPEISDEEIELAGLKEYASKLQAINGENWRRVAYVMARGGRFAPIEDAYKGDSLSRAYPKAISIYNEALGTSKNSLTGERYSGVPRFYAPRFTDGRALEEAGLGDSRSFLAFSYKSNVLSAPTTASRHLKELRYTTFVDMNSQSAKALGIVHGERVRVVSKGGFVIGICRLREGIHPRSIGIEHGAGREGEGAIDLLINGNVIRGEIARRSGVNINKLGLKDASKGKVGTLSDFVIGSNARQGIPVWIEKLS - ->RBG1_855 -MQVTRRDFLTFAGFTLAGITLGEWGRSKILAREEYKDTLYSGIGKEEFRLSICGQCPAGCGIVVRLMDGNPKKIDGNPLCPLSRGKLCPKGQNGLQVLYDPDRLTGPVKRKGKRGENDWEKISWEEAINTVSQKLKELKEKQNSYRLLILTQENKGLSGKLWKQFARAYGTPNLVEGNLLRDPGILWASYLMQGIKDYPAYDIENTKYILCFSPFLEGWYSPTWAQRMYGNFRRKRPEIRGKLVQIEPRLSPTAANADEWIQINTGTEAALVLGLAYLIIKEGRYDENFIREHTFGFEDWTDAQKRTHLGFKNFVLQEYDTEKVSSLTGVPIVTIIRLAREFSELNPALAIAEQRPASGGFYLQMAILALNALVSSLDVKGGVIIQREVPFKEFPEVSGSKKESILNQERFSSQEVFPHLTKAILEEKPYPIEIVLIDKINPFSHCFPIINFKEALEKIPFIVSFSPFLDETSLYADLILPDHTFLEKWQDVVPSATLGSPVLGISRPAVDPFLDTKNTADVILEIAHDRDILAYSTLPWKNYGELLKDSLQGIYLSRRGMTYGTSFQGAWMSQMEKGGWWSPTYTNFEEFWNQLLEKGGWWDPFYEHQKWDRVFKTPSGKFEFYSQIFKNQLASIKPSKENSDFKILPHWESVVWEGDENSFPLYLNVFELLMFSAVLNSNQPYLYEHITPHLSVQWESWVEIHPEKAKALGIEENDEVWVESVLGKIKTKAKLYFGTHPEVVSLPLGLSGLSQSSWIKKEISNPNQLVTGNSGNLENKYLRVKIYKA - ->QrcB_delta_proteobacterium_NaphS2_ZP_07200609 -MTMKITRRNFIAAVVGGVVGIQVTPLPWKFTDDAAIWTQNWPWVPVPAEGAVTEENTVCNLCPGGCGISV -RKVAERAVKIEGRTDYPVNPGGICPVGMGGLQLLYDDDMRFPGPMKRAGARGQGQFVNITWGEAYDILAG -RIAKLRKDGTPEALAAIDGNYAGTTTGLLVERFMRSVGSPNYVKPNAITDTYHMGNLLMMGKSVPMAYDL -ENSDFILSFGCGLLEGWGAPGRVMNAWGMWHDANPKNRKTRVVQVESRASNTASKADFWVAPRPGTDGAL -ALGIAHVLIKKGRVDERFINGFTYGFDDLTSSEGQSQPGFKTIVSNKYSPVQVERITGVDAGTIVALANA -FSKAKAPVAVYGKGKNNLNGSLYEFMAVQSLNAVKGRINRPGGVLVPDPLPLAPLPEFDPDEVAAKGLET -PRIDGAGTKAYPFTDSLINHFADAINQGARSPVDTLLVFSANPFFTVPDGPGFMNALEKIPFIVSFSPYR -DETANMADLILPDHTYLEKIEDIVWPVGLQYPLYGLTKPVVEPVNDTQHAGDVIISLSKAVGEATGSAFP -WENFEEALQARAKGLFDAGGGLVHYDASKPPWKFKPFGNGQKPSYKSFDDMWGEMKSGGMWFQPVKLAGM -DGLFATSSGKFEFVSQKLRQTINETAAQTSQKAALDQMGIRVAGAEAFMGHYAAPKLGVDRSKYPLFMVP -YEMINLSSGWIATPPFLYKTIFASQLLKEESFAAVNPETAAKYKLQQGDRAIVKSPVGELRVRIDLFEGA -MPEMVYMPLGFGHTAYDEYQKDKGVNPNNIVKALNDPVSGYPLWWNTPVTLTKA - ->ACTB1_Geobacter_metallireducens_GS_15_YP_384764 -MKRRTFLQLGTVIAAGAVLDGCRSKNEQLIPYLIPPDEGITPGKGTYYASSCNACPAGCGILVRVSEGRA -KKIEGNPEHPINRGKLCARGQAVVQELYHPDRVPHPLKRNGPRGSGAFTRISWQEGIGLLTDRLKALQRE -QSTNGLALLTPHLRGTLAELTGRFMRTFGSTNHVSYELLTPDLLRIAARRSFGQPTLPYYDIAETRYLLS -FGADFVDSHLSPVKYGSAFGEMRQGRDTVRGHFTYVGGRMSLTAASADRWMPAKPGSEGTLALGIARLIL -AESLYDSGALAMNGLEAKKLLAALDRYDLPRVAQLSGLPQGAIAEVAREFASTRPALALAGEMVAFQSNG -PESVRAVHLLNLLVGSLNRPGGIYPDAGSPSGPENSFAELIALIETMRGGHVKVAMIHGDPLYSVPPATG -FHDALAKVPFIVSFSSLLDDTALHADLVLPDHAALESWGDVIPVAGTREPLVGLMQPVVEPLFDTRQFPE -VLLATAHELGGRMAAALPDESYLELLKGAVRKQAGFGAGVDFEAAWVDLLQHGGLFKTKSVQPTGYRWSS -DAPPPLPEDPDFAGDQKTYPFHLIAYPATAFYDGRGAPYPWLQQLPDPMTTVVWGSWVEINPETAAEHGI -GFGDLVEVSSPQGTLRLPAVVYPGIRPDMVAIPLGQGHRGMGRYAQGQGVNPLALVARQGTKQQPAWNAT -RVRITRISGNGELVTAGHPQGSLRSELVEI - ->ACTB1_Geobacter_uraniireducens_Rf4_YP_001231524 -MKRRTFLQLSGMTAAGTVLSGCQSGNEKLIPYLVPPDEGVTPGKADYYASSCRFCPAGCGILVRVSEGRA -KKIEGNPAHPVNRGKLCAMGQAVLQELYHPDRVPQPLKRSGPRGSGAFTRISWEESLELLAGQLRALQRE -KATDRLALVTPQLNGTLVELTTRFMRVFGSPHHLSFDLLGPDWLRTATRRSFGQPGLPWYDVAETRYLLS -FGADFVEHHLSPVQYGYAFGRMRQGRDTVRGHFTYVGGRMSLTGASADRWMPARPGSEGALALGMARLIL -AESLSDAGSLAVNGLQTEKLLRRLEAYDLPRVAEQTGLPQRIIAEVAREFATTRPALAMAGETVAFQSNG -PDAVRAVQMLNLLVGNLNRPGGVYPDGGSRVGPENSFTELLSLVAAMRDGRFRVAMIHGDPVHAIPPATG -FQEALARVPFIVSFSSLMDDTALQADLILPDHAALESWGDVIPLAGTRDRVIGLMQPVVTPLFDTRQFPD -VLMAMADKLGGKTAAFPYQSYQEMLKGTMEKRVGRAARRDFETVWVELLRQGGLFETRQGQEKGYRRAPG -SSLPNPAEPRFAGDEKRFPLHLLVYPSIAFYDGRGAPLPWLQQLPDPMTTVVWDSWVEINPRTAAEMGIG -FGDLVEVTSPQGAMRLPAVIYPGIRPDMVAIPLGQGHRGMGRYARGRGSNPLVLLALITDGTETRPAWHA -TRVRLTRISEKGELVTAGHPQGSYRSELIEI - ->ACTB1_Geobacter_sp_M18_YP_004200644 -MKRRTFLQISGMTAASALISGCQSANEKLIPYLIPPDEGITPGKAVYYASSCRSCPAGCGILVRVSEGRA -KKIEGNPEHPVNRGKLCARGQALLQELYHPDRVPQPLKRSGPRGSGQFTRISWEEGLNLLTGQLKGLERA -GAAERLALMTPQLRGTLATLAATFMSSFGSPHHLSYELLAPDALRAANRASFGQPSLPWYDIAQTRYLLS -FGAEFVDHHLSPVHYGNAFGRMRQERDTVRGHFTYVGGRLSLTAASADRWMPARPGSEGALALGIARLIL -SESLHDRGALSANGLSATDLLAGLASYDLARVAELTGLSREAIAEVAREFATTRPSLAMAGEGVAFLSNG -PETLRAIGLLNLVTGNLNSPGGVYPDGSFPDGPENSFADLVSLVGAMAGGRIALALIQGDPLHRVPAATG -FPEALAKVPYIVSFSQIMDDTALQADLILPDHAQLESWGDVIPVAGGRFPLTGLMQPVVTPVFDTRQFPD -VLLAAAAALGGKTARALPFPSYQELVKKSVLQRAARVKGEEAEEIWTSLLQKGGDFREGPEQPKGYRWAP -GASLPAPQAPLFAGDERSFPLHLQLYPSTAFLDGRGAPLPWLQQLPDPMSTVVWDSWVEMNPKTAAGLGI -AHGDLVEVSSPQGSLRLPAVVYPGIRPDLVAIPIGQGMRGGGRYARGRGVNPLSLLAAKLKGTGPTPCWS -ATRVKLVRISGDGGLVTNGNPQGSYRSDLVGI - ->TtrA_Photobacterium_profundum_YP_133039 -MAALIMDRRQFLKMGAATTFTGGMAGISKATAGDSNQDISRYAPLSAEPEFILGPDNKLTNNPNQRFAFTKCFGCYNVCGARIRIDNNTDQILRVCGNPYALSTQSGNPVAMEVSPQEAMLQLVGEQGNENRATLCGRGNAVPDAITDSRRVTQCLKRVGKRGENHWQSISYEQLIKEVVEGGNLFGEGHVEGLSDIYDDKTVANPAYPDFGPKKNQLLMTGCSEDPARWGFYKRFSEASWGTPNIGNKDSYCGHQQVAGCALGVEDGANSGALPTTDFEHCEFAIFIGTNPGLSGISLNSASKRLADARTQNPNFKYVVIDPILRSLTSSSTPENCEWVPIRSSGDTALMHAMMQYIINNERYNKSYLASCSQEGAYKVSEINYTNAPYLVVTDKKHPLYRKFLTAAACGKGDADTKMVIDAKSQQLTTSDSSEPCNIKFSGKVTTEDGQAVKVETAFSLLAKRVNEHSMADYAAECQVPEAKIIELAKEFTSHGRRVSIETNTGCNASDGSQFAFAMIMLTTLVGAHNAKGGMLHTGSMGFENTSPLYDMMAFEHAHLSGFNAERSGDYRQSNEFKEKVKNGINPYPSEMPWNETFIQDNAGELLVAHANGNPFKFKAWIAWANNPLYACSGLKDQVEASIKDPKQLGLIIASDPYFNETNVYADYFVPDLAQYEQWGASRQWGSELMGDVVSFPIITPKTPLNAEGNRVCMEQFLIDVAKQIKLNGFGENAFKDTAGNAKAINTPEDYYIPVLANLAHSDEVLPTPTEEDVKFTSVDRIYSQLKERLKAEEIGPTMFLFTRGGRYLTVNSRYEGEFFNEMMRWDAQFQVYNEGLAHITNFHSGEYLDGLPVFDKQRFWDGTAIRDLWSENEYPFYFSTFKHQLRSPYSVALKSITALGVSNFIQMNENDAKKYGLTTGDKARIATPKGAAIEGIVQADTTVAKGCIAVPLGYGHTAFGASDITIDGKTLTGIPERKGGMAVNAFNAVDPTRKGASLYRDVTFGSTARHGIPMKIEKV - ->TtrA_Haemophilus_somnus_gb_ABI25172 -MNKQRRNLIKGALATTAATAFVAGYSPKVKEIAKGVIEGSSGQKTQDNINGNSLLPEYQVKEGNLLTNSQQVVCNTQCMGCWTLCGLRVRIDLEKNKVLRINGNPYHPLSSDHYLDYNQSIKQAELSVSGENGLQQRSTACARGAAFLDGINSPYRITQPLKRVGKRGEGKWKTISFEQLIDEVVNGGDLFGEGHVDGLKAIRDLQTPVNAQHPDFGAKVNQLMVTFAGPEGRQPLLKRFANNSFGTINFASHGSFCGLSYRAGSGAFMNDFANNSHAKPDWDHVEFILFMGTSPAQSGNPFKRQSRQLAKKRTEDNFEYVVIAPRLELTSTAAQDKNRWVPIIPGKDLSLALAMLRWIIENERYNEDYLSIPSEIAMQQANGVSFCNATHLFIADPNHKQYGQAIRNFHIEDLSEPEKLSDSDILVKDRQTGKFIAAKDCQSAVLFVEDRISLKDGSQVLAKSALQLFKESCFSYSIEEYSEQCGVPVDTIIQLAKKFTSHGPRAAVITHGGTMHSNGFYTAWAILLLNAMIGNMNKKGGMSMSGGKFKDFSAGPRYNLANFPNMVKPKGTNLARSKKDYEKSSEFKQKVAQGISPYPAKAAWYPFVGGQMSEMITSALQGYPYSLKAWINHMGNPIYGMTGIHHITQQKLKDPKILPLFISIDAFMNETTALADYIVPDTHNFESWGFSTPWAGVPTKTSTARWPVIASPNEKTSQGDTICMESFVIEIAKMMQLPGFGDNAILDKQNHSYPLNRSEDFFLRAAANIAYDGKQPVQDATQEDLLLTGVQRLMPSLQQVLKPEEIKKVATIYCKGGRFAPHSSAWQEDNMQARWKNCLQIWNENVAKAKHAQTGKNYHGCPTYFEDQFADNSTVESHYPKIQWPFKLISFKSNLMSSITAPLLRLHSIKPNGIVAINQQDATEYGLQHGDLVELNTPGGKAVVQLVVMNGVIKGTIAIEHGYGHKQLGATGYTINGKLIEGNAQIGSGVNINDLGLLDSTKEIASPWVDWVCGSAVRQGIPAKLVKLA - ->TtrA_Yersinia_enterocolitica_YP_001005907 -MAKSTRRQWLKGSLALGGVVAFGASYHAVARKTLAGLVDGSAGKLTLDPISGNALPTEGRVGPQWQANPQQAVSMTQCFGCWTLCGLRVRVDTQQNKILRIAGNPYHPLSHDHHFPYQLPVGEALQHLGGEQGMTGRSTACARGATLLEGVDSPYRITEPMKRVGPRGSGKWQRISFEQLVAEVTEGGDLFGEGPVEGLRAIRDLDTPIDAKQPSLGPKANQLLVTNAGDDGRDAFIQRFANQAFGTKNLGSHGAYCGLAYRAGSGALMGDLDKNAHVKPDWDNVRFALFLGTSPAQSGNPFKRQGRQLANARQRDDFNYVVVAPALPLTTTLANQHNRWVPVLPGTDAALAMGIIRWIIEQHRFNHAYLAIPGEMAMQAAGERSWTNASHLVITTETHPLAGQFLRANMLSGETVAEGEESPVLAQAIDGALQPAAQMLQAELFVTQDLTLHDGQNVQVQSGMTCLQQAAARFTLAEYSQQCGVPEATIIGLAREFTAYQRQAAVISHGGMMGGNGFYTTWAVMMLNAMIGNLNLKGGVSVGGGKFDGFADGPRYQLATFVGMVKPKGLPLSRSKQPYEKSEEYQQKIQQGQSGYPARGPWYPFVGGQLTEQLAPALAGYPYPLKAWISHMTNPLYGVAGLRNLIEERLQDPRQLPLFIAIDAFMNETTALADYIVPDTHNFESWGFSAPWAGVLVKASTARWPVVEPRTARTAQGEPVAMESFLIAVAKAMKLPGFGANAMQDSEGNSLSLDRAEDYYLRAAANIAYGGEKPLPAAVDDELRLTGVDRLWPALQRSLYPDEQRRVAYLLARGGRFAPYEKSWNGDATGSQWKKPLQIWNENVAKHHHAITGERYSGCPTWYPPRLADGSDVFQHYPVSDWPLRLMSFKSHLMSSSTAMIERLRAVKSTNLVAINPQDAQRNGIQHGDIVRLMTPGGQMEVQVSLLDGVMPGVVAIEHGYGHREMGSRAHTLDGVVMASDPRIGQGSNLNDLGFTDPTREIPNTWLDWVSGAAVRQGLPAKLQRIS - ->TtrA_Aeropyrum_pernix_NP_148724 -MVSRRDFVKGSIAIASLLVAGAGLQPVLSQLVRPKFERIAPDLQMGANVRYVYSSCLGCNVRCGIKARVVKVGDLEIVERIEGNPYHPYNRAVSLNGNGKLGSQHLRFYHLPYNTPVKEALTKWHGTLCPRGQDGIYYLYDPYRVLVPLKRAGPRGSGKWKPISWEQLIREVVEGGVIEETGERLPGLRDFFVYGKLREAGFEDPNAILSDMKKDVQEILEYAKKPETSYEDIVMKIEEFKEKWSKILGEKGLKLDDILIDPDRPDLGTKANMVAYLRGRGQGHTDYMSARWIAGFGSVNWLRHTSACQLGYYAANYLWAGYHDIQPDPVSSKVIIMAGASMGRLHPGTTGQGLLISRAGEGDLKIYYVNPTAPRTDAGGNIVWIPIKPGYDAALAFALIRWIIENERYNKEFLEIPNEEAAERKGYPVHSNATWLVIMEEGHEKWGEYLKAKDVGLEDSDKPVVFTGEGLATYDSVDNAEIDWEGEVVLTTGERVKVKTSFRILKDEALSRSIDQWLSVASPYEPGSSEFREWKEKVLEMARDFAEAAPMAGTYVHRGVGMHSNGEYAVWAYRALDTLVGNYHRKGGLLARAGHTKYNSYVYHVDKKGFGEPVKWGPPIDRHKAKYEDTLEYWLKVKKGENPYPAKRPWYPHTPEESYTEIFAGIAEEYPYKMGALILFYANPVLSANYGVKFIEVLKDTKKLPLFIAITTTINETMLYADYIVPDTTYLETGTLGMQYLYASSGGVLLAEAARSPVVMPLTQKIGEPERYASFWEFFIDTGKALGMPGFGKGAIKGLKYHEGKSYDLDSLWDYIMRVYANAAMHAKDMGIIPENVPEEEVKFVEENYPVAKFKHLIPDEWPYVAYMLARGGVFTSYEESFHPNGVSKRKVPSKRKKFKKTLMLWNEDLAKTRNSVTGAKFWGGPKYIPPSTYAPVKGGSKSFYGTPLREIYPESEYPFHLVFTTGPLFTKHRSQFYYAIKQISPENYLVVNPKDAEKLGLETGDVVEVETPTGRFKAPVVVEPTVPPGVIMVPYGMGRWADTVVKKPSYFEVKDSRLASLINELPEREEIPEEAVNPVKKLPELKKKVLFTKSTPAYYNQAEPDKWRFNGITPNVAEMSDPSLGGWPLLSIIGAAQAYYFNVARIRKTGEKHEFEKTYPYIVW - - ->PsrA_PhsA_Archaeoglobus_fulgidus_NP_071207 -MVTRRDFLKATALTATAISAGIKFQPKSYAEATAASGEVKFVPNICAMCPAACSIQVEVRDGKVHRIHGTPDHPINNGKICARGNAGVQRVYNPDRLKKPLIRTGEKGTWSFREASWEEALSLIASKVKEYREMGHPEYIGMLGGWLPCTYYKPFFKAFLAALGTPNGGGVPEALCFLSKALGWKSAYGFGAHPELLTDYENARYVIMLRRNVAGSISVVHGWRLGQNRRKFKLVVLDPRYSETAAKADVWLPIKPGTDLAFLLAMMNVIINEKLYDSNFLAKYSNAPMLLKDGKPFKVWDENGKKKYLVFDLAKGAAVEHDSAMLPALEGEYEVEGEKVIPAFEALKRRVAEYTPEWAEGITDIEAKKIREIAREFALRRGVIDSGWHGPKYRNSLLTWRAAAIVNALVGSVNNDGGLLFTGLAQFVTSKESTTEAPSQSVLRMWAEKRGIATAFLGHTVQAFYDAIVNEDPYPIKMLFVVGHNLLMNMPERQKWEEALKKLDFMVAVDILPQDHLYYADVVLPESTYIEKDDPLFPIAYAPAFGFHTRVKAIEPIYDTKHVIEMMVEIASRLGTEDTFFKALSKGLGVDAEKLKSYYHGEGVAGIRRAQAEAKGVNYNELLSKGYVLKAGRDKIVYNMPYKQPLPTPTGKVEIFSFMLANFASKASEPYWDALIKWVPPKVSERKLGSNEFYLAYSRSPFTTHSSTSDNPLLAKLIDDAELYYKGIWINSERAAELGIRNGDRVVVESVFTGDKTEAIAFVNELVRKDTIFTVSGFGQSSERLTNIPQRGMTMMRLIPLQFDTLSGTIMSQETIVRITKA - ->PsrA_PhsA_Thermus_thermophilus_YP_004130 -MQRREFLKLSALGVGAMALRGSGPAKALKAPWYAQEVKSVYQICEGCFWRCGIVAHAVGNRVYKVEGYEANPKSRGRLCPRGQGAPQTTYDPDRLKRPLIRVEGSQRGEGKYRVATWEEALDHIAKKMLEIREKYGPEAIAFFGHGTGDYWFVDFLPAAWGSPNAAKPSVSLCTAPREVASQWVFGRPIGGHEPIDWENARYIVLIGHHIGEDTHNTQLQDFALALKNGAKVVVVDPRFSTAAAKAHRWLPIKPGTDTALLLAWIHVLIYEDLYDKEYVAKYTVGFEELKAHVKDFTPEWAEKHTEIPAQVIREVAREMAAHKPRAVLPPTRHNVWYGDDTYRVMALLYVNVLLGNYGRPGGFYIAQSPYLEKYPLPPLPLEPAAGGCSGPSGGDHEPEGFKPRADKGKFFARSTAIQELIEPMITGEPYPIKGLFAYGINLFHSIPNVPRTKEALKNLDLYVAIDVLPQEHVMWADVILPEATYLERYDDFVLVAHKTPFIQLRTPAHEPLFDTKPGWWIARELGLRLGLEQYFPWKTIEEYLETRLQSLGLDLETMKGMGTLVQRGKPWLEDWEKEGRLPFGTASGKIELYCQRFKEAGHQPLPVFTPPEEPPEGFYRLLYGRSPVHTFARTQNNWVLMEMDPENEVWIHKEEAKRLGLKEGDYVMLVNQDGVKEGPVRVKPTARIRKDCVYIVHGFGHKAPLMRLAHGRGASDNYLQTRYKLDPISGGAGLRVNFVRLEKAERPRLPSLTGLAKRPFDERRM - ->PsrA_PhsA_Moorella_thermoacetica_ATCC_YP_429324 -[MLEQKITRRTFLKGSLAAGALATFGGKLIPIEPAKAAAAGQAETRVVPTLCEMCGVKCGVLAHVRDGRVWRLTGNPRDPQSGGRLCARGNAGTKTLYDPDRLKGPMKRVGEGQFQPISWEQAFQEIGSKLKELKEQYGPQSLVWLAHPELISPLEKHFMAAFGSPNYTGHGPTCYSSRNVAFEQMYGGVPGVDYRNVRYYIAFGRNLTGGIKNPDVQKIVAAKAEGAHLVAVDPRLSDFAYFADEWLPIRPGTDLAMVLAMINVLINENLYDAAFVAAYTTGFEELKKGVSGYTPAWAAGITGIEAGTISRIARELAAAKPAAAVDPGWHAVTGSQYGNSVQAGRAIAALNALLGNLGARGGLSLPPTIKLGSPAGIMGPKPPAATAPRWDGAGSEKWPLNKDHGMIQTFPERVKQDQPYPVKAVIIQHLNPVRSSTDSLAFIEALKKLDLVVAIDIQMNDTAYYAHYILPEATYLERYDPLMTVGNKVLLRQPAIKPLFDNKGAEEIIAGIGRAAGLSEYFNFTLEQYNDALLGPLGLTQAQLALTGVAEVEASKPDYSKLKTPSGKIELACPAFVKAGSTLTPAWEPPLVEPRDDSFRLIQGHVPMHTHTTTDNNSYLHAIMPENELWIHTSRAGKLGIKTGDLVEVASKVGKVRVKARVTEAIHPEAVFLAHGFGCRVPLRHLAYNRGANGGDLIPIMTAPVSGAAAQCETLVTVRKAG - ->PsrA_Wolinella_succinogenes_NP_906381 -MTRRDFLKSAGAAGAAGLVWSQTIPGTLGALEKQEIKGSAKFVPSICEMCTSSCTIEARVEGDKGVFIRGNPKDKSRGGKVCARGGSGFNQLYDPQRLVKPIMRVGERGEGKWKEVSWDEAYTFIAKKLDEIKQKHGAHTVAFTARSGWNKTWFHHLAQAYGSPNIFGHESTCPLAYNMAGRDVFGGSMNRDFAKAKYIINMGHNVFEGIVISYVRQYMEAIENGAKVVTLEPRLSVMAQKASEWHAIKPGHDLPFVLGFMHTLIFENLYDKKFVQKYCTGFEELKASIEPCTPEKMALECDIPADTIKRLAREFAKAAPKAIFDFGHRVTFTPQELELRRAMMMVNALVGNIERDGGMYFGKNASFYNQFLGEEDPKAKGLKKPKTPAYPKVEVPRIDRIGEKDGEFFLANKGEGIVSLVPKATLNELPGVPCKIHGWFIVRNNPVMTQTNADTVIKALKSMDLVVCVDIQVSDTAWFADVVLPDTTYLERDEEFTAGGGKNPSFGIGRQKVVEPLGDAKPGWKIAKELSEKMGLGEYFPWKDIEDYRLQQVDGDLDLLAKLKKDGSASFGVPLMLQEKKSVAEFVKKFPGAASKVNEEGLIDFPKKIQLFSPKLEEVSGKGGLGYEPFKYKEEDELYFVQGKTPVRSNSHTGNVPWLNNLMEYDAIWIHPKTASKLGIKNGDAIELYNKFSSQKSKALITEGVREDTLFGYFGFGHVSKDLKRAYGKGVNSNALMPSFTSPNSGMDLHVFGVKVKKA - ->PhsA_Wolinella_succinogenes_NP_906934 -MEIEISRRRFLQGSVALTIVGASSGALAVGGSSGNKTESQEKGERSVATLCEMCVNKCAAIARVKDGKVIKLDPNPLFPKSRNMLCARGNAGIKALYDEDRLKYPLIRAGERGDGKFKRVTWDEAYTYIQEKLVKIMDEEQDNRSAIGFCAGEGMGEHHFKEFNKVFGSSNWLNHSSVCLQSTVSGYTLTIGTYGNPDLANAKYVIMAGANRAEAIVTPDTMDLFKRTLGRGCQLVVIDPRYSHTAHKADLWLPIKAGTDLAFVLALTHVVLSEEIYNKKFVEEKFNGFEEYKAHILQQNYTPEWAEPITGISASDIRKVARDFMACAPQAIYYPGRRTTWAKNDFQLRRAMAIFTALGGGVDVKGGICYGKTLPIDEHSIPAPMYANAKSRIEQNKAAIVGGTGSWVAWRDMVAAKETPYPIRGMFIYKQNPMHCVPNTAKTAQMFKNMDLVVTIDTMPSDTAIMSDVILPECTYLERTDPVKSFGGIEPAIAQRNKVIEPLYETKPVLQILRELTAKLSRPLFENSLKHDEDLQEMIEEKASELASSNPNKGEEELKKLAIEEVFEDEMEGWDISQGYAHSEEEMNEHAVAKYAGAHEMLLKHGVFYPGINEQFKQVSANEYVYYPESKKAYSMRNGQFNTPSKKVECVIPSLASKGIDTMPTWREEYLPKTPAGQFRFVTGRHAQFTQSSTANNALLLDTMSENFIWINKRVAKERGIKFGDLLEISSKAGKTRIKAYPTEKIAPDTVFFVHGFGVQSKAMSRAYQNGGHDSMIIEEHIEPVFGAAAAHETLVEIRKV - ->PsrA_PhsA_Thermosinus_carboxydivorans_ZP_01667237 -MKKFSRRTFLKLSGAATAALAAAPTLPRMASLAANIQLEGSAEFKASYCEMCTSRCPIQAKVVDGKTVLI -NGNPEWAATGGTVCARGGSGFSQLYDPQRLKKPLIRTGERGEGKWKEVSYEEAYAYIAEKMQDIKARYGP -EAMAFACRKGPHMGYLYTLAKAYGSPNTFNHESTCPMAKTVALEATFGTAALGIDYANVKYLVTFGRNFF -EGIHVAQTRGVMTAVSKGAKLVSFDPRFSLTSAKAHEWFAIRPGTDLAVVLAINHVLIRDGLYDRDFIDK -YTEGFEAVKASLTACTPAWAEQESGVRAADIERIARELAAARPRAVVEFGWRTTSTPEEFELRRAIIITN -LLLGNLEVPGGTFFVKSANFINSLVGKPVIQPIAGPKLPPFPQPGRPRIDGAGSKGQPYSLVPPIDGVVQ -TIPEAALTGKPYPIRGWFIYRYNPVLTIPDTNRVIEGLKKMDLVVVCDINMSDTAWYADVVLPESTYLER -DEGFNDYSGAVPVYTLRQKVVEPLYDTRPHWQIFKELAEKLGLGAYFPWKDVEELRLIQMGGKADLVRMG -KEKGFVNFGLKPLFLRDRASVAEFVAKFPEAKELVNTQGIIDKPLLNLKTKSKKIELLSTEAEELFGRGV -PVYRPVKLAEAGEAYFVQGKVAVHTNGHTHNVPWLYNLMSENRLWLNPATAAKLGLKDGDKAILKTRTGQ -QQVKVLVTEGVRPDTVFGYFGFGRLSPGLGRAYKKGINSNLALPLVTADVCGSTIQTTGVTISKV - ->PsrA_Carboxydothermus_hydrogenoformans_YP_361367 -MKLTRRSFLKASAATGALAALSGGVMSFERWAAKAAETGEVKLIPSICEMCGTKCGIIVKVKNGRVVKIE -GNKEHPNGKGKICARGNAGMKLLYDPDRLKQPLKKEGDRFVPISWEQAFREIGEKLKEIKAKYGPEALVW -STHPELAYDYEVIFNQAFGSPNLSAHAPTCYSPRNVAYKTMYGEVPTVDYGNVKYYISCGRNLVEGINVS -QVTGIMKAKEKGAKLIALDPRYSNFAALASEWVPIRPGTDLAFLLAMIHLIIKNEWYDKEFVKNYTIGFE -EVAAEVEKYTPKWAEEITGIPAATIERITEEFAKAKPAAVVDPGWHTSRYMNSTEMVRAGAVINALMGNL -GMKGGLKFPKYKFTKVEEREGLWPKLEKPKAKRFDGAGGEKWPLAKGLGMIQMLPEHILSGQPYPIKAYI -VNHHNPVRSAGNSQKWIEALKKLELLVVIDVQMSETAMMAHYVLPESTYLERFDPPQIAGNAVALRQPAV -KPLHNTMGVDDIIKELAHEAGIGQYFNFTLEQFSDQMLKPFNVTFKQLVEKGVIALDDGKTEYKVPEIKT -ESGKIELASSAFEKAGAKKVPTWVPPGVTEGNGKLRFLHGHTAVHTHTSTFNNEYLHALMPENVLWINTR -TAEKLGIKNGDLVEVKSDYGKVTIKAKVTEAIHPDAVFMVHGFGGFSPYQKKAYKKGASTSFIIPCHVEP -VSGASADCEVLVEVRKVGGGANA - ->PsrA_PhsA_Acidiphilium_cryptum_YP_001233491 -MQRRDFIRMSSAVASAALLGPTLAGCSRPAEWQRMMTEAPATETPTVCNICFWACAAKVHTRGERLWKIT -GNPEDAHCEGRLCTRGTGGVGAYYDPNRLVRPLVRMGKGADQRFEVASWDNALGLVAERMEKIAREHGPD -RLAALVHGPGAAHFSHLVRAFGSDSIAEPAFAQCRGPRDTGFFLTFGQGFGSPEQTDMAKARCIVLIGTH -IGENLHNSQVRTFTDGIRNDATIIVVDPRFSVAAGKANHWLPIRPGTDIALLLAWMNVILAERRYDAGYV -ARNTVGLEALCAHVAPFTPEWAYGETGIEPALIRETARLMAAAAPATVVHPGRHSTWWGDDTQRARAMAI -LAGLLGIWGREGGYYLPESVALPAYPVPAYPVPKTSWREIALPVFPLAGAPVTNVILDNAHGADAHYKGL -IVYDTNLPMTMPGIRRTLEAAAQSLELIVAVDVQPAEVTGYADVVLPECSYLERHDPLRNSGERYPALAL -RAPALPPRGESKPGWWIAREIGTRLGLGRYFPWTDYTEVIDWQLRQVGSSLKELETTGIRAFPRRTPAYF -APGETPRFATPSGKIELFSATLQQAGFDPLPRYTRPEAPPADHFHLNYGRAPQHSFSRTQNNPVLYQLMP -ENLVWIHPTAARRFGIRNGTYVRLVNQDGVVSNKVRVRVTERTRPDSVWLVHGFGHTAPGLSLARGRGAD -DSALMTRVLYDPIMGGTGMRGNFVTFRKENA - ->PsrA_PhsA_Geobacter_lovleyi_ZP_01593406 -MPIMSRRSFLKTSGICTAGAIAATYLPDQFLLWAGEKGLAKTEKITTYCEMCFWKCGAIATVVGGRVVKL -EGNPLSATAKGKLCGRGNGGIGLLYDPDRLKHPLIRTGKRGEGQFRKASWDEALTHIADKLKKIKEEHGP -ESLALFTHGSPTEHFMPLLQGFGSNNFAMPSFAQCRGPRVVGYELTYGDDIGSPERLDMANSKVVVLIGS -HLGENMHNSQVQEFTDAIGNGAKIIVVDPRFSVAAGKAHHWLPIKPASDMALILAWINIIIREGWYDREY -VAKYTHGFDKLAAAVQQYTPEWAEKETDIPAAQIMATAREMGLHRPAVCIHPGRHVTWDGKDVQRSRAIA -ILGAILGTWGREGGAYLATRGSFPAVPPPSFPASNRPTLKKGGFPLGGAEGVTNAIREATSIGEPYPVKA -WMVTGTNLLAAMPGQKETIEAISKLDLLVVVDVIPSDTSLYADVVLPECTYLERHDGLIIGKGRALSASI -RQPAVAPMYDSKPAWWIAKELSKKLGLEDYFPWENFEDRLNELCLTYNIDYDELKQKGVISFPDTAKPFI -TADNQPVFKTKSGKIELYSKELEELGFEPIPAYEKNEEPPQGFYRLLYGRSAVHTFSRTVNNPALNELYK -ENELWLSSVQARKMGLTDGQYVALQNQEGITSNRVRLKVTERIREDCVYMVHGFGQQSKGLTKAFRRGAD -DQQLISSYPVDPICGGTGMRCTFVKLVKGA - - ->TtrA_Pyrobaculum_arsenaticum_YP_001152643 -MTSRRTYLKAIAAAAALGVALWGYWPVVDKIIKPKRNPYGPDPQYGKNVRYVHTTCLGCNVRCGIRVRVV -KYGDVEVIERIEGNPYHVYNRAVSFDSQVKRYKQLPYNTPVKEALERWSGTLCPRGVDGIHYVYDPYRVL -KPLKRAGPRGSGKWKVITWEQLNNEVVNGGIIEETGERLPGLKDFFVYGKLKEAGFEDPNAVLSEMKADV -DNIMKIARDPNKTYDELVKAIEGFKAKWSQKLGEKGLKLEDVFIDPDRPDLGTKANMVMYLRGRGQPPTD -YFSQRWIYAFGSVNWTRHTSACQLGFYTGNRIWAGYTDIQADPVGAKVIIGAGWSMGRLHPGATGQGLII -ERACEGDLKLYYINPVAPRTPCNGNIIWIPVKPGEDATLAFAVIRWLIENKRYNEEFLSLPNRDSAKKAG -YPVNTNATWLVITEGQRFGEYLKARDIGLENSDKPVVWTGEKFATYDSVDKADLYYVGKVTLPTGEAVAV -KTAFMILREEAFSRSFEEWLAIASPYEPGTPEFRDYVKKVEQMARDFADAAPRAGTMIHRGVGMHPNGEY -ITWAYRAIDTLIGNFHRMGGLLGRAANTSYLSYVYNVGYSGFGEPPRWGPPIDRHNYAYEATLEYWLRVK -EALKEGKSWEDAVKAAFPTKRPWYPLTPEESYTEIFAGIAEGYPYKIGAFIMFYANPVLATNYGVKFVEV -LKDTSKIPLFIAITTTINETAMYADYIVPDTTYLETGTMGVQFLYATSGGVTLAEPWRSPAIMPLTQRIS -DCPNGHPRYASFWEFFIDTAKALGMPGFGDRAVPGVKGKKYEGRWFPLHCEWEYVMRVFANAALDAKDRG -LIPEQVPEEEVKFVEENYPIAQFKDIIPPEEWKYVAYGLARGGVFTSYEQSFDERGVSKRSVPGRGTLYL -WDETLAKTRNSVTGEKFWGGPKYFPIATYAPAGPAFQKADKWLHGTPLRQLYPEKDWPFMLVFYTGPIYT -KHRSQFYYWIKQIAPENFVLINPEDAAKIGVETGDVVRVETPVGFFEAPAVVEPTVAPGVIMVPYGMGRW -ADTVLVKPKYFELRDAKLKLTVDGLPEKMEVPEDAVNPVKGLPDVVKKILFTKSPAEYYEKGLAPDKWRF -NGVTPNVVQMSDPSLGGWPLLSWLGASQAYFDTPVRITKTGQKHKFETPYIVW - ->TtrA_Pyrobaculum_aerophilum_NP_559177 -MTSRRAYLKAIAAAATLGIALWGYWPVVDKIIKPKRTPYGPDPQFGTNVRYVFSSCLGCNVRCGIVARVV -KYGDVEVIERIEGNPYHVYNRAVSFDKQIKRYAPLPYNTPVKEALEKWSGTLCPRGADGIHYVYDPYRVL -KPLKRAGPRGSGKWKAITWEQLINEVVNGGVIEETGERLPGLKEFFAYGKLKEAGFEDPNAILSEMKIDV -DNIMKVARDPNKTYDDLIKAIEEFKAKWSQRLGEKGLKLEDLLIDPDRPDLGTKANMVMYLRGRGQGHTD -YFSQRWIYAFGSVNWTRHTSACQLGYYAGNSIWAGYHDIQADPIGAKVIIGAGWSMGRVHPGATGQGLMI -ERACEGELKLYYVNPVAPRTTCNGNIIWIPVKPGEDAALAFAVIRWLIENKRYNEEFLSIPNRDSAKKLG -YPVNTNATWLVITEGERFGEFLKARDVGIEDSDKPVVWTGERFATYDSVDKADLYYVGKVTLPSGETVTV -KTAFMIVRDEAFSKSFEDWLAIASPYERNTPEFADYVKKIEQMAKDFADAAPKAATTLHRGVGMHPNGEY -IVWAYRTIDTLVGNFHRMGGLLARAAHTAYENYVYNVGRSGFGEPVRWGPPIDRHRYAYENTLEYWLRVK -KALKEGKSWDEAVKAAFPTKRPWYPHTPEESYTEIFAGIAEGYPYRIGALILFYANPVLATNYGVKFIEV -LKDPAKLPLFIVITTTINETALYADYIVPDTTYLETGTMGIQYLYATSGSVTLAESWRSPVIMPLTQRIS -DCPNGHPRYASFWEFFIDTAKALGMPGHGDKAIPGVKGKKYEGKWFSMHCEWEYILRVFANAALDAKDKG -LIPEDVPEEEVKFVEENYPIAQFRDILPPDEWKYVAYGLARGGVFTKYEESFDERGISKRRVPGRGTLYL -WSEEVAKTRNNVTGEKFWGGPKYFPIATYAPAVPAFQKADEWLHGTPLRQLYPEKEWPFILILYTGPLYT -KHRSQFYYWIKQVVPENFVLINPEDAAKLGVETGDVIKVETPVGAFEAPAVVEPAVAPGVIMVPYGMGRW -ADTVVVKPKYFELKDARAKSLIDELPDKVEIPEDAVNPVKHLPDVVKKLLFTKSPAEYYEKGLAVDKWRF -NGVTPNVAEMADPSLGGWPLLSWLGAAQAYFDTPARIVKTGQRHKFEVPYIVW - ->NarG_Pseudomonas_stutzeri_gb_AAZ43099 -MSHLLDQLRFFNRKQGEFADGHGETRIESRDWENVYRSRWQYDKIVRSTHGVNCTGSCSWKIYVKNGLIT -WETQQTDYPRTRNDLPNHEPRGCPRGASYSWYIYSANRLKYPKVRKPLLKLWREARRNMTPVDAWASIVE -DKAKAESYKSKRGMGGFIRSSWDEVNEIIAAANVYTVKQYGPDRVIGFSPIPAMSMVSYAAGSRYLSLIG -GVCLSFYDWYCDLPPASPQIWGEQTDVPESADWYNSNYIIAWGSNVPQTRTPDAHFFTEVRYKGTKTVAI -TPDYAEVAKLTDLWLNPKQGTDAALAQAFAHVIFKEFHLEKPSEYFRDYAKRYTDLPVLVRLNEKDGSYI -ADRFLRASDLADNLGQENNPEWKTIAVDGSTGELVSPLGSIGYRWGEKGKWNIEAREGKDGRDVDLSLTQ -IEGGETAEVAFPYFGGILHEHFQHAEGESIQLRRVPVRTITLADGSTTKVATVFDLMAANLGIDRGLGGG -NVASSYDDASVPGTPAWQEVITGVSREKAIQIAREFADNADKTHGRSMIIVGAAMNHWYHMDMNYRGLIN -MLMLCGCVGQTGGGWAHYVGQEKLRPQCGWLPLAFGLDWSRPPRQMNGTSFFYNHSSQWRHEKMSIHEVL -SPLADKSQFPEHMLDYNIRAERAGWLPSAPQLNRNPLQICRDAEAAGMSPVDYVTQSLKDGSLKFACEQP -DNPDNFPRNMFVWRSNLLGSSGKGHEYMLKYLLGTKNGVMNEDLGKRADGFKPTEAEWQDEGAIGKLDLV -TTLDFRMSSTCVYSDIVLPTATWYEKDDMNTSDMHPFIHPLSAAIDPAWEAKSDWEIYKGIAKAFSKMAE -GQLGVEKDLVTVPLLHDSPGELAQPFGGTDWKTAGVDPQPGKNCPNMAVVERDYPATYKKFTSLGPLLDK -LGNGGKGINWNTQDEVDFLGELNYKVRDEGVSQGRPQIESAIDAAEVILSLAPETNGHVAVKAWAALSEF -TGRDHSHLALPKEHEAIRFRDIQAQPRKIISSPTWSGLEDEHVSYNAGYTNVHEYIPWRTITGRQQFFQD -HPWMQAFGEQLMSYRPPINTRTIDYVKGKKSNGNPEIVLNWITPHQKWGIHSTYSDNLIMLTLSRGGPIV -WMSEVDAKKAGIEDNDWIECFNANGALTARAVVSQRVMEGMVMMYHAQERIVNVPGAESTKTRGGHHNSV -TRVVLKPTHMIGGYAQQAYGFNYYGTVGCNRDEFVVVRKMAKVDWLDGPNGNDLPQPLPQDI - - ->NarG_Pseudomonas_fluorescens_gb_AEV63780 -MSHLLDQLRFFNRKQGEFSDGHGETRKESRDWENVYRSRWQYDKIVRSTHGVNCTGSCSWKIYVKNGLITWETQQTDYPRTRNDLPNHEPRGCPRGASYSWYIYSANRLKYPKIRKPLLKLWREARQTLPPVEAWASIVEDKAKADSYKSKRGMGGFIRSNWEEVNEIIAAANVYTVKEHGPDRVVGFSPIPAMSMVSYAAGSRYLSLIGGVCLSFYDWYCDLPPASPMVWGEQTDVPESADWYNSNYIIAWGSNVPQTRTPDAHFFTEVRYKGTKTVAITPDYSEVAKLTDLWLNPKQGTDAALAQAFNHVIFKEFHLDKPSAYFTEYAKRYTDLPVLVMLKPMLGAAPGAGYQPDRFLRASDLTDNLGQDNNPEWKTIALDAAGELVSPQGSIGYRWGEKGKWNILPREGGEGREIDLKLSLIGGDVAEVAFPYFAGEAQEYFQHVAGDAVQFRRVPVHSVVLADGSVAKVATVFDLSAANLAIDRGLGGANVAKDYNDASVPGTPAWQEQITGVSREKAIQIAREFADNADKTRGRSMIIVGAAMNHWYHMDMNYRGLINMLMLCGCVGQTGGGWAHYVGQEKLRPQCGWLPLAFGLDWNRPPRQMNGTSFFYGHSSQWRHEKMSMHDVLSPLADKSQFPEHALDYNIRAERAGWLPSAPQLNTNPLHICRDAAAAGMEPKDYVVKSLQDGSLRFACEQPDSPVNFPRNMFIWRSNLLGSSGKGHEYMLKYLLGTKNGVMNEDIGHSTECKPTEAEWVDEGAIGKLDLVTTLDFRMSSTCVYSDIVLPTATWYEKDDMNTSDMHPFIHPLSAAIDPAWESRSDWEIYKGIAKAFSAMSVGHLGVEKDLVTVPLMHDSVGELAQPFGGTDWKSAGVAPVPGKNAPNLQVVERDYPNIYKQFTSLGPMLEKLGNGGKGINWNTDTEVKFLGELNHKEVEAGISQGRPKIDSAIDAAEVILSLAPETNGHVAVKAWAALSEFTGIDHSHLAISKEHEAIRFRDIQAQPRKIISSPTWSGLEDDHVSYNAGYTNVHESIPWRTITGRQQFYQDHPWMQAFGEQLMSYRPPVNTRTIAGVKGKRSNGETEIVLNWITPHQKWGIHSTYSDNLLMLTLSRGGPIVWLSEIDAKRAGIEDNDWIECFNVNGALTARAVVSQRVKEGMVMMYHAQERIVNVPGSETTKTRGGHHNSVTRVVLKPTHMIGGYAQQAYGFNYYGTVGCNRDEFVVVRKMVKVDWLDGSSGDDLPRPLPTDIEEN - ->NarG_Halomonas_maura_gb_AAT47523 -MSHFIDRLNFFRKAREPFANDHGEVRDESRGWEDGYRQRWQHDKVVRSTHGVNCTGSCSWKIYVKNGLVTWETQQTDYPRTRPDLPNHEPRGCPRGASYSWYLYSANRLKHPLVRKPLLKLWREALEEKGDPVDAWASIVEDPAKTKQYKRARGMGGFVRADWNELNELIAASNVYTAKQYGPDRIIGFSPIPAMSMVSYAAGSRYLSLIGGVCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNSGYIIAWGSNVPQTRTPDAHFFTEVRYKGTKTVSVTPDYAEVSKLTDEWLSAKQGTDAALAMAMGHVILKEFHLDRPSAYFTDYVRRYTDMPCLVELEAREDGSYVPGKQLRASDFEASLGQDNNPEWKTVAWDETRDQLVVPRGSIGFRWGEEGKWNLEPRDAEGAEIKTRLSLAEAHDDVARVAFPYFGGIAHEHFDHVKSGGASDELLFHSLPAKRLTLADGREILAVTVFDLMCANYGIDRGFRSQEGKEGEDDGATAYDQVKPYTPAWQEKITGVPAEQCLRIAREFADNADKTHGRSMIIVGAGMNHWYHMDMNYRGLINMLVMCGCIGQSGGGWSHYVGQEKLRPQTGWLPLAFGLDWQRPPRHMNSTSFFYNHSSQWRYXKLEIKEILSPLAKPADYSGSLIDFNVRSERMGWLPSAPQLATNPLSLAGKAAEAGQSTADYVVDQLKAGGLRFAAEDPDDPQNFPRNMFIWRSNLLGSSGKGHEYLLKYLLGTRHGIQGKDLGEDGGQKPEEVVWHEAAPEGKLDLLVTLDFRMSTTCLYSDIVLPTATWYEKDDLNTSDMHPFIHPLTAATDPAWESRSDWDIYKGIARAFSKACVGHLGEETDLVTLPLQHDSPAELAQPEVKDWKRGECEPIPGKTMPALVEVKRDYPATYERFTSVGPLLDSLGNGGKGIGWKTEKEVELLGKLNYVKTEGPAKGRPRIESAIDAAEVILTLAPETNGQVSVKAWEALSKITGRDHRHLAEPKEEEKIRFRDVVAQPRKIISSPTWSGLEDEHVSYNAGYTNVHELIPWRTVSGRQQFYQDHAWMRAFGESLLVYRPPIDTKAAVSLADDKGNGNPEIALNWITPHQKWGIHSTYSDNLLMQTLSRGGPIVWLSKDDARSIGVEDNDWIELYNANGAIAARAVVSQRVKNGMAMMYHAQERILNMPGSEVTGTRGGIHNSVTRVCPKPTHMIGGYAQLAYSFNYYGTVGSNRDEFVIVRKMKKIDWLDGEGNDYEQEAVK - ->NarG_Escherichia_coli_NP_415742 -SKFLDRFRYFKQKGETFADGHGQLLNTNRDWEDGYRQRWQHDKIVRSTHGVNCTGSCSWKIYVKNGLVTWETQQTDYPRTRPDLPNHEPRGCPRGASYSWYLYSANRLKYPMMRKRLMKMWREAKALHSDPVEAWASIIEDADKAKSFKQARGRGGFVRSSWQEVNELIAASNVYTIKNYGPDRVAGFSPIPAMSMVSYASGARYLSLIGGTCLSFYDWYCDLPPASPQTWGEQTDVPESADWYNSSYIIAWGSNVPQTRTPDAHFFTEVRYKGTKTVAVTPDYAEIAKLCDLWLAPKQGTDAAMALAMGHVMLREFHLDNPSQYFTDYVRRYTDMPMLVMLEERDGYYAAGRMLRAADLVDALGQENNPEWKTVAFNTNGEMVAPNGSIGFRWGEKGKWNLEQRDGKTGEETELQLSLLGSQDEIAEVGFPYFGGDGTEHFNKVELENVLLHKLPVKRLQLADGSTALVTTVYDLTLANYGLERGLNDVNCATSYDDVKAYTPAWAEQITGVSRSQIIRIAREFADNADKTHGRSMIIVGAGLNHWYHLDMNYRGLINMLIFCGCVGQSGGGWAHYVGQEKLRPQTGWQPLAFALDWQRPARHMNSTSYFYNHSSQWRYETVTAEELLSPMADKSRYTGHLIDFNVRAERMGWLPSAPQLGTNPLTIAGEAEKAGMNPVDYTVKSLKEGSIRFAAEQPENGKNHPRNLFIWRSNLLGSSGKGHEFMLKYLLGTEHGIQGKDLGQQGGVKPEEVDWQDNGLEGKLDLVVTLDFRLSSTCLYSDIILPTATWYEKDDMNTSDMHPFIHPLSAAVDPAWEAKSDWEIYKAIAKKFSEVCVGHLGKETDIVTLPIQHDSAAELAQPLDVKDWKKGECDLIPGKTAPHIMVVERDYPATYERFTSIGPLMEKIGNGGKGIAWNTQSEMDLLRKLNYTKAEGPAKGQPMLNTAIDAAEMILTLAPETNGQVAVKAWAALSEFTGRDHTHLALNKEDEKIRFRDIQAQPRKIISSPTWSGLEDEHVSYNAGYTNVHELIPWRTLSGRQQLYQDHQWMRDFGESLLVYRPPIDTRSVKEVIGQKSNGNQEKALNFLTPHQKWGIHSTYSDNLLMLTLGRGGPVVWLSEADAKDLGIADNDWIEVFNSNGALTARAVVSQRVPAGMTMMYHAQERIVNLPGSEITQQRGGIHNSVTRITPKPTHMIGGYAHLAYGFNYYGTVGSNRDEFVVVRKMKNIDWLDGEGNDQVQESVK - ->II_OP1_uncultured_candidate_division_UNIPROT_TREMBL_H5SSA4 -MHLRRLSRRTFLKAAVATSAATAVLSHWPRSGRGIQEGATPAQERWVKSVCLQCPAACGI -MVRVVKDSLGERAVKIEGNPNHPSNQGGICPKGHIGLQILYDPDRLQGPLRRVGPRGEGK -WEPISWEEALQIVTERLKKLRERGEPHKLVIMSGRNRGQMGALIDRFLAAFGSPNHVGHS -SICSDGAKLAHYLTQGFKHYAAYDWDNCNYLLSFGAGFIEAWRPTVRLLRAFGHMRRGRP -IRAKIVQIETRFSVTAAKADEWLPINPGTDGALALAIAHVIVREGLYNKKFVEEHTFGFE -DWEDEQGHFHQGFKTLIRQYTPAWAAPITGVPEETIVRIAREFATTPPQIAAGQRGAMMQ -TNGIYNYMAIHALNALVGSIDAPGGVLVQIDPPLTPWPPLAQDEIAQTGVKQPRIDHAGT -EEFPLAANVYAALPDFIINEDPYAIDTLMLYYTNPVFSSPDAPKYSQAFEKIPFIVSFSP -FLDDSSLFADLILPDHTYLERWHDDVIYPSLGYPVYAVRQPVIAPLYNTRNTGDLLIELA -HRLGGTVKESFPWKDFLELIQFRARGIYESGRGNIQANSFEEFWQQLLEVGFWTDPPYPF -GQWERVFKTPSKKFEFFSQKLAHTLEDLAKKKAEHEGIPEEEALDKILTRLKITARGDAA -FMPHYEEPRFVGDPKEYPLYLNTYKLMAHAEGRGANSPWLQEILGTHVGRRWETWVEINP -TTAQKLGITEGDWVWVESPLGKIKVRAKLHPGAKPDVVNIPFERGHRSYGRWAVGFGANP -NEVLAREYDYLGGDAAFFSTRVKVYKAQEGE - ->QrcB_Syntrophobacter_fumaroxidans_YP_844744 -MKVGRRAVLQFMAGAVGGTLLSPLPWKLTDDAAIWSQNWFWRPSPARGEITRKPTVCALCEGGCGVQARL -VDGKRAILLEGNPNHPVNQGGICALGAAGLQFLYAPYRIAQPLKQTKRRGDPTGFQPIAWNEAVGELAKK -LGQMRADGKPNGLAGITRRRCSSMDALLNQFFAAYGSPNLFKMPAHADSLKLAGAVTTGREAPFGCNIED -APYILSFGAGLVEGWGSPGRMQAAFRRWRQGGKSAAKIVQVDSRCSTTAAMADRWIAVPPGTEAALALGI -AHLMVKDKLYDAEFMADRVFGFEDWTDSQGKNHKGFKFLVQTDAYTPEAISKLTGVDPAKIRELAKEFGT -QKGAVAVWGQPQGSVPKDMYNELSFLALNALKGNIKAGGAIGLAPEVPLGALPELPGDPSALKGLKQLRL -DLASSQKGPPPVLPGNNLHGFLDAVSNGGKYPIEVMLVHEANPAYGLCENKLFQQALTKIGTLVSLSSYM -DETAQQADLILPIHTAFEGFDDVIGIPGAPYAYYGVCAPVLKPHLNTKAAGDIVMSVAKQLGGSIAAALP -WASHEEYLKKRAEGLAASARGALADKKGVELWKLQPEEAVKPNYKDGADLWKKLAGGACWYDAPVDPLKD -LKTESGKFELAAQLLLAKGQTGDDDQVYLPHFSQVPPRGSDKDYPLLLVTYQMSALADRDLANPPFMTKT -VFDFILRQNDQFVEINPATASELGMAEGDSAVLKTPQGEVPVRVHLYAGARPKVVYLAQGLGHKAYDEYI -KDKGVNANGVVEVQLDRVTGLGTVWAARAHLRRA - ->ArxA_Ectothiorhodospira_sp_PHS_1_ZP_09695308 -MKLLETLINRRRFLKATGAVAGAGVVAGGAGVVPGLTTLSHARSPAPSADTTITKNICHQCPARCGIDVY -TTGGRVHAIYGTSDHPISNGKLCPKGPLGAYILYDPDRFKGPMKRTNPNKGRDQDPGFVPISWNEALDMV -ADRLNGLREREESHRFALLYGRGWGASCAGLLGNFGKLYGSPNVAIGHSSMCSDGSIISKKAVDGIGGYN -SYDYKNANMLLMFGAGFLEAFRPYNNNMQVWGYIRGVKVPKTRITAVDVHMNTTLAGSDRALLIKPGTDG -ALALAIAHVILVDGLWEKAFVGDFSDGVNRFIPGETVDPDSFEEKWVKGLVEWWNAELKDRSPRWAAQVT -TLYERDILATAREFGTTRPAIALYERGAHAHSNGIFNGMAIHTLNALVGSLYAKGGLAYQVGPSYGPLPV -NADDYLDDWARTGGWKAQPRIDLKGHPDGYLLANNMMQEIGPNSLQGKPYKLDTIMFYLNNAIWTAPDVK -AWEEALKELFVIETSPFPSETAMFADVILPDHTYLERLQDAPTYPFQGWPMTQLRVPAVKPLYDTKYFGD -VLIELGKRIQGSMGEYYQALDNTENVIRHLAKGFESDPGDNGVNSFESWKEKGVWYKRVYPYRQIDGEFY -EWDGQDHTRLMSADEVRGALFKTASGKFEIRSGWLEAHADWIAAKTGRDPSRLMFPIWEEPSHPGGGDLY -MVTPKVALHAEGRGANLPVAIANMQPTLGGRNTIYIEINPKTARARGIPDGSRVRISSDLGAIEGYCKYY -EGVRPDTLVFPMEHGHWAHGRWAKGRKPGHSGEITVNQSDRITGQCSYYTTKVRIERA - ->ArrA_Wolinella_succinogenes_NP_906980 -MEINRRDFLKATALTAGAVGIAQIPEIEANTQVSGEVGKWVASTCQGCTSWCSIQGYVVDGRLVKVRGNPNAKGNHGKICPRPHLAIQQVYDPDRVKTPLKRTNPKKGKGIDPQFVPISWDEAIDTIADKIMALIKSGESHKFALFRGRYTHMNEILYNTFPKLIGSPNNISHSSICAEAEKFGRYYTEALWDYADFDLDNTRYVLGWGADPLASNRQVPHFINIWGKVRDQARIAIIDPRLSATAAKADHWLPIIPGEDSALAVAMAHVILAGGAWNKGYVGDFVDGHNYFKPGELVPESIEVEGKIIPVEFKEKHTYGVVKWWNLELFDKTPEWAEPITGIPAKQIRQVALEFAAAGSRAISWVSPGACMQIRGSYASMAAHALNGLVGSCDSVGGILQGTSVPSGKTPDIKPYLSEEIASALKQKKIDQRGTPKFPALNKKTGGGVVTANVANAILDEKPYDLKMAIGYWNNFVFSINGTHLWEKAMEKLPFYAHITTHMAEMTMYADIVLPAKMHMFERYGFSKNKQNLHGYLSIHQPMVKPLGEAKTDETEIVFMIAQALAKKGHDAPLRYYQENFKDPETGKIPSTPEEFDLFSVKYFTQPIWDGSSNDKGDSINSWKELLEKGVWSTKRYSIGKKIDNFKTETKKFEFYSETLKKVLEEHVEKNKLSSIDEAIEASNNTARGERVFVPHYEPSVRYGDPKIYPLIFAEHRSRLNREGRSQNAPWYYEHKDVDPGDEIEKDVAKINPETAKQFGIKTGDRIRIVGTQASIETEVKLWEGIRPGIVVKCYGQGHWAYGSVASEKFGSKPRGTNNNDIHIHEYDRLSGSTARHGGTARVKIEKI - ->ArrA_Bacillus_selenitireducens_gb_AAQ19491 -EQGEWIASVCQGCTAWCAVQVYRIDGRATKVRGNPNAKANHGHSCVRSHIGLQQVYDPDRVKQPMKRTNPNKGRDEDPEFVPISWEEAMDTIADKIIELRENNETHKFSVWRGRYTSNNGILYGNMPKIIGSPNNISHSSICAESEKFGRYYTERYWGYADYDHENALYEIFWGGDPIATNRXVPHTASIWGELSDRATLACVDPRFSTTAANQMNGCRLIPGEDGAIASAIAHVILTEGVWYKPFVGDFKDGQNRFVEGRDVNEDDFEEIQTHGLVKWWNLELKDKTPEWAAERSGIDADQIYRVARGFANAAPKAISFSSPGSSMTIRGGYTAMTQAALNGLVGSADNLGGVISNGISVPNNGFPDPSDYIDEIAANGLEQDRIDWGGRLEFPALKDSKSGGVKVTNTVADAVLAEDPYEFKSRIELLDELQFLQPRNGSLGQSFGQDSIHGAYDCQSGEQTHFADIVLPVPHSQFERQSPVAGSNGNLHRHLHLQNKVIESPFDIRVDETEIPWMIGESLEKKGYSNLIDYFRNEFRDPETGEAPTNAAEFDEIATKHYTHPVWDPTFEKDGDQIDGWEEYKRLGTWNTNKYEFRQKWDGNWGTETGQFEFYSETLKVALQDHADKHNASIDDVMEATFNTAKGELAFVPHYEPAMRVGDESEYPLIFMEHRSKLNREARSANTSWYQEFKDIDLGDEAWDDVAKLNPKDAAELGIQNGDMVRLVTPEGQIEVKAKLWEGTRPGVVAKCYGQGHWAYGHIASLDRRRQIARGGNNNIILAPVHEALSGSGARHGGQTRVRVEKV - ->ArrA_Chrysiogenes_arsenatis_gb_AAU11839 -MRIKRREFLKASAAVGAVAVASPTLNAFAQTGTGASAMGEAEGKWIPSTCQGCTTWCPVEFLFRMAVRSKYAATQLSKANNGYCCVRGHLMLQQLYDPDRIKTPMKRTNPVKGRKEDPKICPYHMGMKQWDTIADKIMELRKNNETHKYLLMRGRYSDHNSIFYGDLTKMIGSPNNISHSAICAEVEKMGSMATEGFWGYRDYDLDNMKYLIAWACDPLSSNRQIPNAIRKIQGVMDRGKVVAVDPRMNNTASKAQEWLPIKPSEDGALALAMAHVIITKGLWSKEFVGDFKDGKNKFVAGKTVKEEDFEEKLTNGIVKWWNLEVKDRTPKWAAKVTGIDEATIIRVATEFAQAAPACAIWYGPNMQPRGSYAVMCIHALNGLVGASDSEGGLCTGMGSPSSSYPKIDAYQDDVAKAGAKNKKIDQRGTLKFPAMGSAKPGTGVVTNNVADALLAADPYDIKVAIGYFCNFNFSGTDGARWDKALAKVPFFVHCVPMFSEMTYFADIVLPAALHHTEDWAVIRSKANLHGHTSIQQPVVERMFDVKGVETEITWLLAEKLKAKGFENMYNWLYNEYKDPETGKNPTNSLEFALYATKIRSKKCWDPKENAEYKGDKLNGWADFMEKGIVNSPKFKFRQKWEKGFPTETKKFEFYSETLKKGLLAHAEKNKVTVDQVMEATNYEARGELAFIPHYESPKRHGDVKEFPFSLIDMKSRLNREGRSTNATWYHAFKKCDPGDVNQEDVLQINPADAKKLGINEGDMVKVTSVIGSLTVKARLWEGVRPGCVAKCYGQGHFAMGRVSAKDFGKAVARGANFNDIMPADYDRITGATARNGGFTGVKIEKA - ->ArrA_Halarsenatibacter_silvermanii_gb_ACF74513 -MSRNKTSGISRREFLKVMGSTGAALGLGLSATSGNKVLAEEDPYEVLPEGEHKSGEWVPTGCAGCTSWCSLEANVVDGRVIKIRGNSRSKVNGESSCPRSHLSLQQVYDPDRIKRPMKRTNPEKGRDVDPEFVPISWEEAFEEIADKIIELRENGESHKFVLWRGRYTRLRDILYGILPEFVGSPNKISHSSICAEAEKFGPYYTEGYWAYRDYDLQNSDYILIWGTDPIQSNRQVSLYSREWGNILEGARIATVDPRFSRTAAKSNEWLPVKPGEDGALALAMAHVILTEGLWHKEFVGDFVDGENKFTAGEEVDEDEFEENYTHGVVKWWNEELKDRTPEWAADKTGIPAEQIVRVAAEFGEAAPHACVFMGGGGVMQTRGGYNSMAIHGLNGLVGSIDNEGGAVRGASVPNQSFPDHSEFLDDISREGLDHEMIDRRGRLEFPAFKDGESGGGVVTNLSADGIIEEDPYEIKMGIGYWNNFNFAAPETERWDEAMSKLDFYVHLVTHQSEMTQYADIVIPSTHHMFEQWGMLYQKGNLHTHFWLSRPMINRHWELIEPEAEFSWLLAEKLAEKGYSNMLDYFKTIVDPETGEEPEDYREFAKYATKHYMQPVWDPEMESHGDQFDGWEDFKEAGVWNSDEFEFQQYWGEFTNSTGDFEFYSETLKEALEEHAEKHDVSIEEVLEACKYEAEGELAFLPHYEEPYTVGDDEEYPLLLVDSKSALNREGRSANANWYYDLKDIDPGDSTEADVIKIHPRDAEELGLEDGDEVVVSSPAGEITCQLNVWEAVKPGTASKTFGMGHWAYGRVAAEDFADGEPRGGNNNEIIPAEYERLSGSTSFYSHIKVNIERA - ->ArrA_Sulfurospirillum_barnesii_gb_AAU11840 -TSWCPIQGLVVDGKVVKVRGNPNSPSMGRICPRPHLAIQQVYDPDRVKTPLKRTNPKKGKGIDPKFVPISWDEAINTIAEQILGLIKAGESHKFVLMRGRYTHMNEILYNTFPKLIGSPNNISHASICAKTEKFGRYYTEGFWDYADFDLTIPVIFWDGERDMVSSNRQIPWFMNQQGYVKDRAKITIIDPRLSATAAKADRWAPIIPGTDSALAVAIAHVILSEGRWNKSFVGDFQDGKNYFIPGSTVPTEVIVDEKSLPVVFEENHTYGVVAWWNLELKERTPEWAEKITGISAKDIRTIAREFSDAGSKAISWVTTGASMQIRGAYASLAAHALNGLVGSVDAVGGTLQGSXAPSGKTPDIKPYLPAEFEAALKQKKIDQRGTLKLGAFNKKTGGGVVTQQVADSILTDKPYDVKVAIGYWNNFVFSINGANVWEKAMEKLPFYAHITTHLAEMSMXADIVLPAKMHMFERYGFSKNKQNLQGYLTIHQPLVKSFADAKTDETEIPFLIAQALAKKGFDGPLRYFQDNFKDPESGKAPTNPRRVDLYAVKQFTXPIWSGESNEKGDTINSWNELLDKGVWKTKKYKIGKKVDNFATETKKFEFYSETLKKVLIEHAEKNKVTVDEALEALNYTCRGELGFVPHYEEAVRHGDEKTYPFIFAEHRSRLNREGRSQNAPWYYEIKDVDPGDVAGKDVTKINPLDGKKLGLKDGDKIKITSVQGSIESEVKLWEGTRPGT - ->Halorhodospira_halophila_YP_001001949 -MSVLDHLVSRRRFLQATGVGGGAVAAGGVGHLLSFSAGGSHARADGPVGGGETQITKNVCHQCPARCGID -VYTTDGRVHAIYGDPGNPIANGRLCPKGHLGSYILYDPDRFKGPMKRTNPNKGRDEDPQFEAISWDEALG -IVAERLNRLREQEESHRFALMYGRGWGASCAGLLGPFAKLYGTPNVIGHSSMCSDGSMVAKGLTDGNESY -NAYDYRNTNYILNFGAGFLEAFRPYNYLMQVWGHMRTKSPKTRVTAVDVHMNPTLAAADRAVTIKPATDG -AMALAIAHEMLVNGYWDRDFVGDFTDGANRFEAGTEIDPDDFEEVWTQGLIRWWNDELKDRTPEWAESIT -TVPAETIRRVAYEFGTTRPAMAIMERGPTSHSNGTYNGMAIHALNALAGTLFTEGGLFYQMDVPYGDGPA -DPDDYLDDYAGRMQERFDEGEIPRIDKLGTDRWPLARNMMQEVGPNHAAGEPYKLDTILFYLNNPIWTAP -DATAWEEALKDVFIIDTSPFPGETARYADLILPDHTYLERLQDAPTYPFEGYPMTALRTPAVEPLYDTKV -FGDILIEIGKRLDGPAGEYWQAVGDTENLLRHLAEGFRDHPGDNGVEDFESWKAKGVWYKKPYHWKQERG -VFYEWVEDDGDYTHEMSAEEVADKLMPTPSGRFEFFSEKLQEHADFVASEFGIDHERAGLIQWVDPDHPG -GGDLYFSTPKTALHAEGRGANIPHAIAHVQPVMGGRTTVYLEIHPRTARERGIRSGDRVRIVSDVGEIEA -YARLFEGTRPDTVCLPMEHGHWAQGRWAEGRKPGHSGEVTVNQSDRISGLASYYTTKVRVERA - ->Alkalilimnicola_ehrlichii_ABI55571 -MKMILDTLLNRRRFLKATGATGAAAATTAGVGKLAGFTAASTTSTHVNARPGGETRVTKNICHQCPARCG -INVYTTNGRVHAIYGDPGNPIANGKLCPKGHLGTQLLYDPDRFKGPMKRTNPNKGRDEDPEFVPISWDEA -FDIVAERLNRLRERGESHRFAHFYGRGWGSSDAGLYGDFGKLYGTPNSAIGHASMCAEGSKRAKRATDGN -DSYNSYDYRNTNYILNFGAGFLEAFRPYNYLMQVWGHMRTKSPKTRVTTIDVRMNPTMAASDRALMIKPG -TDGALALAIAHVILTEGLWDKEFVGDFEDGRNHFRTGETIIPDAFQANWTHGLAEWWNGELKDRTPEWAE -EITTIPAKHIYTVAREFATTRPAMAIMERGPTAHFNGTYNGMAVHALNALVGSMFAEGGLFYQMGPSYGP -LPVSADDYMDDYAREMQGKHPRIDMAGTEKWPMAGTMMQECAKHHLAGDPYKLDTAMFFVTNPIWTAPDP -RLWEEALKDVFIIDTSPYPGETAMYADIIMPEHTYLERLQDSPTYPFEGWPMAALRTPAVDPVYDTKHFG -DMIIEIGKRINSPMADYYRELGDVENMLRHRAAGFANDPGDNGVNDFESWKEKGVWYKKPYHWRYWRGTF -YEWDGEGYNIEMSEDEVKDKLMPTASGKFEFKSSFLENNANYIAREMGIAEDRVGLIQWVEPRHTGDGDL -HFVTPKTPLHAEGRSANIPQAQAYMQPIVGGRGTCYLEIHPKTAQERGINDGDTVRLSAQVRGETKSILA -VARYMPGHRPDTLVLPMEYGHWAQGRWATAQGRDMKPGHSGDLTENLSDPISGLACYYTAKVRLEKA \ No newline at end of file diff --git a/assets/trees/dmso/dmso.refpkg/dmso_refs.fasta.model b/assets/trees/dmso/dmso.refpkg/dmso_refs.fasta.model deleted file mode 100644 index a39f2545..00000000 --- a/assets/trees/dmso/dmso.refpkg/dmso_refs.fasta.model +++ /dev/null @@ -1,581 +0,0 @@ - - -ProtTest 3.2 Fast selection of the best-fit models of protein evolution -(c) 2009-2010 Diego Darriba (1,2), Guillermo Taboada (2), Ramón Doallo (2), David Posada (1) -(1) Facultad de Biologia, Universidad de Vigo, 36200 Vigo, Spain -(2) Facultade de Informática, Universidade da Coruña, 15071 A Coruña, Spain -Contact: ddarriba@udc.es, dposada@uvigo.es ----------------------------------------------------------------------------------------------- - -Thu Apr 25 13:41:55 MDT 2024 -OS = Linux (3.10.0-1160.88.1.el7.x86_64) - -Citation: Darriba D, Taboada GL, Doallo R, Posada D. ProtTest 3: fast selection of best-fit - models of protein evolution. Bioinformatics, 27:1164-1165, 2011 - - -ProtTest options ----------------- - Alignment file........... : dmso_refs.fasta.phy - Tree..................... : BioNJ - StrategyMode............. : Fixed BIONJ JTT - Candidate models......... : - Matrices............... : JTT LG DCMut MtREV MtMam MtArt Dayhoff WAG RtREV CpREV Blosum62 VT HIVb HIVw FLU - Distributions.......... : Uniform +G +I +I+G - Observed frequencies... : false - - Statistical framework - Sort models according to....: - BIC - Sample size.................: 871.0 (not calculated yet) - Other options: - Display best tree in ASCII..: false - Display best tree in Newick.: false - Display consensus tree......: false - Verbose.....................: false - -********************************************************** -Observed number of invariant sites: 2 -Observed aminoacid frequencies: - A: 0.098 C: 0.011 D: 0.055 E: 0.053 F: 0.033 - G: 0.091 H: 0.024 I: 0.052 K: 0.051 L: 0.078 - M: 0.023 N: 0.041 P: 0.059 Q: 0.032 R: 0.059 - S: 0.052 T: 0.054 V: 0.071 W: 0.025 Y: 0.037 - -********************************************************** - - - -Model................................ : JTT - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 77104.53 - (seconds)) - -Model................................ : JTT+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.004 - -lnL................................ = 77032.91 - (seconds)) - -Model................................ : JTT+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.767 - -lnL................................ = 75965.79 - (seconds)) - -Model................................ : JTT+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.916 - proportion of invariable sites... = 0.003 - -lnL................................ = 75938.30 - (seconds)) - -Model................................ : LG - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 76250.92 - (seconds)) - -Model................................ : LG+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.003 - -lnL................................ = 76186.27 - (seconds)) - -Model................................ : LG+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.812 - -lnL................................ = 75187.90 - (seconds)) - -Model................................ : LG+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.971 - proportion of invariable sites... = 0.003 - -lnL................................ = 75162.49 - (seconds)) - -Model................................ : DCMut - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 77745.30 - (seconds)) - -Model................................ : DCMut+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.004 - -lnL................................ = 77663.69 - (seconds)) - -Model................................ : DCMut+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.545 - -lnL................................ = 76472.93 - (seconds)) - -Model................................ : DCMut+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.719 - proportion of invariable sites... = 0.003 - -lnL................................ = 76442.91 - (seconds)) - -Model................................ : MtREV - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 81641.26 - (seconds)) - -Model................................ : MtREV+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.003 - -lnL................................ = 81620.49 - (seconds)) - -Model................................ : MtREV+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.151 - -lnL................................ = 79797.61 - (seconds)) - -Model................................ : MtREV+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.169 - proportion of invariable sites... = 0.002 - -lnL................................ = 79793.93 - (seconds)) - -Model................................ : MtMam - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 85263.49 - (seconds)) - -Model................................ : MtMam+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.005 - -lnL................................ = 85241.92 - (seconds)) - -Model................................ : MtMam+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 1.35 - -lnL................................ = 82190.94 - (seconds)) - -Model................................ : MtMam+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 1.351 - proportion of invariable sites... = 0.001 - -lnL................................ = 82190.85 - (seconds)) - -Model................................ : MtArt - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 83730.92 - (seconds)) - -Model................................ : MtArt+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.003 - -lnL................................ = 83711.55 - (seconds)) - -Model................................ : MtArt+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 1.408 - -lnL................................ = 80931.73 - (seconds)) - -Model................................ : MtArt+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 1.414 - proportion of invariable sites... = 0.001 - -lnL................................ = 80929.13 - (seconds)) - -Model................................ : Dayhoff - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 77755.96 - (seconds)) - -Model................................ : Dayhoff+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.004 - -lnL................................ = 77674.16 - (seconds)) - -Model................................ : Dayhoff+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.536 - -lnL................................ = 76479.03 - (seconds)) - -Model................................ : Dayhoff+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.709 - proportion of invariable sites... = 0.003 - -lnL................................ = 76448.96 - (seconds)) - -Model................................ : WAG - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 76009.19 - (seconds)) - -Model................................ : WAG+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.003 - -lnL................................ = 75929.91 - (seconds)) - -Model................................ : WAG+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 3.468 - -lnL................................ = 75177.79 - (seconds)) - -Model................................ : WAG+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 3.74 - proportion of invariable sites... = 0.003 - -lnL................................ = 75142.56 - (seconds)) - -Model................................ : RtREV - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 76648.25 - (seconds)) - -Model................................ : RtREV+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.003 - -lnL................................ = 76576.75 - (seconds)) - -Model................................ : RtREV+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 3.027 - -lnL................................ = 75659.47 - (seconds)) - -Model................................ : RtREV+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 3.245 - proportion of invariable sites... = 0.003 - -lnL................................ = 75630.40 - (seconds)) - -Model................................ : CpREV - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 77052.70 - (seconds)) - -Model................................ : CpREV+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.004 - -lnL................................ = 76973.87 - (seconds)) - -Model................................ : CpREV+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 3.08 - -lnL................................ = 76046.86 - (seconds)) - -Model................................ : CpREV+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 3.267 - proportion of invariable sites... = 0.003 - -lnL................................ = 76014.06 - (seconds)) - -Model................................ : Blosum62 - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 75915.50 - (seconds)) - -Model................................ : Blosum62+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.003 - -lnL................................ = 75849.78 - (seconds)) - -Model................................ : Blosum62+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 4.24 - -lnL................................ = 75230.55 - (seconds)) - -Model................................ : Blosum62+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 4.538 - proportion of invariable sites... = 0.003 - -lnL................................ = 75199.67 - (seconds)) - -Model................................ : VT - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 75962.73 - (seconds)) - -Model................................ : VT+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.003 - -lnL................................ = 75896.24 - (seconds)) - -Model................................ : VT+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 3.669 - -lnL................................ = 75166.63 - (seconds)) - -Model................................ : VT+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 3.909 - proportion of invariable sites... = 0.003 - -lnL................................ = 75137.60 - (seconds)) - -Model................................ : HIVb - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 79715.18 - (seconds)) - -Model................................ : HIVb+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.004 - -lnL................................ = 79632.32 - (seconds)) - -Model................................ : HIVb+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.407 - -lnL................................ = 78258.49 - (seconds)) - -Model................................ : HIVb+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.558 - proportion of invariable sites... = 0.003 - -lnL................................ = 78228.20 - (seconds)) - -Model................................ : HIVw - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 83544.07 - (seconds)) - -Model................................ : HIVw+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.005 - -lnL................................ = 83433.56 - (seconds)) - -Model................................ : HIVw+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.2 - -lnL................................ = 81960.13 - (seconds)) - -Model................................ : HIVw+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.373 - proportion of invariable sites... = 0.003 - -lnL................................ = 81919.21 - (seconds)) - -Model................................ : FLU - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 79156.27 - (seconds)) - -Model................................ : FLU+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.004 - -lnL................................ = 79066.08 - (seconds)) - -Model................................ : FLU+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.477 - -lnL................................ = 77863.83 - (seconds)) - -Model................................ : FLU+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.635 - proportion of invariable sites... = 0.003 - -lnL................................ = 77828.33 - (seconds)) - -************************************************************ -Date : Thu Apr 25 17:59:51 MDT 2024 -Runtime: 4h:17:51 - - - -*************************************************************************** -Best model according to BIC: VT+I+G -Confidence Interval: 100.0 -*************************************************************************** -Model deltaBIC BIC BICw -lnL ---------------------------------------------------------------------------- -VT+I+G 0.00 151432.82 0.99 75137.60 -WAG+I+G 9.91 151442.73 0.01 75142.56 -LG+I+G 49.77 151482.59 0.00 75162.49 -VT+G 51.28 151484.10 0.00 75166.63 -WAG+G 73.60 151506.42 0.00 75177.79 -LG+G 93.82 151526.64 0.00 75187.90 -Blosum62+I+G 124.12 151556.94 0.00 75199.67 -Blosum62+G 179.11 151611.93 0.00 75230.55 -RtREV+I+G 985.58 152418.40 0.00 75630.40 -RtREV+G 1036.96 152469.78 0.00 75659.47 -Blosum62+I 1417.58 152850.40 0.00 75849.78 -VT+I 1510.51 152943.33 0.00 75896.24 -Blosum62 1542.26 152975.07 0.00 75915.50 -WAG+I 1577.84 153010.66 0.00 75929.91 -JTT+I+G 1601.38 153034.20 0.00 75938.30 -VT 1636.72 153069.53 0.00 75962.73 -JTT+G 1649.60 153082.42 0.00 75965.79 -WAG 1729.64 153162.45 0.00 76009.19 -CpREV+I+G 1752.92 153185.74 0.00 76014.06 -CpREV+G 1811.75 153244.56 0.00 76046.86 -LG+I 2090.56 153523.38 0.00 76186.27 -LG 2213.09 153645.91 0.00 76250.92 -DCMut+I+G 2610.62 154043.43 0.00 76442.91 -Dayhoff+I+G 2622.71 154055.53 0.00 76448.96 -DCMut+G 2663.88 154096.70 0.00 76472.93 -Dayhoff+G 2676.07 154108.89 0.00 76479.03 -RtREV+I 2871.53 154304.35 0.00 76576.75 -RtREV 3007.75 154440.57 0.00 76648.25 -CpREV+I 3665.77 155098.59 0.00 76973.87 -JTT+I 3783.85 155216.67 0.00 77032.91 -CpREV 3816.66 155249.48 0.00 77052.70 -JTT 3920.31 155353.13 0.00 77104.53 -DCMut+I 5045.40 156478.22 0.00 77663.69 -Dayhoff+I 5066.34 156499.15 0.00 77674.16 -DCMut 5201.86 156634.68 0.00 77745.30 -Dayhoff 5223.18 156655.99 0.00 77755.96 -FLU+I+G 5381.44 156814.26 0.00 77828.33 -FLU+G 5445.67 156878.49 0.00 77863.83 -HIVb+I+G 6181.20 157614.02 0.00 78228.20 -HIVb+G 6235.01 157667.82 0.00 78258.49 -FLU+I 7850.18 159283.00 0.00 79066.08 -FLU 8023.79 159456.61 0.00 79156.27 -HIVb+I 8982.66 160415.48 0.00 79632.32 -HIVb 9141.61 160574.43 0.00 79715.18 -MtREV+I+G 9312.65 160745.47 0.00 79793.93 -MtREV+G 9313.23 160746.05 0.00 79797.61 -MtArt+G 11581.48 163014.30 0.00 80931.73 -MtArt+I+G 11583.06 163015.87 0.00 80929.13 -MtREV+I 12958.99 164391.81 0.00 81620.49 -MtREV 12993.76 164426.58 0.00 81641.26 -HIVw+I+G 13563.22 164996.03 0.00 81919.21 -HIVw+G 13638.29 165071.10 0.00 81960.13 -MtMam+G 14099.91 165532.73 0.00 82190.94 -MtMam+I+G 14106.49 165539.31 0.00 82190.85 -HIVw+I 16585.14 168017.96 0.00 83433.56 -HIVw 16799.38 168232.20 0.00 83544.07 -MtArt+I 17141.12 168573.94 0.00 83711.55 -MtArt 17173.09 168605.91 0.00 83730.92 -MtMam+I 20201.87 171634.68 0.00 85241.92 -MtMam 20238.23 171671.04 0.00 85263.49 ---------------------------------------------------------------------------- ---------------------------------------------------------------------------- -*********************************************** -Relative importance of parameters -*********************************************** - alpha (+G): 0.000 - p-inv (+I): 0.000 - alpha+p-inv (+I+G): 1.000 - freqs (+F): No +F models - -*********************************************** -Model-averaged estimate of parameters -*********************************************** - alpha (+G): 3.669 - p-inv (+I): NaN - alpha (+I+G): 3.908 - p-inv (+I+G): 0.003 - -*************************************************************************** -Best model according to LnL: VT+I+G -Confidence Interval: 100.0 -*************************************************************************** -Model deltaLnL LnL LnLw -lnL ---------------------------------------------------------------------------- -VT+I+G 0.00 75137.60 0.92 75137.60 -WAG+I+G 4.96 75142.56 0.08 75142.56 -LG+I+G 24.89 75162.49 0.00 75162.49 -VT+G 29.02 75166.63 0.00 75166.63 -WAG+G 40.18 75177.79 0.00 75177.79 -LG+G 50.30 75187.90 0.00 75187.90 -Blosum62+I+G 62.06 75199.67 0.00 75199.67 -Blosum62+G 92.94 75230.55 0.00 75230.55 -RtREV+I+G 492.79 75630.40 0.00 75630.40 -RtREV+G 521.86 75659.47 0.00 75659.47 -Blosum62+I 712.17 75849.78 0.00 75849.78 -VT+I 758.64 75896.24 0.00 75896.24 -Blosum62 777.90 75915.50 0.00 75915.50 -WAG+I 792.30 75929.91 0.00 75929.91 -JTT+I+G 800.69 75938.30 0.00 75938.30 -VT 825.13 75962.73 0.00 75962.73 -JTT+G 828.18 75965.79 0.00 75965.79 -WAG 871.59 76009.19 0.00 76009.19 -CpREV+I+G 876.46 76014.06 0.00 76014.06 -CpREV+G 909.26 76046.86 0.00 76046.86 -LG+I 1048.67 76186.27 0.00 76186.27 -LG 1113.32 76250.92 0.00 76250.92 -DCMut+I+G 1305.31 76442.91 0.00 76442.91 -Dayhoff+I+G 1311.35 76448.96 0.00 76448.96 -DCMut+G 1335.33 76472.93 0.00 76472.93 -Dayhoff+G 1341.42 76479.03 0.00 76479.03 -RtREV+I 1439.15 76576.75 0.00 76576.75 -RtREV 1510.64 76648.25 0.00 76648.25 -CpREV+I 1836.27 76973.87 0.00 76973.87 -JTT+I 1895.31 77032.91 0.00 77032.91 -CpREV 1915.10 77052.70 0.00 77052.70 -JTT 1966.93 77104.53 0.00 77104.53 -DCMut+I 2526.09 77663.69 0.00 77663.69 -Dayhoff+I 2536.55 77674.16 0.00 77674.16 -DCMut 2607.70 77745.30 0.00 77745.30 -Dayhoff 2618.36 77755.96 0.00 77755.96 -FLU+I+G 2690.72 77828.33 0.00 77828.33 -FLU+G 2726.22 77863.83 0.00 77863.83 -HIVb+I+G 3090.60 78228.20 0.00 78228.20 -HIVb+G 3120.89 78258.49 0.00 78258.49 -FLU+I 3928.48 79066.08 0.00 79066.08 -FLU 4018.67 79156.27 0.00 79156.27 -HIVb+I 4494.71 79632.32 0.00 79632.32 -HIVb 4577.57 79715.18 0.00 79715.18 -MtREV+I+G 4656.32 79793.93 0.00 79793.93 -MtREV+G 4660.00 79797.61 0.00 79797.61 -MtArt+I+G 5791.53 80929.13 0.00 80929.13 -MtArt+G 5794.12 80931.73 0.00 80931.73 -MtREV+I 6482.88 81620.49 0.00 81620.49 -MtREV 6503.65 81641.26 0.00 81641.26 -HIVw+I+G 6781.61 81919.21 0.00 81919.21 -HIVw+G 6822.53 81960.13 0.00 81960.13 -MtMam+I+G 7053.25 82190.85 0.00 82190.85 -MtMam+G 7053.34 82190.94 0.00 82190.94 -HIVw+I 8295.95 83433.56 0.00 83433.56 -HIVw 8406.46 83544.07 0.00 83544.07 -MtArt+I 8573.95 83711.55 0.00 83711.55 -MtArt 8593.32 83730.92 0.00 83730.92 -MtMam+I 10104.32 85241.92 0.00 85241.92 -MtMam 10125.88 85263.49 0.00 85263.49 ---------------------------------------------------------------------------- ---------------------------------------------------------------------------- -*********************************************** -Relative importance of parameters -*********************************************** - alpha (+G): 0.000 - p-inv (+I): 0.000 - alpha+p-inv (+I+G): 1.000 - freqs (+F): No +F models - -*********************************************** -Model-averaged estimate of parameters -*********************************************** - alpha (+G): 3.668 - p-inv (+I): 0.003 - alpha (+I+G): 3.896 - p-inv (+I+G): 0.003 diff --git a/assets/trees/dmso/dmso.refpkg/dmso_search_terms.txt b/assets/trees/dmso/dmso.refpkg/dmso_search_terms.txt deleted file mode 100644 index 47ec8bde..00000000 --- a/assets/trees/dmso/dmso.refpkg/dmso_search_terms.txt +++ /dev/null @@ -1,12 +0,0 @@ -K00370 -K00371 -K00374 -nitrate reductase -nar -NAR -narG -narH -narI -narJ -EC: 1.7.99.4 -EC: 1.7.5.1 diff --git a/assets/trees/nar_nxr/nar_nxr-tree-mapping.tsv b/assets/trees/nar_nxr/nar_nxr-tree-mapping.tsv deleted file mode 100644 index d7836d63..00000000 --- a/assets/trees/nar_nxr/nar_nxr-tree-mapping.tsv +++ /dev/null @@ -1,76 +0,0 @@ -gene call -sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_397025_1 other-None -riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.130_k121_990031_60 other-None -providencecreek_2019_sw_WHONDRS-S19S_0007_B_bin.10_k121_1581149_4 other-None -NASQAN2015_111_B_bin.76_k121_226837_116 other-None -NASQAN2014_190_B_bin.96_k121_3766_2 other-None -muddycreek_2019_sw_WHONDRS-S19S_0082_B_bin.95_k121_853774_5 other-None -icacos_2019_sw_WHONDRS-S19S_0094_F_bin.26_scaffold_99_5 other-None -icacos_2019_sw_WHONDRS-S19S_0094_B_bin.166_k121_1114214_14 other-None -greatmiami_2019_sw_WHONDRS-S19S_0099_F_bin.30_scaffold_496_3 other-None -flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_1443778_1 other-None -flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0000472_14 other-None -flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_3 other-None -flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_4 other-None -flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001772_1 other-None -sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_391728_1 nxr-None -riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.137_k121_1578656_32 nxr-Nitrifier -riogrande_2019_sw_WHONDRS-S19S_0066_A_bin.62_Ga0451725_0007910_5 nxr-Nitrifier -flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_237162_4 nxr-Nitrifier -blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1348658_11 nxr-Nitrifier -blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1581374_9 nxr-Nitrifier -NASQAN2011_330_B_bin.17_k121_430440_3 nxr/nar-N utilization -gunnisonriver_2019_sw_WHONDRS-S19S_0062_A_bin.22_Ga0451722_0001801_3 nxr/nar-N utilization -flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001351_7 nxr/nar-N utilization -Yukon_2004-1_F_bin.10_scaffold_25058_1 narG-N reducer -Yukon_2004-1_F_bin.10_scaffold_678_1 narG-N reducer -yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_2728883_1 narG-N reducer -yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_3072591_1 narG-N reducer -whiteclaycreek2_2019_sw_WHONDRS-S19S_0038_B_bin.50_k121_1710496_1 narG-N reducer -watershed3_2019_sw_WHONDRS-S19S_0084_F_bin.6_scaffold_35_30 narG-N reducer -watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_1345490_1 narG-N reducer -watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_924190_1 narG-N reducer -watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.45_k121_975195_1 narG-N reducer -watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.15_k121_1272084_2 narG-N reducer -watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0000093_1 narG-N reducer -watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0001905_7 narG-N reducer -nebranchanacostia_2019_sw_WHONDRS-S19S_0081_B_bin.6_k121_1546998_5 narG-N reducer -NASQAN2016_164_F_bin.17_scaffold_1152_1 narG-N reducer -NASQAN2016_164_F_bin.17_scaffold_8891_2 narG-N reducer -NASQAN2015_227_F_bin.21_scaffold_2406_1 narG-N reducer -NASQAN2015_227_F_bin.21_scaffold_4919_3 narG-N reducer -NASQAN2015_227_B_bin.17_k121_559871_7 narG-N reducer -NASQAN2015_172_B_bin.54_k121_327740_1 narG-N reducer -NASQAN2015_010_A_bin.16_Ga0466474_000034_25 narG-N reducer -NASQAN2011_286_F_bin.29_scaffold_54_27 narG-N reducer -NASQAN2011_286_B_bin.1_k121_764018_13 narG-N reducer -NASQAN2011_265_B_bin.52_k121_465271_4 narG-N reducer -NASQAN2011_265_B_bin.52_k121_959771_6 narG-N reducer -NASQAN2011_028_B_bin.24_k121_53788_5 narG-N reducer -logan1_2019_sw_WHONDRS-S19S_0097_B_bin.20_k121_1372227_2 narG-N reducer -littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_6 narG-N reducer -littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_7 narG-N reducer -lewisrun_2019_sw_WHONDRS-S19S_0014_F_bin.22_scaffold_791_5 narG-N reducer -lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.6_k121_1211148_1 narG-N reducer -lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.30_k121_510322_1 narG-N reducer -lecontecreek_2019_sw_WHONDRS-S19S_0018_F_bin.2_scaffold_1_206 narG-N reducer -lecontecreek_2019_sw_WHONDRS-S19S_0018_A_bin.2_Ga0451754_0000231_3 narG-N reducer -king_2019_sw_WHONDRS-S19S_0016_B_bin.5_k121_1281127_1 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.3_scaffold_11088_2 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.19_scaffold_731_2 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_201_6 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4056_4 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4528_3 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_3271_6 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_493_9 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.12_scaffold_10959_2 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.10_scaffold_7566_1 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.46_k121_495423_17 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_1186915_16 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_2341297_11 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0000931_1 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0004490_1 narG-N reducer -eastforkpoplarcreek_2019_sw_WHONDRS-S19S_0039_B_bin.13_k121_238651_23 narG-N reducer -cobbmillcreek_2019_sw_WHONDRS-S19S_0090_B_bin.15_k121_168873_1 narG-N reducer -cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.23_Ga0451756_0000618_5 narG-N reducer -cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.17_Ga0451756_0000169_17 narG-N reducer diff --git a/assets/trees/nar_nxr/nar_nxr.refpkg/CONTENTS.json b/assets/trees/nar_nxr/nar_nxr.refpkg/CONTENTS.json deleted file mode 100644 index 5050a094..00000000 --- a/assets/trees/nar_nxr/nar_nxr.refpkg/CONTENTS.json +++ /dev/null @@ -1,25 +0,0 @@ -{ - "files": { - "aln_fasta": "nar_nxr_seqs_for_tree_aligned.faa", - "phylo_model": "phylo_modelNQB2rG.json", - "tree": "nar_nxr.tre", - "tree_stats": "RAxML_info.nxr_nar_raxml" - }, - "rollback": null, - "log": [ - "Stripped refpkg (removed 0 files)", - "Loaded initial files into empty refpkg" - ], - "metadata": { - "create_date": "2022-08-01 19:38:05", - "format_version": "1.1", - "locus": "16s_rRNA" - }, - "rollforward": null, - "md5": { - "aln_fasta": "e8299c2a452284b846fbe1954d731e61", - "phylo_model": "8ddf52f289613477eb526cf7accab5f0", - "tree": "21dd28b872d3f481dee55388c088ebc0", - "tree_stats": "0dd942d28693dd101dbc1c19e8e95c30" - } -} diff --git a/assets/trees/nar_nxr/nar_nxr.refpkg/RAxML_info.nar_nxr_raxml b/assets/trees/nar_nxr/nar_nxr.refpkg/RAxML_info.nar_nxr_raxml deleted file mode 100644 index 00d9db3d..00000000 --- a/assets/trees/nar_nxr/nar_nxr.refpkg/RAxML_info.nar_nxr_raxml +++ /dev/null @@ -1,95 +0,0 @@ - - -IMPORTANT WARNING: Sequences g_8 and g_9 are exactly identical - - -IMPORTANT WARNING: Sequences g_11 and g_12 are exactly identical - - -IMPORTANT WARNING: Sequences g_13 and g_14 are exactly identical - - -IMPORTANT WARNING: Sequences g_40 and g_41 are exactly identical - - -IMPORTANT WARNING: Sequences g_43 and g_44 are exactly identical - - -IMPORTANT WARNING: Sequences g_60 and g_61 are exactly identical - - -IMPORTANT WARNING: Sequences g_76 and g_77 are exactly identical - - -IMPORTANT WARNING: Sequences g_82 and g_83 are exactly identical - -IMPORTANT WARNING -Found 8 sequences that are exactly identical to other sequences in the alignment. -Normally they should be excluded from the analysis. - -An alignment file with sequence duplicates removed has already -been printed to file /home/projects-wrighton-2/GROWdb/USAfocus_FinalBins110121/dereplicated_bin_analyses/metabolism/nxr_nar//nxr-nar_seqs_for_tree_aligned.faa.phy.reduced - - -This is RAxML version 7.7.2 released by Alexandros Stamatakis on July 31 2013. - -With greatly appreciated code contributions by: -Andre Aberer (HITS) -Simon Berger (HITS) -Nick Pattengale (Sandia) -Wayne Pfeiffer (SDSC) -Akifumi S. Tanabe (NRIFS) - - -Alignment has 1565 distinct alignment patterns - -Proportion of gaps and completely undetermined characters in this alignment: 40.94% - -RAxML rapid hill-climbing mode - -Using 1 distinct models/data partitions with joint branch length optimization - - -Executing 1 inferences on the original alignment using 1 distinct randomized MP trees - -All free model parameters will be estimated by RAxML -GAMMA model of rate heteorgeneity, ML estimate of alpha-parameter - -GAMMA Model parameters will be estimated up to an accuracy of 0.1000000000 Log Likelihood units - -Partition: 0 -Alignment Patterns: 1565 -Name: No Name Provided -DataType: AA -Substitution Matrix: WAG -Using empirical base frequencies - - - - -RAxML was called as follows: - -raxmlHPC -m PROTGAMMAWAGF -n nxr_nar_raxml -s /home/projects-wrighton-2/GROWdb/USAfocus_FinalBins110121/dereplicated_bin_analyses/metabolism/nxr_nar//nxr-nar_seqs_for_tree_aligned.faa.phy -p 11 - - -Partition: 0 with name: No Name Provided -Base frequencies: 0.073 0.060 0.047 0.065 0.011 0.031 0.053 0.083 0.031 0.048 0.064 0.059 0.031 0.036 0.057 0.050 0.060 0.030 0.049 0.063 - -Inference[0]: Time 7855.233752 GAMMA-based likelihood -104967.862139, best rearrangement setting 5 -alpha[0]: 1.530755 - - -Conducting final model optimizations on all 1 trees under GAMMA-based models .... - -Inference[0] final GAMMA-based Likelihood: -104967.862114 tree written to file /home/projects-wrighton-2/DRAM/scratch_space_flynn/jul_27_22_trees/second_try/RAxML_result.nxr_nar_raxml - - -Starting final GAMMA-based thorough Optimization on tree 0 likelihood -104967.862114 .... - -Final GAMMA-based Score of best tree -104967.862114 - -Program execution info written to /home/projects-wrighton-2/DRAM/scratch_space_flynn/jul_27_22_trees/second_try/RAxML_info.nxr_nar_raxml -Best-scoring ML tree written to: /home/projects-wrighton-2/DRAM/scratch_space_flynn/jul_27_22_trees/second_try/RAxML_bestTree.nxr_nar_raxml - -Overall execution time: 11244.438291 secs or 3.123455 hours or 0.130144 days - diff --git a/assets/trees/nar_nxr/nar_nxr.refpkg/nar_nxr.tre b/assets/trees/nar_nxr/nar_nxr.refpkg/nar_nxr.tre deleted file mode 100644 index 72500eef..00000000 --- a/assets/trees/nar_nxr/nar_nxr.refpkg/nar_nxr.tre +++ /dev/null @@ -1 +0,0 @@ -(OOP57237|Brocadia_caroliniensis:0.010806074,(RIK02127|Brocadia_sp:0.000910858,(KKO18748|Brocadia_fulgida:0.000000005,OQZ00558|Brocadia_sp_UTAMX2:0.000914005)0.781:0.000917034)0.992:0.013579216,(WP_052562588|Brocadia_sinica:0.009341785,(OHB44699|Planctomycetes_bacterium_GWE2_41_14:0.028539476,((WP_070066136|Brocadia_sapporoensis:0.005501886,RZV59451|Brocadia_sp_BROELEC01:0.002673850)1.000:0.025826757,((((OHB72803|Planctomycetes_bacterium_RBG_16_41_13:0.009726587,(WP_099324707|Kuenenia_stuttgartiensis:0.000917459,NxrA_Candidatus_K_stuttgartiensis_CAJ72445:0.000000005)0.998:0.017229244)1.000:0.098072241,((((RBG1_10:0.249943905,((GCA_001803565_00046|MHDQ01000004unannotatedprotein:0.399259377,((BBJ23760|Nitrotoga_sp_AM1:0.0,BBJ23368|Nitrotoga_sp_AM1:0.0):0.003761140,((RFC31618|Nitrotoga_sp_SPKER:0.006020303,((SPS06998|Nitrotoga_fabula:0.0,SPS06751|Nitrotoga_fabula:0.0):0.042255811,(RFC37636|Nitrotoga_sp_CP45:0.000000005,(RFC33776|Nitrotoga_sp_LAW:0.000000005,RFC30723|Nitrotoga_sp_MKT:0.001768416)0.953:0.002651540)0.916:0.006621566)0.695:0.008594937)0.950:0.008908972,BBJ23476|Nitrotoga_sp_AM1:0.013693167)0.440:0.001391552)1.000:0.666812638)1.000:0.321755680,((((greatmiami_2019_sw_WHONDRS-S19S_0099_F_bin.30_scaffold_496_3:0.011379394,(NASQAN2014_190_B_bin.96_k121_3766_2:0.017081478,(NASQAN2015_111_B_bin.76_k121_226837_116:0.021392246,icacos_2019_sw_WHONDRS-S19S_0094_F_bin.26_scaffold_99_5:0.002525334)0.985:0.013886431)0.102:0.014633186)1.000:1.045689577,((flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0000472_14:0.290495020,flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001772_1:0.289900857)1.000:0.977544665,(flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_3:0.182186058,flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_4:0.220237367)1.000:0.733397499)0.485:0.198655286)0.560:0.125080923,(flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_1443778_1:0.429037937,(sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_397025_1:0.433198646,((NASQAN2011_330_B_bin.17_k121_430440_3:0.641466723,(flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001351_7:0.393884505,(gunnisonriver_2019_sw_WHONDRS-S19S_0062_A_bin.22_Ga0451722_0001801_3:0.324547720,((watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_924190_1:0.157095605,((whiteclaycreek2_2019_sw_WHONDRS-S19S_0038_B_bin.50_k121_1710496_1:0.167523285,(NASQAN2011_265_B_bin.52_k121_959771_6:0.026017376,NASQAN2011_265_B_bin.52_k121_465271_4:0.000000008)0.818:0.115349202)1.000:0.087988271,(logan1_2019_sw_WHONDRS-S19S_0097_B_bin.20_k121_1372227_2:0.159911107,(lewisrun_2019_sw_WHONDRS-S19S_0014_F_bin.22_scaffold_791_5:0.020931878,(watershed3_2019_sw_WHONDRS-S19S_0084_F_bin.6_scaffold_35_30:0.032515342,lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.6_k121_1211148_1:0.071100891)0.951:0.024998611)0.985:0.042982912)1.000:0.086501401)0.986:0.042923050)1.000:0.086203118,(((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_3271_6:0.320376687,(flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_493_9:0.147904578,(nebranchanacostia_2019_sw_WHONDRS-S19S_0081_B_bin.6_k121_1546998_5:0.099435688,lecontecreek_2019_sw_WHONDRS-S19S_0018_A_bin.2_Ga0451754_0000231_3:0.013429712)1.000:0.121234242)0.749:0.040234813)0.863:0.055442056,((king_2019_sw_WHONDRS-S19S_0016_B_bin.5_k121_1281127_1:0.156531059,NASQAN2015_010_A_bin.16_Ga0466474_000034_25:0.177178519)0.992:0.044604086,((((NarG_Escherichia_coli_NP_415742:0.203008887,NarG_Halomonas_maura_gb_AAT47523:0.153894902)0.981:0.047232779,watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0000093_1:0.311887965)0.998:0.063567006,((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_201_6:0.106781950,(NASQAN2011_286_B_bin.1_k121_764018_13:0.005660724,NASQAN2011_286_F_bin.29_scaffold_54_27:0.000000005)1.000:0.123919793)1.000:0.131403606,(NarG_Pseudomonas_stutzeri_gb_AAZ43099:0.046987015,(NarG_Pseudomonas_fluorescens_gb_AEV63780:0.078508524,(flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_1186915_16:0.074914222,flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_2341297_11:0.000000008)0.885:0.078978122)0.708:0.032866426)1.000:0.168519259)0.242:0.019184033)0.998:0.047390479,(flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0000931_1:0.199222465,((littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_6:0.090260755,(littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_7:0.175888927,watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.15_k121_1272084_2:0.078834694)0.544:0.015106087)0.765:0.040298684,flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0004490_1:0.189261863)0.493:0.037097247)1.000:0.139855980)0.732:0.020426298)0.995:0.035229012)0.458:0.027215325,((((((NASQAN2015_172_B_bin.54_k121_327740_1:0.048321373,((cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.17_Ga0451756_0000169_17:0.003316375,Yukon_2004-1_F_bin.10_scaffold_678_1:0.110287220)0.999:0.034293344,(cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.23_Ga0451756_0000618_5:0.010147982,(NASQAN2015_227_F_bin.21_scaffold_4919_3:0.024300445,NASQAN2011_028_B_bin.24_k121_53788_5:0.000000005)0.990:0.014294289)0.365:0.007073108)0.988:0.017900532)0.950:0.016382079,(watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.45_k121_975195_1:0.104162330,flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.10_scaffold_7566_1:0.054766712)0.871:0.041502925)1.000:0.076566993,((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4056_4:0.104610952,((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.19_scaffold_731_2:0.070583667,eastforkpoplarcreek_2019_sw_WHONDRS-S19S_0039_B_bin.13_k121_238651_23:0.043655384)1.000:0.048776638,((yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_2728883_1:0.089459252,cobbmillcreek_2019_sw_WHONDRS-S19S_0090_B_bin.15_k121_168873_1:0.023635532)0.326:0.001148673,lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.30_k121_510322_1:0.090302159)0.885:0.013388066)0.878:0.032405321)0.565:0.021969185,((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.12_scaffold_10959_2:0.152164297,(NASQAN2016_164_F_bin.17_scaffold_1152_1:0.081072836,NASQAN2015_227_F_bin.21_scaffold_2406_1:0.055593684)0.976:0.109893377)0.649:0.067627453,flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.3_scaffold_11088_2:0.064995222)0.815:0.039464533)0.963:0.029952893)0.148:0.015135463,flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.46_k121_495423_17:0.129369944)0.861:0.019065424,(((watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_1345490_1:0.392541235,yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_3072591_1:0.171599398)0.840:0.248083204,((Yukon_2004-1_F_bin.10_scaffold_25058_1:0.105822798,NASQAN2016_164_F_bin.17_scaffold_8891_2:0.030238438)0.312:0.015380827,NASQAN2015_227_B_bin.17_k121_559871_7:0.039959075)0.928:0.056585084)0.234:0.007394197,(watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0001905_7:0.604640728,flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4528_3:0.181397923)0.845:0.147304633)0.903:0.041551231)0.908:0.028658570,lecontecreek_2019_sw_WHONDRS-S19S_0018_F_bin.2_scaffold_1_206:0.136445862)1.000:0.145006781)0.508:0.034596552)0.999:0.098317003)0.563:0.079911427)0.999:0.168588838)0.985:0.135263217,(CRI68048|Thiocapsa_sp_KS1:1.094261762,(flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_237162_4:0.488541056,(sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_391728_1:0.401066831,((GCA_003453735_00577|DMNE01000186unannotatedprotein:0.309801231,(((AFN37208|Nitrolancea_hollandica_Lb:0.039042664,AFN37205|Nitrolancea_hollandica_Lb:0.011623567)0.981:0.018883572,(AFN37207|Nitrolancea_hollandica_Lb:0.059889634,AFN37206|Nitrolancea_hollandica_Lb:0.035086850)0.741:0.017421853)1.000:0.237080104,((WP_005004540|Nitrococcus_mobilis:0.005243894,Nitrococcus_mobi_EAR23355:0.002640284)1.000:0.244172179,((WP_011314088|Nitrobacter_winogradskyi:0.002534990,(Nitrobacter_sp_Nb_311A_ZP_01048070:0.009400785,(A_Nitrobacter_hamburgensis_YP_578638:0.031550923,B_Nitrobacter_hamburgensis_YP_578186:0.023740548)1.000:0.053836401)0.978:0.022733577)0.963:0.016265428,Nitrobacter_winogradskyi_gb_ABA05326:0.037260949)1.000:0.216806507)0.880:0.055888930)1.000:0.201356108)0.974:0.063994885,(blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1348658_11:0.000000005,blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1581374_9:0.000000005)1.000:0.282418622)0.992:0.095642727)0.132:0.041822075)0.986:0.188699247)0.017:0.049701189)0.871:0.184584331)0.173:0.116759705)1.000:0.987285179)0.550:0.236304701,(providencecreek_2019_sw_WHONDRS-S19S_0007_B_bin.10_k121_1581149_4:0.472026440,(riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.130_k121_990031_60:0.325258151,(icacos_2019_sw_WHONDRS-S19S_0094_B_bin.166_k121_1114214_14:0.332187014,muddycreek_2019_sw_WHONDRS-S19S_0082_B_bin.95_k121_853774_5:0.705095308)0.418:0.106182937)0.994:0.312896913)1.000:0.774651657)1.000:0.778950754)0.975:0.154198707)1.000:0.231811834,((((cas150m_01921|CAS-150m-3753Perchloratereductasesubunitalphaprecursor:0.000877951,cas50m_02313|CAS-50m-4275Perchloratereductasesubunitalphaprecursor:0.000943888)1.000:0.055806636,(GCA_003523945_00056|DOFS01000023unannotatedprotein:0.004579427,DJ_nxrA:0.006504779)0.999:0.028051194)0.999:0.046515340,(DJ_nxrA2:0.074233359,DJ_nxrA1:0.060036576)0.694:0.026270877)0.990:0.045759227,(((((WP_053378142|Nitrospira_moscoviensis:0.008325164,(riogrande_2019_sw_WHONDRS-S19S_0066_A_bin.62_Ga0451725_0007910_5:0.012480447,GCA_002083555_01644|MSXN01000007unannotatedprotein:0.002680030)0.924:0.008235322)0.880:0.003077004,(((GCA_002420115_02525|DIHK01000043unannotatedprotein:0.012092376,GCA_002483475_03556|DLHZ01000062unannotatedprotein:0.002691200)1.000:0.023236403,(GCA_900078535_00262|FJVM02000053unannotatedprotein:0.014982211,(GCA_001458695_00808|LN885086unannotatedprotein:0.023036213,GCA_002451055_00821|DKBD01000269unannotatedprotein:0.007573759)0.688:0.003976613)0.390:0.001522946)0.694:0.004052451,GCA_002331335_02310|DCZO01000011unannotatedprotein:0.017101140)0.922:0.006393889)0.980:0.016473529,(riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.137_k121_1578656_32:0.002308752,GCA_002737345_00863|NSIK01000010unannotatedprotein:0.006832549)1.000:0.023034521)0.393:0.016407361,WP_080886776|Nitrospira_japonica:0.032980329)1.000:0.048957408,(((Baikal-deep-G159_00763|Baikal-deep-G159-c12unannotatedprotein:0.0,Baikal-deep-G158_01775|Baikal-deep-G158-c18unannotatedprotein:0.0):0.048648714,((CBK42946|Nitrospira_defluvii:0.0,NxrA2_Nitrospira_defluvii_YP_003798871:0.0):0.003132849,GCA_900170025_02937|FWEX01000006unannotatedprotein:0.002326236)1.000:0.046043049)0.987:0.028241355,((CUS31266|Nitrospira_nitrosa:0.032070423,CUS38776|Nitrospira_nitrificans:0.014206130)1.000:0.059565512,(GCA_001567445_02228|JZQY01000048unannotatedprotein:0.031898730,((CBK42928|Nitrospira_defluvii:0.0,NxrA1_Nitrospira_defluvii_YP_003798853:0.0):0.020188049,GCA_003456605_00391|DMQK01000091unannotatedprotein:0.020042828)0.973:0.029005902)1.000:0.049275974)0.916:0.026734542)0.987:0.030138243)0.163:0.019579673)1.000:0.351067665)0.984:0.079553236,((OGW90704|PVC_group_Omnitrophica_bacterium_RIFCSPHIGHO2_02_FULL_63_14:0.144751486,OGW87506|PVC_group_Omnitrophica_bacterium_RIFCSPLOWO2_01_FULL_45_10b:0.164104591)0.967:0.106906909,(((OUC07869|Chloroflexi_Litorilinea_aerophila:0.108541565,RCK74665|Chloroflexi_Anaerolineae_bacterium:0.109258954)1.000:0.169950317,(KRT77589|Armatimonadetes_bacterium_CSP1_3:0.210493116,KRT68888|NC10_bacterium_CSP1_5:0.135568128)0.411:0.038266264)0.915:0.031759119,(GBC85351|bacterium_sp_HR11:0.152552869,(GCA_002328125_01442|DCWK01000050unannotatedprotein:0.001947491,GCA_002685755_01556|NYYB01000002unannotatedprotein:0.001760896)1.000:0.300590274)1.000:0.072067691)0.853:0.038248286)0.986:0.048595639)0.582:0.046460101,((MSP_nxrA:0.025354205,(((MBL09191|Acidiferrobacteraceae_bacterium:0.033838550,TDJ60388|Nitrospina_sp:0.042298150)0.934:0.011901270,((Nitromaritima_KMP11423|SCGC_AAA799_A02:0.031363214,((GCA_002705185_00880|PAJA01000060unannotatedprotein:0.0,MAX17737|Nitrospina_sp:0.0):0.009948403,(GCA_001542995_01387|LFLA01000024unannotatedprotein:0.011368914,(GCA_002453875_01196|DKHT01000003unannotatedprotein:0.0,GCA_002454045_00625|DKID01000024unannotatedprotein:0.0):0.025625262)0.731:0.006753767)0.957:0.010197443)0.837:0.006601827,cas150m-4_02474|CAS-150m-4914Perchloratereductasesubunitalphaprecursor:0.016703925)0.925:0.009659103)0.780:0.008734629,PIQ99248|_Nitrospinae_bacterium_CG11_big_fil_rev_8_21_14_0_20_45_15:0.031915291)0.638:0.007806333)0.907:0.014421329,(WP_042250442|Nitrospina_gracilis:0.018020385,WP_042251421|Nitrospina_gracilis:0.040064063)0.228:0.014895744)1.000:0.388356661)1.000:0.140833958)0.990:0.036064959,((((WP_007222969|Jettenia_caeni:0.0,NxrA_planctomycete_KSU_1_ZP_10101005:0.0):0.002251376,TLD40744|Candidatus_Jettenia_ecosi:0.013337202)0.983:0.006913180,TLD41279|Candidatus_Jettenia_ecosi:0.021669001)0.000:0.000000005,WP_007220240|Jettenia_caeni:0.000000005)0.998:0.026966168)0.882:0.017606145,((WP_070067449|Brocadia_sapporoensis:0.003688908,(OQZ04816|Brocadia_sp_UTAMX1:0.003783493,RZV56287|Brocadia_sp_BROELEC01:0.003479253)0.233:0.001151055)0.997:0.020857077,(KKO18624|Brocadia_fulgida:0.021890769,(OOP55454|Brocadia_caroliniensis:0.024026386,(WP_052561322|Brocadia_sinica:0.000917852,KXK29028|Brocadia_sinica:0.000923980)1.000:0.023040103)0.993:0.017011726)0.725:0.010490186)0.877:0.013675102)0.965:0.015645586)0.779:0.007537636)0.931:0.007662564)0.935:0.007110293); diff --git a/assets/trees/nar_nxr/nar_nxr.refpkg/nar_nxr_seqs_for_tree_aligned.faa b/assets/trees/nar_nxr/nar_nxr.refpkg/nar_nxr_seqs_for_tree_aligned.faa deleted file mode 100644 index 8620f8d1..00000000 --- a/assets/trees/nar_nxr/nar_nxr.refpkg/nar_nxr_seqs_for_tree_aligned.faa +++ /dev/null @@ -1,5425 +0,0 @@ ->RBG1_10 -----------------------------------------------MTLSRRRFLKISSL -SAAGA---------LVDLPELKFLQFLET------VENPLEYYPNR------DW-EKIYR -DQYRY------DSSFTFVCT-PNDTHACRLRAYVRNGIVIRVEQAYDVQNYTDLYGNKAS -VMWSPRGCNKGYNLPRRVYGPYRVKHPMVRKGWKE----------WAE----------AG -FPDPTLPENQQKYF--RRGEDSWVKVSWDEGFELVAKGLLHTMEKYSGEKGAEIL-RKQG -YPEEMIEAM------HGSGAQTIKIRGAMPLLGATRIFGFYRFAN-MLGLYDGK------ ----LGARGWSNFSWHGDLPPGHPMVTGVKCSDPELNDFRHSKLLVFLGKNMVESKMADAH -WWIETIERGGKVVNISPEYSATSSKSDYWIPIRPG-TDTALLLGVTQIIIQEKLY----D -------QDFIKKHTDLPLLIRMDNLKLLRPTDIIKG---YK----------NQILTG--- ---------------YSVKVQKIKPELREKW---------GDFVVWDLKTKK--PQTVT-- --------REDLGEKIERKGL------N---------------------PALEGNY----- -------------------------------------KIKLV-NGKEIEVKTVFQL----- ----YKELLSE-YDLETVS-----------------------------QITGSPKNLIYQL -AQDL-----------ATIKPASIHTGEGVNHFFHCD-LVTRAVWLPLALTGNIGKPGA-N ---VGHWAGNYKGEVFD--------GLG--------------------------------- -------------------------------VYLNE-----DPFNPNLDPSAKLEDIKLKK -YYK------GEEVCYW-----NY---------------EDRPLIVKG----------KCF -TGKTHMPTP---TKAEWVGNGN-LLNNAKWAHN----------------MIANVE--GKV -EMIVYNEIEWTASCEYADVVFPVHSWMELTLPDMTASCSN-PFLQV----W-KGGIKPIF -DTKQDNEVLAGVAAKLSELT---------------------------------------- ----------------HDNRY--KDYWKF-------------------------VLEG--- --------------------------------NNEVYLQRILDACSTTKGYKIDELL-KSD ------RG----WLMNFRT----Y-PRIPFW----EQIQESK--PFYTKT----------- --------------------GRMEFYREEDEFIDYGENLIVHREPVEATPYL--PNVILG- -THKAIR---PNSYGISPESIN---ADERQVRNLKMSWKQVKLSKNPLWEKGFRFYCLTPK -SRHTVHSSWSVLDWNMIWQSNFGDPYRMDNRTPGVGEHQMHMNPLDAKELGINDGDYAYV -DANPEDRPYTGWKEEDPFYKVSRLMVRVKYNPAYPRGITMIKHASFIATHKSVKAHESRP -DKRAVSED-TGYQSSFRYGSQQSIT---RGWLQPTMMTDSLVRKNYMGQEIGEGYEIDVN -APN-TCPKETLVKIIKAE-DGGMGGKGKW---EPARTGYTPAG--ENKDMKKFLEGGFIL -KV-- ->cas150m_01921|CAS-150m-3753Perchloratereductasesubunitalphaprecursor -----------------------------------------------MFLSRRQFLKVTTG -TVAAVA--------LADKALA--LTALQP--VVE-VGNPLGEYPDR------AW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRVRSFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTMHRRVYGPYRLKGPLMRRGWKA----------WMD----------AG -SPEFT-PDVMSKYKFNARYLDDMLRVSWDTAFTYIAKAMLIISERYSGEAGARRL-REQG -YPPEMIEMS------KGSGVRTFKFRAGMPILGVIGKMGITRMNGGCGALLDTYIRKVKP -NQAQGGRYWSNYTWHGDQNPAHPFWSGVQTSDIDMNDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARCVVITPEYNPTAYRADYWIPVRPA-TDAALFLGACKIIFDENMH----D -------HDFCAAYTDMPILVRTDTLQYLDPRDVIQG---YA---------LPDFSKT--- ---------------YSGKVQTLDPAKIARL---------GGFMVWDINKNS--AVPIH-- --------RELVGWHFRNSGI------E---------------------PAMTGSY----- -------------------------------------RVKLL-NGREVDVLPVFQM----- ----YQAHLQD-YDLDTCH-----------------------------QINRAPKDLIVRW -ARDS-----------GTVKPAAIHNGEGTNHYFHQT-IIARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGIWC-ATPWSGGGLG--------------------------------- -------------------------------THTAE-----NPFKITLDPNAHGKEVHVKG -YYY------GEEVAYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNAKHHYD----------------MVKNVD--PHI -ETLITQDVEMTSDVNHNDVAMGVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLTEMT---------------------------------------- ----------------GDKRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYVQRLLDASSTAYGYSVDTML-KSE ------KG----WMVMCRT----Y-PRQPFW----EETNESK--PQWTRT----------- --------------------GRYENYRIEPEAIEYGENFISHREGTEATPYL--PNAIMT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIALPWQEIKRYSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQLHVNPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAFPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAMD-TGYQSNFRYGAQQSFT---RDWLMPMHQLDSLPGKHAVAWKFKFGYQVDNH -AVN-TVPKECLMRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->cas50m_02313|CAS-50m-4275Perchloratereductasesubunitalphaprecursor -----------------------------------------------MFLSRRQFLKVTTG -TVAAVA--------LADKALA--LTALQP--VVE-VGNPLGEYPDR------AW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRVRSFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTMHRRVYGPYRLKGPLMRRGWKA----------WMD----------AG -SPEFT-PDVMSKYKFNARYLDDMLRVSWDTAFTYIAKAMLIISERYSGEAGARRL-REQG -YPPEMIEMS------KGSGVRTFKFRAGMPILGVIGKMGITRMNGGCGALLDTYIRKVKP -NQAQGGRYWSNYTWHGDQNPAHPFWSGVQTSDIDMNDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARCVVITPEYNPTAYRADYWIPVRPA-TDAALFLGACKIIFDENMH----D -------HDFCAAYTDMPILVRTDTLQYLDPRDVIQG---YA---------LPDFSKT--- ---------------YSGKVQTLDPAKIARL---------GGFMVWDINKNS--AVPIH-- --------RELVGWHFRNSGI------E---------------------PAMTGSY----- -------------------------------------RVKLL-NGREVDVLPVFQM----- ----YQAHLQD-YDLDTCH-----------------------------QINRAPKDLIVRW -ARDS-----------GTVKPAAIHNGEGTNHYFHQT-IIARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGIWC-ATPWSGGGLG--------------------------------- -------------------------------THTAE-----NPFKITLDPNAHGKEVHVKG -YYY------GEEVAYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNAKHHYD----------------MVKNVD--PHI -ECLVTQDVEMTSDVNHNDVAMGVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLTEMT---------------------------------------- ----------------GDKRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYVQRLLDASSTAYGYSVDTML-KSE ------KG----WMVMCRT----Y-PRQPFW----EETNESK--PQWTRT----------- --------------------GRYENYRIEPEAIEYGENFISHREGTEATPYL--PNAIMT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIALPWQEIKRYSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQLHVNPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAFPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAMD-TGYQSNFRYGAQQSFT---RDWLMPMHQLDSLPGKHAVAWKFKFGYQVDNH -AVN-TVPKECLMRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->GCA_003523945_00056|DOFS01000023unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------LADKALA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTMHRRVYGPYRLKGPLMRRGWKA----------WMD----------DG -SPEFT-PAVMTKYKFNARYLDDMLRVSWDTAFTYLAKAMIIIAERYSGEAGARRM-REQG -YPPEMIEMT------KGSAIRSFKFRAGMPILGLIGKMGITRMNGGCGALLDTYIRKVQP -DQAQGGRYWSNYTWHGDQNPAHPFWNGVQASDVDMNDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARLVVITPEYNPTAYRADYWMPVRPA-TDGALFLGALKIIFDENLY----D -------YDFCQSYTDMPILVRTDTLQYLDPREVIKD---YA---------FPDFANS--- ---------------YSGKVQTMKPDVIARL---------GGFMVWDLSKNQ--AVPIH-- --------RELVGWHYRKSGI------D---------------------SALTGTY----- -------------------------------------RVTLL-NGREVDVMPIFQM----- ----YQVHLQD-YDLDTVH-----------------------------QINRCPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTNHYFHQT-IIARGAAMVLIVTGNVGKFGT-G ---QHTWAGNYKAGIWN-ATPWGGGGLG--------------------------------- -------------------------------THTGE-----NPFKITTDPNAHGKEIHVKG -YYY------GEEVAYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNAKHHYD----------------MVKNVD--PHI -ETLVNQDVEMTSDVNHNDVSFAVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLSEMT---------------------------------------- ----------------GDGRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYLQRILDASTTAYGYNADVML-KSE ------KG----WMVMCRT----Y-PRHPFW----EETNESK--PQWTRT----------- --------------------GRYENYRVEPECIEYGENFISHREGTEATPYL--PNAIMS- -SNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWQEIKRYSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIALD-TGYQSNFRYGAQQSFT---RDWLMPMQQLDSLPGKHAVGWKFKFGYQVDNH -AVN-TVPKECLIRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->DJ_nxrA -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------LADKALA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTMHRRVYGPYRLKGPLMRRGWKA----------WMD----------DG -SPEFT-PAIMSKYKFNARYLDDMLRVSWDTAFTYLAKAMIIIAERYSGEAGARRL-REQG -YPPEMIEMT------KGSAIRAFKFRAGMPILGLIGKMGITRMNGGCGALLDTYIRKVQP -DQAQGGRYWSNYTWHGDQNPAHPFWNGVQASDVDMNDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARLVVITPEYNPTAYRADYWMPVRPA-TDGALFLGALKIIFDENMY----D -------YDFCQSYTDMPILVRTDTLQYLDPREVIKD---YA---------FPDFANS--- ---------------YSGKVQTMKPDVIARL---------GGFMVWDLNKNQ--AVPLH-- --------RELVGWHYRKSGI------D---------------------SALTGTY----- -------------------------------------RVTLL-SGREVDVMPIFQM----- ----YQVHLQD-YDLDTVH-----------------------------QINRCPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTNHYFHQT-IIARGAAMVLIVTGNVGKFGT-G ---QHTWAGNYKAGIWN-ATPWGGGGLG--------------------------------- -------------------------------THTGE-----NPFKITTDPNAHGKEIHVKG -YYY------GEEVAYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNAKHHYD----------------MVKNVD--PHI -ETLVNQDVEMTSDVNHNDISFAVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLSEMT---------------------------------------- ----------------GDGRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYLQRILDASTTAYGYNADVML-KSE ------KG----WMVMCRT----Y-PRHPFW----EETNESK--PQWTRT----------- --------------------GRYENYRVEPEAIEYGENFISHREGTEATPYL--PNAIMS- -SNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWAEIKRYSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVFV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIALD-TGYQSNFRYGAQQSFT---RDWLMPMQQLDSLPGKHAVGWKFKFGYQVDNH -AVN-TVPKECLIRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->DJ_nxrA2 -----------------------------------------------MLVTKRQFLKITAG -TVAAVA--------LADNALA--LTALQP--VVE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDMYGNRGT -FAHNPRMCLKGYTYHRRVYGPYRLKGPLMRRGWKA----------WMD----------DG -SPELD-PTVMTKYKFSARYLDDMLRVSWDTAFTYLAKAMIVIANRYSGEAGARRL-REQG -YPPEMIEMM------KGSGVRSMKFRAGMPVLGVIGKMGITRMNGGCGALLDSWVRKVGP -DSAQGGRYFNNLTWHGDQDPSQPFWSGAQAIDCDLSDMRFSKMNTSWGKNFVENKMPEAH -WKLESIERGGRVVVITPEYNPTAQRADYWMPVRPE-TDGALFLGACKIILDDGLQ----D -------NDFIRSSTDFPLLIRTDTLQYLDPRDVIKD---YA---------FPDFSKS--- ---------------YSGKVQGLSPSQIARL---------GGFMVWDLNQDK--AVPLH-- --------RELVGWHFKKSGI------D---------------------PALTGSF----- -------------------------------------RVKLL-SGREADVMPLFQM----- ----YQVHLQD-YDLDTVH-----------------------------QINRCPKDLIVRW -ARDN-----------GTIKPAAIHNGEGVCHYFHMT-SMGRAAAMVMTLTGNMGKFGS-G ---CHTWSGNYKVGVWA-ATPWSGEGIG--------------------------------- -------------------------------IHTGE-----NPFKITTDPNAHGKEINYRP -YYY------GEETTYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKLRWVANVN-ILNNSKHHYD----------------MVKNVD--PHI -ETIVTQDIEMTSDVNHADVSFAVNGWMEFTYPEMTATVSN-PWMQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLTEMT---------------------------------------- ----------------GDGRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYVQRLLDAGSTSYGYSADTML-KSE ------KG----WMVMTRT----Y-PRIPLW----EETNESK--PMWTRS----------- --------------------GRLETYRVEPEAIEYGENFISHREGTEATPYL--PNAIMS- -SNPYIR---PDDYGIPITAQH---HDDKTVRNIKLPWAEIKRYANPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQIHVNPSAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAFPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIALD-TGYQSNFRYGAQQSFT---RSWLMPMHQLDSLPGKMANKWKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->DJ_nxrA1 -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------LADKALA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTMHRRVYGPYRLKGPLMRRGWKQ----------WMD----------DG -SPEFT-PAIQTKYKFNARYLDDMLRVSWDTAFTYLAKAMIVIANRYSGEYGARKL-REQG -YPPEMIEMM------KGSGVRAFKFRAGMPVLGIIGKMGITRMNGGCGALLDSWVRKVGP -ENAQGGRYWNNYTWHGDQDPSQPWWNGTQNCDIDLSDMRFCKFNTSWGKNFVENKMPEAH -WKLESIERGARIAVITPEYNPTAYRADYWIPIRPE-SDGSFFLGACKMIVDEGLF----D -------ADFVRANTDMPLLVRTDTLQYLDPRDVIKD---YQ---------FPDFSNT--- ---------------YSGKVQTLKPAEIARL---------GGIMVWDLNKNQ--AVPIH-- --------RELVGWHFKKSGI------D---------------------PALTGTH----- -------------------------------------RVRLL-TGREVDVMPIFQM----- ----YQVHLQD-YDLDTVH-----------------------------QICRSPKDLIVRW -ARDM-----------GTVKPAAIHNGEGVCHYFHMT-QNGRAAALTLIYSGNMGKFGS-G ---CHTWSGNYKAGTWA-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFKITTDPNAHGKEIKTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNSKHHYD----------------MVKNVD--PHN -ECLVHQEVEMTSDVNHFDVSFAVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLTEMT---------------------------------------- ----------------GDGRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYLQRLLDAGNCSYGYNADTML-KSE ------KG----WMVMTRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRVETYRVEPEAIEYGENFIVHREGPEATPYL--PNAIMS- -SNPYIR---PDDYGVPITAQH---HDDKTVRNIKLPWAEIKRYANPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQIHINPSAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAFPYHVTMAKHAPFVSTAKSVKGHETRP -DGRAIALD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHPVAWKFKWGFAIDHH -AVN-TTPKECLIRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->GCA_001567445_02228|JZQY01000048unannotatedprotein ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------MPIFQL----- ----YQVHLQD-YDLDTVH-----------------------------QVNRSPKDLIVRW -ARDC-----------GTIKPAAIHNGEGVCHYFHMT-SMGRAAALVMMLTGNIGKFGT-G ---CHTWSGNYKVGIWQ-AAPWSGAGAS--------------------------------- -------------------------------VYLGE-----DPWNLNLTTDAHGKEIKYRK -YYY------GEEPGYW-----NH---------------GDNALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVVNVN-ILNNSKHHYD----------------MVKNVD--PNI -EMLVTQDIEMTSDVNHADVAFAVNSWMEFTYPEMTATVSN-PWIQI----W-KGGIRPLY -DTRNDADTFAGVSAKLKELT---------------------------------------- ----------------GEARM--ADTYRF-------------------------VYQN--- --------------------------------RMDIYVQRILDASTTFYGYSADVML-KSE ------KG----WMVMCRT----Y-PRHPLW----EETNESK--PHWTRS----------- --------------------GRLESYRIEPEAIEYGENFIVHREGPECTPYL--PNAIMS- -TNPYIR---PDDYGIPITAQH---HDDKTVRNIKLPWQEIKRHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYCFV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHTIAWKFKWGYAIDHH -GIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->CBK42928|Nitrospira_defluvii ----------------------------------------------MMQLSRRQFLKVSAG -TVAVAA--------VADKALA--LTALQP--VVE-VNNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-SDVKRKYKFDSRFLDDMVRVSWDTAFTYVAKGLIVIGTRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPILGMMGKHANTRFNNCVLPLLDSWIRKVNP -DQAQGGRYWNNYTWHGDQDPSQPWWNGTQNCDVDLSDMRFTKLNTSWGKNFVENKMPEAH -WKLESMERGARLVIITPEYNPTASRADYWIPVRPE-TDGALFLGASKIILDENYQ----D -------IDFIKGFTDMPLLVRTDTLQYLDPHEVLKD---YQ---------VPDFTKS--- ---------------YSGRVQGLSQDQVQRL---------GGMMVWDLAKGK--AVPLH-- --------REQVGVHLAQSGI------D---------------------PALTGTY----- -------------------------------------RIKLL-NGREVDVMPIYQL----- ----YTIHLQD-YDLDTVH-----------------------------QVNRAPKDLIVRW -ARDC-----------GTVKPAAIHNGEGVCHYFHMT-SMGRAAALVMMLTGNIGKFGT-G ---CHTWSGNYKVGIWQ-AAPWSGAGAS--------------------------------- -------------------------------VYLGE-----DPWNLNLRDDVHGKEIKYRK -YYY------GEEPGYW-----NH---------------GDNALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVVNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMLVTQDIEMTSDVNHADVAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFAGVAAKLKEMT---------------------------------------- ----------------GEQRM--ADTYKF-------------------------VYHN--- --------------------------------RVDIYVQRILDASTTFFGYSADVML-KSE ------KG----WMVMCRT----Y-PRHPLW----EETNESK--PHWTRS----------- --------------------GRLETYRIEPEAIEYGENFISHREGPECTPYM--PNAIMT- -TNPYVR---PEDYGIPVTAQH---HDDKTVRNIKLPWSEIKQHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYCYV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKQANALKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMVKWLKGEHIK -IKV- ->NxrA1_Nitrospira_defluvii_YP_003798853 ----------------------------------------------MMQLSRRQFLKVSAG -TVAVAA--------VADKALA--LTALQP--VVE-VNNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-SDVKRKYKFDSRFLDDMVRVSWDTAFTYVAKGLIVIGTRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPILGMMGKHANTRFNNCVLPLLDSWIRKVNP -DQAQGGRYWNNYTWHGDQDPSQPWWNGTQNCDVDLSDMRFTKLNTSWGKNFVENKMPEAH -WKLESMERGARLVIITPEYNPTASRADYWIPVRPE-TDGALFLGASKIILDENYQ----D -------IDFIKGFTDMPLLVRTDTLQYLDPHEVLKD---YQ---------VPDFTKS--- ---------------YSGRVQGLSQDQVQRL---------GGMMVWDLAKGK--AVPLH-- --------REQVGVHLAQSGI------D---------------------PALTGTY----- -------------------------------------RIKLL-NGREVDVMPIYQL----- ----YTIHLQD-YDLDTVH-----------------------------QVNRAPKDLIVRW -ARDC-----------GTVKPAAIHNGEGVCHYFHMT-SMGRAAALVMMLTGNIGKFGT-G ---CHTWSGNYKVGIWQ-AAPWSGAGAS--------------------------------- -------------------------------VYLGE-----DPWNLNLRDDVHGKEIKYRK -YYY------GEEPGYW-----NH---------------GDNALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVVNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMLVTQDIEMTSDVNHADVAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFAGVAAKLKEMT---------------------------------------- ----------------GEQRM--ADTYKF-------------------------VYHN--- --------------------------------RVDIYVQRILDASTTFFGYSADVML-KSE ------KG----WMVMCRT----Y-PRHPLW----EETNESK--PHWTRS----------- --------------------GRLETYRIEPEAIEYGENFISHREGPECTPYM--PNAIMT- -TNPYVR---PEDYGIPVTAQH---HDDKTVRNIKLPWSEIKQHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYCYV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKQANALKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMVKWLKGEHIK -IKV- ->GCA_003456605_00391|DMQK01000091unannotatedprotein ----------------------------------------------MMQVSRRQFLKVSAG -TVAAAA--------VADKALA--LTALQP--VVE-VDNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-SDVKRKYKFDSRFLDDMVRVSWDTAFTYVAKGLVVIGTRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPILGMMGKHANTRFNNCVLPLLDSWIRKVNP -DQAQGGRYWNNYTWHGDQDPSQPWWNGTQNCDVDLSDMRFTKLNTSWGKNFVENKMPEAH -WKLESIERGARLVVITPEYNPTASRADYWIPVRPE-TDGALFLGASKIILDENYQ----D -------IDFIKGFTDMPLLVRTDTLQYLDPYEVVKE---YQ---------LPDFTKS--- ---------------YSGRIQGLTQDHIRRL---------GGMMVWDLAKGQ--AVPLH-- --------REQVGLHFAQTGI------D---------------------PALTGTY----- -------------------------------------RVKLL-NGREIDVMPVYQM----- ----YTIHFQD-YDLDTVH-----------------------------QINRAPKDLIVRW -ARDC-----------GTVKPAAIHNGEGVCHYFHMT-SMGRAAALVMMLTGNIGKFGT-G ---CHTWSGNYKVGIWQ-AAPWSGAGAS--------------------------------- -------------------------------VYLGE-----DPWNLNLKDDVHGKEIKYRK -YYY------GEEPGYW-----NH---------------GDNALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVVNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMLVTQDIEMTSDVNHADVAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFSGVAVKLKEIT---------------------------------------- ----------------GDQRM--ADTYKF-------------------------VYQN--- --------------------------------RVDIYVQRILDASSTFFGYSADVML-KSE ------KG----WMVMCRT----Y-PRHPLW----EETNESK--PHWTRS----------- --------------------GRLESYRIEPEAIEYGENFISHREGPECTPYL--PNAIMT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWSEIKQQANPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYCYV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQANFRYGAQQSFT---RSWLMPMHQTDSLPGKQANAMKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMAKWLKGEHIK -IKV- ->Baikal-deep-G159_00763|Baikal-deep-G159-c12unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAAA--------VADKALA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTFHRRVYGPYRLKGPLMRKGWKE----------WMD----------AG -SPELT-PDVKRKYKFDARMLDDMVRASWDTAFTYVAKACILIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIIGKMMNTRFNGGVLPVLDSWIRKVDP -DKAQGGKYYSNYTWHGDQDPSHPWWNGTQNCDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPVRPE-TDGANFLGACKIIIDENMQ----D -------IDYIKGYTDMPLLVRTDTLQYLDPREVIAD---FK---------FPDFSKS--- ---------------YSGRVQSLKPEQIERL---------GGMMVWDNNKKA--AVPLH-- --------REQVGWHYQNSGI------D---------------------AALTGTY----- -------------------------------------RVKLI-NGREVDVAPIWQM----- ----YMVHFQD-YDLDTVH-----------------------------QITRSPKDLIVRY -GRDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAALMMTITGNIGKFGT-G ---CHTWSGNYKAGVWN-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNQTLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIITQDIEMTSDVNHADVAFACNSWMEFTYPEMTATVSN-PWLQI----W-KGGIRPLY -DTRNDADTFGGVAVKLTELT---------------------------------------- ----------------GDARI--RQVFHF-------------------------VYQN--- --------------------------------RVDVYVQRALDASATCYGYNADTML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFVVHREGPECTPYL--PNAIFS- -TNPYVR---PDDYGIPITAQH---HDDKHIRNLKLPWTEIKRQSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYIYV -DGNPVDRPYRGWKPSDPFYKVSRLMIRAKYNPAFPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHAIAWKFKWGYAIDHH -AVN-TTPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->Baikal-deep-G158_01775|Baikal-deep-G158-c18unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAAA--------VADKALA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTFHRRVYGPYRLKGPLMRKGWKE----------WMD----------AG -SPELT-PDVKRKYKFDARMLDDMVRASWDTAFTYVAKACILIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIIGKMMNTRFNGGVLPVLDSWIRKVDP -DKAQGGKYYSNYTWHGDQDPSHPWWNGTQNCDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPVRPE-TDGANFLGACKIIIDENMQ----D -------IDYIKGYTDMPLLVRTDTLQYLDPREVIAD---FK---------FPDFSKS--- ---------------YSGRVQSLKPEQIERL---------GGMMVWDNNKKA--AVPLH-- --------REQVGWHYQNSGI------D---------------------AALTGTY----- -------------------------------------RVKLI-NGREVDVAPIWQM----- ----YMVHFQD-YDLDTVH-----------------------------QITRSPKDLIVRY -GRDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAALMMTITGNIGKFGT-G ---CHTWSGNYKAGVWN-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNQTLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIITQDIEMTSDVNHADVAFACNSWMEFTYPEMTATVSN-PWLQI----W-KGGIRPLY -DTRNDADTFGGVAVKLTELT---------------------------------------- ----------------GDARI--RQVFHF-------------------------VYQN--- --------------------------------RVDVYVQRALDASATCYGYNADTML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFVVHREGPECTPYL--PNAIFS- -TNPYVR---PDDYGIPITAQH---HDDKHIRNLKLPWTEIKRQSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYIYV -DGNPVDRPYRGWKPSDPFYKVSRLMIRAKYNPAFPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHAIAWKFKWGYAIDHH -AVN-TTPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->CBK42946|Nitrospira_defluvii ---------------------------------------------MQVSVSRRQFLKISAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHGCRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PDVKRKYKFDSRFLDDLNRVSWDTAFTYVAKAAVLIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIVGKMMNTRFNGGCLPLLDSWIRKVDA -EKAQGGKYYSNYTWHGDQDPSHPFWNGTQNCDVDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPVRPE-TDGANFLGAAKIIFDENLQ----D -------IDYIKEFTDLPLLVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQVERL---------GGMMVWDLAKGK--AVPLH-- --------REQVGFHFKESGI------D---------------------PALTGTF----- -------------------------------------RVKLL-NSREIDVMPIYQM----- ----YQVHLQD-YDLDTTH-----------------------------QITRAPKDLIVRW -ARDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAAFIMTITGNIGKFGT-G ---CHTWSGNYKAGIWN-AVPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNLTLDPNAHGKEIKTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIVTQDIEMTSDVNHADVAFACNSWMEFTYPEMTGTVSN-PWIQI----W-KGGIRPLY -DTRNDADTFAGVAAKLAEMT---------------------------------------- ----------------GDARF--RGVFHF-------------------------VYMN--- --------------------------------RVDVYPQRMLDASATCYGYSADVML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFISHREGPECTPYL--PNAIFS- -NNPFIR---PDDYGIPITAQH---HDDKHVRNIKLPWAEIKRHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVFV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHTIAWKFKWGYAIDHH -GIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->NxrA2_Nitrospira_defluvii_YP_003798871 ---------------------------------------------MQVSVSRRQFLKISAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHGCRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PDVKRKYKFDSRFLDDLNRVSWDTAFTYVAKAAVLIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIVGKMMNTRFNGGCLPLLDSWIRKVDA -EKAQGGKYYSNYTWHGDQDPSHPFWNGTQNCDVDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPVRPE-TDGANFLGAAKIIFDENLQ----D -------IDYIKEFTDLPLLVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQVERL---------GGMMVWDLAKGK--AVPLH-- --------REQVGFHFKESGI------D---------------------PALTGTF----- -------------------------------------RVKLL-NSREIDVMPIYQM----- ----YQVHLQD-YDLDTTH-----------------------------QITRAPKDLIVRW -ARDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAAFIMTITGNIGKFGT-G ---CHTWSGNYKAGIWN-AVPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNLTLDPNAHGKEIKTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIVTQDIEMTSDVNHADVAFACNSWMEFTYPEMTGTVSN-PWIQI----W-KGGIRPLY -DTRNDADTFAGVAAKLAEMT---------------------------------------- ----------------GDARF--RGVFHF-------------------------VYMN--- --------------------------------RVDVYPQRMLDASATCYGYSADVML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFISHREGPECTPYL--PNAIFS- -NNPFIR---PDDYGIPITAQH---HDDKHVRNIKLPWAEIKRHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVFV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHTIAWKFKWGYAIDHH -GIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_900170025_02937|FWEX01000006unannotatedprotein ---------------------------------------------MQVSVSRRQFLKISAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHGCRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PDVKRKYKFDSRFLDDLNRVSWDTAFTYVAKAAVLIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIVGKMMNTRFNGGCLPLLDSWIRKVDA -DKAQGGKYYSNYTWHGDQDPSHPFWNGTQNCDVDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPLRPE-TDGANFLGAAKIIFDENLQ----D -------IDYIKEFTDLPLLVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQVERL---------GGMMVWDLAKGK--AVPLH-- --------REQVGFHFKESGI------D---------------------PALTGTF----- -------------------------------------RVKLL-NGREIDVMSIYQM----- ----YQVHLQD-YDLDTTH-----------------------------QITRAPKDLIVRW -ARDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAAFIMTITGNIGKFGT-G ---CHTWSGNYKAGIWN-AVPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNLTLDPNAHGKEIKTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIVTQDIEMTSDVNHADVAFACNSWMEFTYPEMTGTVSN-PWIQI----W-KGGIRPLY -DTRNDADTFAGVAAKLAEMT---------------------------------------- ----------------GDARF--RGVFHF-------------------------VYMN--- --------------------------------RVDVYPQRMLDASATCYGYSADVML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFISHREGPECTPYL--PNAIFS- -NNPFIR---PDDYGIPITAQH---HDDKHVRNIKLPWAEIKRHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVFV -DGNPVDRPYRGWKPSDPFYKVSRLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHTIAWKFKWGYAIDHH -GIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->CUS31266|Nitrospira_nitrosa -----------------------------------------------MVITRRQFMKASAG -TIAAIA--------VADKVLA--LTALQP--VTE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLIRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFASRFLDDMLRVSWDTAFTYAAKAMVVIATRYSGEAGARRL-REQG -YAPEMVEMM------KGAGVRCFKHRAGMPILGFIGKHSNTRFNNSVLPVLDTWVRKVGP -DQAQGGRYWNNYTWHGDQDPSQPFWNGTQNCDVDLSDMRFTKFNTSWGKNFVENKMPEAH -WKLESIERGARLAVITPEYNPTAQRADYWIPLRPQ-SDGALFLGACKIILDENMH----D -------VDYLKQFTDMPLLVRTDTLQYLDPREVIPD---YK---------FPDFSHS--- ---------------YSGRIQALKPEYIERL---------GGFMVWDLAKQK--AVPLH-- --------REQVGWHFDSSGI------Q---------------------PALTGTY----- -------------------------------------RVKLL-NGREIDAQPIYQM----- ----YQIHFQD-YDLDTTH-----------------------------QITRSPKDLLVRW -ARDS-----------GTIKPAAIHNGEGVCHYFHMT-SNGRAAALVLTLTGNIGKFGS-G ---CHTWSGNYKVGIWS-ATPWSGSGSG--------------------------------- -------------------------------VHLSE-----DPWQINLDPNAHGKEIKYKS -YYY------GEEPGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKLRWVVNVN-LLNNAKHHYD----------------MVRNVD--PNI -ECLITQDIEMTSDVNHADIAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDADTFAGVAARLAEIT---------------------------------------- ----------------GEKRM--RDVFHF-------------------------VYEN--- --------------------------------RVDVYAQRLLDASSTFYGYSADVLL-KSE ------KG----WMVMVRT----Y-PRHPLW----EETNESK--PMWTRS----------- --------------------GRIESYRVEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPHVR---PDDYGIPVTAQH---HDDKTIRNIKLPWVEIKRHTNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQVHINPQAAKDRGINDGDYVYI -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTPKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKSANGLKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->CUS38776|Nitrospira_nitrificans -----------------------------------------------MLVSRRQFMKATAG -TIAAAA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WAD----------DG -SPELT-PEAKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIVIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRCFKHRAGMPILGFIGKHSNTRFNNSVLPLLDTWIRKVGP -DQAQGGRYWNNYTWHGDQDPSQPFWNGTQNCDVDLSDMRFTKFNTSWGKNFVENKMPEAH -WKLESIERGARIAVITPEYNPTAQRADYWIPLRPQ-SDGALFLGACKIILDENMQ----D -------IDYLKQFTDMPLLVRTDTLQYLDPRDVIQD---YK---------FPDFSHS--- ---------------YSGRIQALKPEYIERL---------GGFMVWDMAKKQ--AVPLH-- --------REQVGWHFDKSGI------E---------------------PALTGTY----- -------------------------------------RVKLL-NGREIDALPIYQL----- ----YLIHLQD-YDLDTTH-----------------------------QITRSPKDLLVRW -ARDS-----------GTIKPAAIHNGEGVCHYFHMT-ANGRAAALVLTLTGNIGKFGS-G ---CHTWSGNYKVGIWN-ATPWSGVGGG--------------------------------- -------------------------------VHLSE-----DPWHINLDANAHGKEIKYRN -YYY------GEEPAYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-LLNNAKHHYD----------------MVRNVD--PNI -ECLITQDIEMTSDVNHADIAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDADTFAGVAAKLAEIT---------------------------------------- ----------------GEKRM--RDVFHF-------------------------VYEN--- --------------------------------RVDVYAQRLLDASSTFYGYSADVLL-KSE ------KG----WMVMVRT----Y-PRHPLW----EETNESK--PMWTRS----------- --------------------GRIESYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYVR---PDDYGIPIAAQH---HDDKMIRNIKLAWQEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQVHINPQAAKDRGINDGDYVYI -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKSANGLKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->WP_080886776|Nitrospira_japonica ---------------------------------------------MTMFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMMRVSWDTAFTYAAKSMIVIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDTWIRKVTS -DQAQGGRYWSNYTWHGDQNPSQPWWCGAQASDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGGRIVVITPEYNPTAYRADYWMPLRPQ-SDGAIFLGAMKIITDENMH----D -------IDFLKGYTDAPVLVRTDTLQFVDPRDVVRD---YK---------FPDFSKS--- ---------------YSGRVQTLKPEQVERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYSNSGI------D---------------------AALTGTY----- -------------------------------------RIKLL-NGREIDVMPVWQL----- ----YLVHFQD-YDLDTVH-----------------------------QICRTPKDLLVRW -ARDS-----------GTVKPAAIHNGEGTNHYFHMT-VNSRGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWV-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVTNVN-VLNNAKHHYD----------------MVRNVD--PSI -ETLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTVTVSN-PWVQV----W-KGGIRPLY -DTRNDLDTFAGVAAKLSEIT---------------------------------------- ----------------GDKRM--RDYFAM-------------------------VYMN--- --------------------------------RVDVYVQRLLDASATFYGYSADTML-KSE ------KG----WMVMVRT----Y-PRVPFW----EETNESK--PMWTRT----------- --------------------GRFETYRTEPEAIEYGENFISHREGTEATPYL--PNAIMT- -SNPYCR---PDDYGIPITAQH---HDDKTVRNIKLPWSEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHANGLKWKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.137_k121_1578656_32 rank: A; nmv:NITMOv2_4538 putative Nitrite oxidoreductase, alpha subunit; K00370 (db=kegg) -----------------------------------------------MFLSRRQFLKVSVG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKE----------WMD----------AG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGVNALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPFWCGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPA-SDGAIFLGAMKIIVDENMH----D -------VDFLKGYTDSPVLVRTDTLQFLDPRDVVAD---YK---------FPDFSKS--- ---------------YSGRVQSLKPEQVERL---------GGMMVWDLNKKA--AVPLH-- --------REQVGWHYQNSGI------D---------------------AALTGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTCH-----------------------------QICRTPKDLLVRW -ARDS-----------GSIKPAAIHNGEGTNHYFHQT-INSRGAAMVLIVTGNVGKFGT-G ---QHTWAGNYKAGTWT-STPWSGAGIA--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFAANSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--RDYFKF-------------------------VYEN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRTPFW----EETNESK--PMWTRT----------- --------------------GRYENYRTEPEAIEYGENFISHREGTEATPYL--PNAIMT- -SNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWQEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVATPKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQLDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002737345_00863|NSIK01000010unannotatedprotein -----------------------------------------------MFLSRRQFLKVSVG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKE----------WMD----------AG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIVIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRTFKHRAGMPVLGIIGKMGNTRMNGGVNALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPFWCGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPA-SDGAIFLGAMKIIVDENMH----D -------VDFLKGYTDSPVLVRTDTLQFLDPREVVAD---YQ---------FPDFSKS--- ---------------YSGRVQSLKPEGIARL---------GGMMVWDLNKKA--AVPLH-- --------REQVGWHYQNSGI------D---------------------AALTGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTCH-----------------------------QICRTPKDLLVRW -ARDS-----------GSIKPAAIHNGEGTNHYFHQT-INSRGAAMVLIVTGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGIA--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFAANSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--RDYFKF-------------------------VYEN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRTPFW----EETNESK--PMWTRT----------- --------------------GRYENYRTEPEAIEYGENFISHREGTEATPYL--PNAIMT- -SNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWAEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTPKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQLDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002420115_02525|DIHK01000043unannotatedprotein -----------------------------------------------MFLSRRQFLKVSVG -TVAAAA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDSWIRKVSP -DQAQGGRYWSNYTWHGDQNPSQPFWSGVQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPQ-SDGALFMGAMKIIIDENMH----D -------VDFLKQFTDAPILIRTDTLQYLDPRDVVPD---YK---------FPDFSKS--- ---------------YSGRIQALKPQDVERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYMNSGI------D---------------------AALNGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTTH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGVTHYFHMT-PNGRAAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGAWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTITVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSEMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGVPITAQH---HDDKTIRNIKLSWHEIVRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTPKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002483475_03556|DLHZ01000062unannotatedprotein -----------------------------------------------MFLSRRQFLKVSVG -TVAAAA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDTWIRKVSP -EQAQGGRYWSNYTWHGDQNPSQPFWSGVQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGALFLGAMKIIVDENMH----D -------VDFLKQFTDAPILVRTDTLQYLDPRDVVAD---YK---------FPDFSKS--- ---------------YSGRIQALKPQDIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYMNSGI------D---------------------AALNGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTTH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGVTHYFHMT-PNGRAAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGCWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNL -ECLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTITVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSEMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIVRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_001458695_00808|LN885086unannotatedprotein -----------------------------------------------MFLSRRQFLKVSVG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -APELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDTWIRKVGP -DQAQGGRYWSNYTWHGDQNPAHPWWSGVQGSDVDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPQ-SDGALFLGAMKIIVDENMH----D -------VDFLKSFTDAPILVRTDTLQYLDPRDVIPD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQIQRL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYVNSGI------D---------------------AALTGTY----- -------------------------------------RVKLL-NGREIDAMPIWQM----- ----YMVHFQD-YDLDTVH-----------------------------QITRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGAWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIHTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVTNVN-VVNNAKHHYD----------------MVKNVD--PNI -ECLITQDIEMTSDINHADIAFACNSWMEFTYPEMTITVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRPEAEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIKLSWDEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPFVATPKSVKGHETRP -DGRAIAID-TGYQSNFRYGCQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_900078535_00262|FJVM02000053unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------IADNVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIGTRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRSGMPVLGIIGKMGNTRMNGGINALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPFWSGVQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGSLFLGAMKIIVDENMH----D -------SDFMKQFTDAPILVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQTLKPEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYTNSGI------D---------------------AALTGSY----- -------------------------------------RVKLL-NGREIDAMPIWQM----- ----YMVHFQD-YDLDTVH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKQ -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNI -ECLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYVR---PDDYGIPITAQH---HDDKTIRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMSKHAPYVATPKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQLDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002451055_00821|DKBD01000269unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRRYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPFWSGVQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGALFLGAMKIMVDENMH----D -------IDFMKSFTDAPILVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKGEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYANSGI------D---------------------AALTGSY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTVH-----------------------------QITRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-ANARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VVNNAKHHYD----------------MVRNVD--PNI -ECLITQDIEMTSDINHADIAFACNSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAVAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002331335_02310|DCZO01000011unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVIMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRSGMPVLGIIGKMGNTRMNGGINALLDTWIRKVGP -DQAQGGRYWSNYTWHGDQNPAHPWWSGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGSLFLGAMKIIVDENMH----D -------IDFMKSFSDAPILIRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKAEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYANSGI------D---------------------AALNGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YMVHFQD-YDLDTVH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INSRGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGAWT-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVTNVN-VLNNAKHHYD----------------MVRNVD--PNL -ECLITQDVEMTSDVNHNDIAFACNTWVEFTYPEMTITVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--RDYFAM-------------------------VYSN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMTKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->WP_053378142|Nitrospira_moscoviensis -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIVATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGILGKMGNTRMNGGINALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPWWSGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGSLFLGAMKIIVDENMH----D -------IDFLKSFTDAPILVRTDTLQYLDPRDVVAD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYVNSGI------D---------------------AALTGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTVH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNITTDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKLRWVTNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGTAAKLSEMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYLN--- --------------------------------RVDVYAQRMLDASSTFYGYSADTML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->riogrande_2019_sw_WHONDRS-S19S_0066_A_bin.62_Ga0451725_0007910_5 rank: A; nmv:NITMOv2_4538 putative Nitrite oxidoreductase, alpha subunit; K00370 (db=kegg) -----------------------------------------------MFLSRRQFLKISAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKA----------WMD----------DG -SPELT-PDTKRKYKFDSRFLDDMLRVSWDTAFTYAAKAYIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGILGKMGNTRMNGGINALLDTWIRKVNP -EQAQGGRYWSNYTWHGDQNPAHPWWSGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGALFIGAMKIIVDENMH----D -------IDFLKSFTDAPILVRTDT------------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->GCA_002083555_01644|MSXN01000007unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKA----------WMD----------DG -SPELT-PDTKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMVIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGILGKMGNTRMNGGINALLDTWIRKVSP -EQAQGGRYWSNYTWHGDQNPAHPWWSGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGALFLGAMKIIVDENMH----D -------IDFLKSFTDAPILVRTDTLQYLDPRDVVKD---YA---------FPDFSKS--- ---------------YSGRMQSLKPEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYTNSGI------D---------------------AALNGTF----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTTH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNITTDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVTNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYTN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPSYPYHVTMAKHAPYVATPKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002328125_01442|DCWK01000050unannotatedprotein -----------------------------------------------MKLSRRKFLAASGS -GLLA----------WSGRGLA--LAALHP--TGE-MGNPLTNYPNR------GW-EKVYR -DQYKV------DGSFTWVCS-PNCTHECRLKAFTRNGIVLRTEQNYDKHRITDIYGVKAT -HHWNPRGCPNGFTFQRRMYGPYRLRYPMVRRGWKR----------WAD----------DG -FPELN-EANKKKYKFDSRGTDTFVRVKWDDAFTYASKGFIQISKTYSGDAGKKRL-LDQG -YDPASLTHW------DGAGTRTMKFRGGMGLLGVIGKYGMYRFAN-TMSLLDTHTRGVGP -KKARGGRAWSNYTWHGDQAPGHPFVHGLQASDCDFNDLRNSKLHIHMGKNLVENKRPDSH -FFMESMERGAKIIVVAPEYSPPATKADYWIPIRPQ-TDTALLLGVTKILIDRGWY----D -------AKFVKEFTDFPLLVRTDNLRRLRPQDVIPG---YK---------NQDISGG--- ---------------PSFKIHGLTPKYRDAA---------GDFMIWDKGKNA--PAPIT-- --------RDDVGKHIGAKNL------D---------------------PALEGKY----- -------------------------------------TVKLV-SGVEIEVMPVFEM----- ----YKSHHLKDYDLDTVH-----------------------------EITHSPKDLIERF -AKDV-----------ATIKPAALHVGEGVNHWFHAT-MTNRAQYLPMTLTGNIGKLGA-G ---CHTWAGNYKAALFQ-GSGWSGPGFK--------------------------------- -------------------------------GWIAE-----DPFNPNLDPKADGKNIKVRG -TIK------DEEPAYW-----NY---------------GDKPLVVDTP-----KYGRKVF -TGKTHMPSP---TKSLWFTNVN-IFNNAKWLYE----------------MVKNVN--PKI -EMIICSEIEMTSTAEYSDILLPANTWMEFEQPEITGSCSN-PFLQI----W-KGGVKPIY -DTKDDILIMAEMAKKLGEIL---------------------------------------- ----------------KDKRF--EKYWKF-------------------------ALDK--- --------------------------------KAEVYIQRLLDSSTPTRGYKYDDIM-AGK ------YGESGTALMLFRS----Y-PRVPFL----EQIEESV--PFYSPT----------- --------------------GRLQAYNDEPGVIEYGENLIVQREGPEGTPYL--PNVIIS- -SSPFIR---PEDYGIPENHMG---WDERQVRNIKLPWKEAKDTKNPLWEAGYRFFCLTPK -SRHLTHSSWQVTDWNFIWSTSFGDPYRMDRRQPGVGENQVQMNPETAKDLGFNEGDYVYV -DANPADRPYIGWKPSDPFYKVARLMLRVKYNPSYPYDVVMIKHGAWCATEKSVKGHETRK -DGRAVSAD-TGYQASYRYGSHQSIT---RGWLMPMHQLDSLFHKKKVFMGFMLGGEADNH -AIN-TVPKETLVKLTKAE-DGGLGGRGVW---APATTGFSVGN--ENKFMQSYLQGT-VK -VKRG ->GCA_002685755_01556|NYYB01000002unannotatedprotein -----------------------------------------------MKLSRRKFLAASGS -GLLA----------WSGRGLA--LAALHP--TGE-MGNPLTNYPNR------GW-EKVYR -DQYKV------DGSFTWVCS-PNCTHECRLKAFTRNGIVLRTEQNYDKHRITDIYGVKAT -HHWNPRGCPNGFTFQRRMYGPYRLRYPMVRRGWKR----------WAD----------DG -FPELN-EANKKKYKFDSRGTDIFVRVKWDDAFTYASKGFIQISKTYSGDAGKKRL-LDQG -YDPASLTHW------DGAGTRTMKFRGGMGLLGVIGKYGMYRFAN-TMSLLDTHTRGVGP -KKARGGRAWSNYTWHGDQAPGHPFVHGLQASDCDFNDLRNSKLHIHMGKNLVENKRPDSH -FFMESMERGAKIIVVAPEYSPPATKADYWIPIRPQ-TDTALLLGVTKILIDRGWY----D -------AKFVKEFTDFPLLVRTDNLRRLRPQDVIPG---YK---------NQDISGG--- ---------------PSFKIHGLTPKYRDAA---------GDFMIWDKGKNA--PAPIT-- --------RDDVGKHIGAKNI------D---------------------PALEGKY----- -------------------------------------TVKLV-SGVEIEVMPVFEM----- ----YKSHHLKDYDLDTVY-----------------------------EITHSPKDLIERF -AKDV-----------ATIKPAALHVGEGVNHWFHAT-MTNRAQYLPMTLTGNIGKLGA-G ---CHTWAGNYKAALFQ-GSGWSGPGFK--------------------------------- -------------------------------GWIAE-----DPFNPNLDPKADGKNIKVRG -TIK------DEEPAYW-----NY---------------GDKPLVVDTP-----KYGRKVF -TGKTHMPSP---TKSLWFTNVN-IFNNAKWLYE----------------MVKNVN--PKI -EMIICSEIEMTSTAEYSDILLPANTWMEFEQPEITGSCSN-PFLQI----W-KGGVKPIY -DTKDDILIMAEMAKKLGEIL---------------------------------------- ----------------KDKRF--EKYWKF-------------------------ALDK--- --------------------------------KAEVYIQRLLDSSTPTRGYKYDDIM-AGK ------YGESGTALMLFRS----Y-PRVPFL----EQIEESV--PFYSPT----------- --------------------GRLQAYNDEPGVIEYGENLIVQREGPEGTPYL--PNVIIS- -SSPFIR---PEDYGIPENHMG---WDERQVRNIKLPWKEAKDTKNPLWEAGYRFFCLTPK -SRHLTHSSWQVTDWNFIWSTSFGDPYRMDRRQPGVGENQVQMNPEAAKDLGFNEGDYVYV -DANPADRPYIGWKPSDPFYKVARLMLRVKYNPSYPYDVVMIKHGAWCATEKSVKGHETRK -DGRAVSAD-TGYQASYRYGSHQSIT---RGWLMPMHQLDSLFHKKKVFMGFMLGGEADNH -AIN-TVPKETLVKLTKAE-DGGLGGRGVW---APATTGFSVGN--ENKFMQSYLQGT-VK -VKRG ->WP_042250442|Nitrospina_gracilis -----------------------------------------------MRLNRRKFLQVSAG -VASAMA--------LSSKRVG---AQLKP--VVK-VGNPLESYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKIRDLYGNQAD -AAWNPRMCLRGMTFPRRVYGPYRNKYPMLRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRMTWDDTFTYLAKGHVAVGKAYSGQRGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVVGKYGIYRLAN-MVGLLDAIIRGRGP -GQVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVTVCPEYNPPSTKADYWIPCRAGASDISIFLGCAKIIMDEGLV----D -------VDYVKDYTDMPLLVRTDNLIRLHPDDYIPG---YK---------NQPLPKD--- ----------------GFTTKWMKNFNRDKM---------PDFVVWDTNTDK--PVAVT-- --------REDIGAKMRKKNI------D---------------------PALDGVY----- -------------------------------------DIKLV-SGKTITVMPLYEM----- ----YKIHLKD-YDLDSVN-----------------------------QISHAPKDLVVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------SMVAE-----DPFNPVLDISKNVDWANVKG -YLK------GEEVGYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---SKLIWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYADFVLAANSWAEFESYEITSACSN-PFHQI----WGGTGIKPVF -DTIDDNLIHREFAKRLSQVT---------------------------------------- ----------------GDKRF--ADYVK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTAGMGYNIDDII-NGK ------YGEPGACLLLYRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEWGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYVYV -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTAMMKHSCWTSTERSVKAHEERP -DGRALSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKSKMKFMFGYEADNH -AIN-ATPKETLVKFSKAE-DGGMHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQY-- ----- ->WP_042251421|Nitrospina_gracilis -----------------------------------------------MRLNRRKFLQVSAG -VASAMA--------LSSKRVG---AQLKP--VVK-VGNPLESYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTFPRRVYGPYRNKYPMLRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRVTWDETFTYLAKGHVAIGKAYSGSRGAQRL-KNEG -YQPEMIEAM------GGSGSRSMKYRGGMGLLGVVGKYGIYRLAN-MMGLLDAIIRGRGP -GQVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVTVAPEYNPPATKADYWIPTRAGLADISIFLGVAKILMDEGLV----D -------GEYVKEYTDMPLLVRTDNLIRLHPEDYIPG---YK---------NQPLPKD--- ----------------GFTTKWMKNYDRDKM---------PDFVVWDTNTDK--PVALT-- --------REDIGAKMRRKNI------D---------------------PALDGVY----- -------------------------------------DIKLV-SGKTITVMPLYEM----- ----YKIHLKD-YDLDTVN-----------------------------QICHAPKDLVVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASFVPLMLTGNVGPKGS-G ---SHTWSGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPVLDVTKNVGWENIKA -YAK------GEEPGYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLLWFVNVN-VINNAKWFYE----------------MVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAANSWAEFESYEITSACSN-PFHQI----WGGTGIKPVF -DTIDDNLIHREFAKRLSQIT---------------------------------------- ----------------GDKRF--ADYMK--------------------------VYEG--- ----------------------------EAPNRTKAQIRRLFTTSTSGMGYNIDDII-NGK ------YGEPGCCLLLYRT----Y-PRSPFW----EMYTESK--PFYTAH----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYVYV -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTSMMKHSAWQSTERSVKAHEERP -DGRALSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKSKTKMKFVHGYEADNH -AIN-ATPKETLVKFSKAE-DGGMHGKGLW---EPARTGYTPESPLKDRFAEMYLAGQY-- ----- ->MBL09191|Acidiferrobacteraceae_bacterium -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LSSKKVG---AQLKP--VVK-VGNPLESYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVKDLYGNQAD -AAWNPRMCLRGMTFPRRAYGPYRNRYPMIRVGWKQ----------WAD----------DG -FPYLD-KANREKYKMTSRGTDEFVRMSWDDTFTYLSKGHIAVGRAYSGPRGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-MVALLDSIIRGRGP -GQVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDISVFLGCAKIIMDEGLV----D -------IEYVKDYTDMPLLVRTDNLKRLHADDFIPG---YK---------AQALPKD--- ----------------GFTTKWMKNFSRDQM---------PDFAVWDANTNK--PVAVT-- --------REDIGAKMRKKNI------D---------------------PVLDGVF----- -------------------------------------DVKLT-NGKTITVMPLYEM----- ----YKIHLKD-YDLDTVN-----------------------------QISHAPKDLVVRV -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPILDPAQNTDWKNVKG -YLK------GEEVSYW-----AH---------------RDEALIVNTP-----RYGRKVF -TGRSHMPTP---TKLFWFVNVN-VINNAKWFYE----------------LVFNTD--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFARRMSEVT---------------------------------------- ----------------GDKRF--GEFMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLMLFRT----Y-PRSPFW----EMFTESK--PYYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPYMGWKPSDPRYKVGRLMLRAKYNPAYPYHTTMMKHATWIGTERTVKAHEERP -XGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKFGYEADNH -AVN-ATPXEXLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYVR -VKI- ->TDJ60388|Nitrospina_sp -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LSSKRVG---AQLKP--VVK-VGNPLDSYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVKDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRLSWDQTYTYLAKGHIAVAKAYSGARGAQRL-KNEG -YQPEMIEAM------SGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-MMALLDSIIRGRGP -GQVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVTVAPEYNPPATKADYWIPVRAGLSDISVFLGAAKIIMDEGLV----D -------VPFVKEYTDMPLLVRTDTLVRLHPDDYIPG---YK---------VQALPKD--- ----------------GFTTKWLKNFNRSKM---------PDYTVWDTNTNK--PVAIT-- --------REDIGAKMLKKKI------D---------------------PALDGVY----- -------------------------------------DIKLV-SGKTITVMPMYEM----- ----YKIHLKD-YDLDTVN-----------------------------QISHAPKDLIIRL -SRDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---AHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFHIILDPAKNVDWKNVKG -YLK------GEEISYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLMWYVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIIAQDIEFTGSCEYSDIILAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLMHREFGKRMAQIT---------------------------------------- ----------------GDKRF--ADFMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRTPFW----EMYTESK--PYYTPN----------- --------------------GRLQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEEEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPYMGWKPSDPRYKVGRLMLRAKYNPAYPYHTTMMKHATWIGTERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-ATPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYTR -VKI- ->MSP_nxrA ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------MPLYEM----- ----YKIHLKD-YDLETVN-----------------------------QISHAPKDLVVRL -ARDM-----------GTIKPVEIHYGEGINHYFHAT-MHNRASFVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPEMDPAKNTTWAQIKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPVF -DTIDDNLIHREFAKRMAEVT---------------------------------------- ----------------GDKRF--ADYVK--------------------------VYEG--- ----------------------------EAPNRTKAQIRRLFTTGTTGMGYNIDDII-NGK ------YGEPGCCLMLFRT----Y-PRSPFW----EMFTESK--PYYTPH----------- --------------------GRLQFYNDEPEAIEWGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYVYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWTGTERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKSKMKFMHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->PIQ99248|_Nitrospinae_bacterium_CG11_big_fil_rev_8_21_14_0_20_45_15 -------------------------------------------------------MQVSAG -VATAMA--------LTSKKVG---AQLKP--VVK-VGNPLEAYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTFPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRMTWDQTFTYLAKGHVAVGKAYSGARGAQRL-KNEG -YQPEMIEAM------GGSGSRVMKYRGGMGLLGVVGKYGIYRLAN-MVALLDAIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDIALFLGCAKIIMDEGLV----D -------VNFVKEYTDMPLLVRTDTLMRLHPDDFIPG---YR---------NQDLPKD--- ----------------GFTTKWMKNFNRDKM---------PDFVVWDANTDK--PVAIT-- --------REDIGSKMKKKNI------D---------------------PVLDGVF----- -------------------------------------DIKLV-SGKTIPVMPLYEM----- ----YKVHLKD-YDIDTTN-----------------------------QICHAPKDLIVRL -ARDI-----------GTIMPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPVMDIAKNTDWANVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRSHMPCP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNCWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHRQFARRLAEVT---------------------------------------- ----------------GDKRF--SDYMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRSPFW----EMYTESK--PYYTPN----------- --------------------GRIQFYNDEPEAIEWGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWASTERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKSKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->Nitromaritima_KMP11423|SCGC_AAA799_A02 -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LTGKKVG---AQLKP--VVK-VGNPLDTYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKMTSRGTDEFVRLSWDQTFTYLAKGHVAVGKAYSGARGAQRL-KNEG -YQPEMIEAM------GGSGPRTMKYRGGMGLLGVVGKYGVYRLAN-QVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKMTIQWGKNLIENKMPEAH -WYTEIMERGGTLVAIAPEYNPPATKADYWVPVRAGLSDIALFLGVNKIIMEEGLV----D -------VDYVKDYTDMPLLVRTDNLIRLHPDDFIPG---YK---------AQQLPKD--- ----------------GFTTKWMKNYNRNQM---------PDFTVWDTNTNK--PVAIN-- --------REDIGAKMRKKNI------D---------------------PALDGVY----- -------------------------------------DVKLV-NGKTITVMPLYEM----- ----HKIHYKD-YDIDTVN-----------------------------QISHAPKDLIIRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASFTPLMLTGNVGPKGS-G ---SMTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----TPFDTELDPAKNIDWNRVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHRQFSRRLAEVT---------------------------------------- ----------------GDKRF--ADHMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRTPFW----EMYTESK--PFYTPN----------- --------------------GRTQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPFMGWKPSDPRYKVGRLMLRAKYNPAYPYHTTMMKHATWTATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYVR -VKI- ->cas150m-4_02474|CAS-150m-4914Perchloratereductasesubunitalphaprecursor ---------------------------------------------------------MSAG -VATAMA--------LSSKKVG---AQLKP--VVK-VGNPLDSYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRMTWDQTFTYLAKGHVAVGKAYSGVRGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVIGKYGVYRLAN-QVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDISIFLGVAKIIMDEGLV----D -------IDYVKDYTDMPLLVRTDNLIRLHPEDFIPG---YK---------VQPLPKD--- ----------------GFTTKWMKNFNRDKM---------PDFTVWDINTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVY----- -------------------------------------DIKLV-NGKTITVMPLYEM----- ----YKVHLKD-YDIDTVN-----------------------------QISHAPKDLILRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNTVLDASKNIDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHRQFSRRLAEVT---------------------------------------- ----------------GDKRF--ADHMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGACLLLFRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEFGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYVYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWTGTERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKSKMKFLHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->GCA_002705185_00880|PAJA01000060unannotatedprotein ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------------------------MTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDIALFLGVAKIIMDEGLV----D -------VDFVKDYTDMPLLVRTDTLVRLHPDDFIPG---YK---------AQALPKD--- ----------------GFTTKWMKNFNRDMM---------PDFTVWDTNTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVF----- -------------------------------------DIKLV-SGKTITAMPLYEM----- ----YKVHLKD-YDVDTTN-----------------------------QICHAPKDLIVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNTILDASKNVDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFSRRLAEVT---------------------------------------- ----------------GDKRF--ADHMK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRSPFW----EMYTESK--PYYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPXIR---PDXYGIPEDEQD---PDLRHVRNIKXPWSAVRTTXNFLWXXGXRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIXC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->MAX17737|Nitrospina_sp ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------------------------MTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDIALFLGVAKIIMDEGLV----D -------VDFVKDYTDMPLLVRTDTLVRLHPDDFIPG---YK---------AQALPKD--- ----------------GFTTKWMKNFNRDMM---------PDFTVWDTNTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVF----- -------------------------------------DIKLV-SGKTITAMPLYEM----- ----YKVHLKD-YDVDTTN-----------------------------QICHAPKDLIVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNTILDASKNVDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFSRRLAEVT---------------------------------------- ----------------GDKRF--ADHMK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRSPFW----EMYTESK--PYYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPXIR---PDXYGIPEDEQD---PDLRHVRNIKXPWSAVRTTXNFLWXXGXRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIXC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->GCA_001542995_01387|LFLA01000024unannotatedprotein -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LTSKRVG---AQLKP--VVK-VGNPLEAYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKMTSRGTDEFVRMTWDQTFTYLAKGHIAVAKAYSGARGAQRL-KNEG -YQPEMIEAM------SGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-QVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVAVAPEYNPPATKADYWIPVRAGLSDISLFLGVAKIIMDEGLV----D -------IDYVKDYTDMPLLVRTDTLIRLHPDDFIPG---YK---------AQSLPKD--- ----------------GFTTKWMKNFNRDMM---------PDYTVWDANTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PVLDGVF----- -------------------------------------DIKLV-SGKTITVMPLYEM----- ----YKVHLKD-YDIDTTN-----------------------------QICHAPKDLIVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNIVMDPSKNIDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLCWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFSRRMAEVT---------------------------------------- ----------------GDKRF--MDHMK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGACLLLFRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->GCA_002453875_01196|DKHT01000003unannotatedprotein -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LTSRRVG---AQLKP--VVK-VGNPLEAYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKMTSRGTDEFVRMTWDQTFTYLAKGHIAVAKAYSGARGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-MVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKMTIQWGKNLIENKMPEAH -WYTEIMERGGTLVAIAPEYNPPATKADYWVPVRAGLSDIALFLGCAKIIMDEGLV----D -------IDYVKDYTDMPLLVRTDTLIRLHPDDFIPG---YK---------AQSLPKD--- ----------------GFTTKWMKNFNRDMM---------PDYTVWDTNTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVF----- -------------------------------------DIKLV-NGKTITVMPLYEM----- ----YKIHLKD-YDLDTVN-----------------------------QICHAPKDLTLRL -ARDM-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPILDITKNVDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLCWYVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIILAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFGKRMAEVT---------------------------------------- ----------------GDKRF--SDFLK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLMLYRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINEGDYVYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-ATPKEVLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYVR -VKI- ->GCA_002454045_00625|DKID01000024unannotatedprotein -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LTSRRVG---AQLKP--VVK-VGNPLEAYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKMTSRGTDEFVRMTWDQTFTYLAKGHIAVAKAYSGARGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-MVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKMTIQWGKNLIENKMPEAH -WYTEIMERGGTLVAIAPEYNPPATKADYWVPVRAGLSDIALFLGCAKIIMDEGLV----D -------IDYVKDYTDMPLLVRTDTLIRLHPDDFIPG---YK---------AQSLPKD--- ----------------GFTTKWMKNFNRDMM---------PDYTVWDTNTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVF----- -------------------------------------DIKLV-NGKTITVMPLYEM----- ----YKIHLKD-YDLDTVN-----------------------------QICHAPKDLTLRL -ARDM-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPILDITKNVDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLCWYVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIILAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFGKRMAEVT---------------------------------------- ----------------GDKRF--SDFLK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLMLYRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINEGDYVYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-ATPKEVLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYVR -VKI- ->GBC85351|bacterium_sp_HR11 -----------------------------------------------MKLTRREFMQTTAA -GAAALV--------LDDALRG--LRLLQP--VVE-VGNPLAAYPNR------DW-EAVYR -DQYRY------DRSFTWVCS-PNCTHECRLRAFVRNGIVLRSEQNYDLHRISDLYGNKAT -AHWNPRGCLNGYTFQRRVYGPYRLKYPMIRRGWKQ----------WAD----------DG -FPELT-PENMAKYKFDSRGTDTFVRVSWDEAYTYVARGMIAIARRYSGEEGRRRL-LEQG -YPEEMLEHW------EGSGVRTFKLRGGMGLLGVIGKYGLYRFAN-MLALLDAHVRKVPP -EEAKGARIWSNYTWHGDQAPGQPFVHGLQTSDVDMNELRFARLHIQCGKNLVENKRPESH -FFIELMERGAKIVAIIPEYGPQATKADYWIPIRPA-TDAALWLGITRVMIDNGWY----D -------VDFLKKWSDMPLLIRTDTLRRLRAHEVFPG---YR---------GGLDPKG--- ---------------PSFQVQDLKPDQYEKI---------GDFVVFDEKSQS--LKPLT-- --------RDDVGGRLTAKGI------D---------------------PALSWRG----- -------------------------------------KVRLV-DGTEVECMTLWEA----- ----YKIHLQD-YDLDTVC-----------------------------EITHAPKELVLRL -ARDIWETTQEVRRQNPDMGAVAIHIGEGLNHWFHAT-EMNRAVYLPLILTGNIGKPGA-G ---CHTWAGNYKAALFQ-GSPWTGPGFL--------------------------------- -------------------------------GWIAE-----DPFHPLLDPKADGTQVKVKK -YTH------DEEPAYW-----NY---------------DDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKLMWFTNVN-LLNNAKWVYE----------------MIKNVN--PKV -ELIIAQDIEMTSSCEYADVILPANSWMEMETYEITASCSN-PFLQI----W-KGGIRPIF -DTKDDVLIMAELAKKLGEIL---------------------------------------- ----------------KDRRF--ADYWKF---A----------------------LER--- --------------------------------KTEVYIQRLLDTCTTTKGYRVEDIL-AGK ------YGEPGAALMLFRT----Y-PRVPFW----EQVHDDL--PFFTPT----------- --------------------GRLQAYNDEPEVIEYGENFIVHREGPEATPYL--PNVIVS- -SNPLIR---PEDYGIPLDHMG---RDERQVRNVKLPWSEVKKTKNPLWEKGYRFYCLTPK -TRHATHSSWQVTDWHLLYNNDFGDPYRLDKRSPGVGEAQLHMNPQAAKDLGINNGDYVYV -DANPADRPYVGWKPGDPFYRVARLMLRVKYNPAYPYHVVMMKHAAWIATEKSVRAHETRP -DGRALSED-TGYQASFRYGSQQSVT---VGWLMPMHQLDSLFHKAKAKVGFIFGGEADNH -AVN-TTPKETLVKVTKAE-DGGLGGKGVW---EPARTGYTAGD--EDDFMKRYLNGELVE -IVGE ->WP_099324707|Kuenenia_stuttgartiensis -----------------------------------------------MKLTRRAFLQVAGA -TGATLT--------LAKNAMA--FRLLKP--AVV-VDNPLDTYPDR------RW-ESVYR -DQYQY------DRTFTYCCS-PNDTHACRIRAFVRNNVMMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKR----------WAD----------DG -FPELT-PENKTKYMFDNRGNDELLRASWDEAFTYASKGIIHITKKYSGPEGAQKL-IDQG -YPKEMVDRM------QGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-CLAIVDAHNRGVGP -DQALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLLIQTGKNLIENKMPEAH -WVTEVMERGGKIVVITPEYSPSAQKADYWIPIRNN-TDTALFLGITKILIDNKWY----D -------ADYVKKFTDFPLLIRTDTLKRVSPKDIIPN---YK---------LQDISDG--- ---------------PSYHIQGLKDEQREII---------GDFVVWDAKSKG--PKAIT-- --------RDDVGETLVKKGI------D---------------------PVLEGSF----- -------------------------------------KLKTI-DGKEIEVMTLLEM----- ----YKIHLRD-YDIDSVV-----------------------------SMTNSPKDLIERL -AKDI-----------ATIKPVAIHYGEGVNHYFHAT-LMNRSYYLPVMLTGNVGYFGS-G ---SHTWAGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFKPNLDPYASAKDLNIKG -RAL------DEEVAYW-----NH---------------SERPLIVNTP-----KYGRKVF -TGKTHMPSP---TKVLWFTNVN-LINNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEITGSIEYADFAFPANSWVEFQEFEITNSCSN-PFIQI----WGKTGITPVY -ESKDDVKILAGMASKLGELL---------------------------------------- ----------------RDKRF--EDNWKF-------------------------AIEG--- --------------------------------RASVYINRLLDGSTTMKGYTCEDIL-NGK ------YGEPGVAMLLFRT----Y-PRHPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNAIVS- -TNPYIR---PDDYGIPENAEY---WEDRTVRNIKKSWEETKKTKNFLWEKGYHFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHIHPQAARDLGIEDGDYVYV -DANPADRPYEGWKPNDSFYKVSRLMLRAKYNPAYPYNCTMMKHSAWISSDKTVQAHETRP -DGRALSPS--GYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFIFGFEADNH -CIN-TVPKETLVKITKAE-NGGMGGKGVW---DPVKTGYTAGN--ENDFMKKFLNGELIK -VDA- ->NxrA_Candidatus_K_stuttgartiensis_CAJ72445 -----------------------------------------------MKLTRRAFLQVAGA -TGATLT--------LAKNAMA--FRLLKP--AVV-VDNPLDTYPDR------RW-ESVYR -DQYQY------DRTFTYCCS-PNDTHACRIRAFVRNNVMMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKR----------WAD----------DG -FPELT-PENKTKYMFDNRGNDELLRASWDEAFTYASKGIIHITKKYSGPEGAQKL-IDQG -YPKEMVDRM------QGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-CLAIVDAHNRGVGP -DQALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLLIQTGKNLIENKMPEAH -WVTEVMERGGKIVVITPEYSPSAQKADYWIPIRNN-TDTALFLGITKILIDNKWY----D -------ADYVKKFTDFPLLIRTDTLKRVSPKDIIPN---YK---------LQDISDG--- ---------------PSYHIQGLKDEQREII---------GDFVVWDAKSKG--PKAIT-- --------RDDVGETLVKKGI------D---------------------PVLEGSF----- -------------------------------------KLKTI-DGKEIEVMTLLEM----- ----YKIHLRD-YDIDSVV-----------------------------SMTNSPKDLIERL -AKDI-----------ATIKPVAIHYGEGVNHYFHAT-LMNRSYYLPVMLTGNVGYFGS-G ---SHTWAGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFKPNLDPYASAKDLNIKG -RAL------DEEVAYW-----NH---------------SERPLIVNTP-----KYGRKVF -TGKTHMPSP---TKVLWFTNVN-LINNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEITGSIEYADFAFPANSWVEFQEFEITNSCSN-PFIQI----WGKTGITPVY -ESKDDVKILAGMASKLGELL---------------------------------------- ----------------RDKRF--EDNWKF-------------------------AIEG--- --------------------------------RASVYINRLLDGSTTMKGYTCEDIL-NGK ------YGEPGVAMLLFRT----Y-PRHPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNAIVS- -TNPYIR---PDDYGIPENAEY---WEDRTVRNIKKSWEETKKTKNFLWEKGYHFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHIHPQAARDLGIEDGDYVYV -DANPADRPYEGWKPNDSFYKVSRLMLRAKYNPAYPYNCTMMKHSAWISSDKTVQAHETRP -DGRALS-P-SGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFIFGFEADNH -CIN-TVPKETLVKITKAE-NGGMGGKGVW---DPVKTGYTAGN--ENDFMKKFLNGELIK -VDA- ->OHB72803|Planctomycetes_bacterium_RBG_16_41_13 -----------------------------------------------MKLTRRAFLQVAGA -TGATLT--------LAKNAMA--FRLLKP--AVV-VDNPLDTYPDR------RW-ESVYR -DQYQY------DRTFTYCCS-PNDTHACRIRAFVRNNVMMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKR----------WAD----------DG -FPELT-PENKAKYMFDNRGNDELLRASWDEAFTYASKGILHITKKYSGPEGAQKL-IDQG -YPKEMVDRM------QGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-CLAIVDAHNRGVDP -DQALGGRNWTNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKIVVITPEYSPSSQKADYWIPIRNN-TDTALFLGITKILIDNKWY----D -------ADYVKKFTDFPLLVRTDTLKRVSPKDIIPN---YK---------LQDISEG--- ---------------PSYQIHGLKDEQREII---------GDFVVWDAKSKG--PKAIT-- --------RDDVGETLVKKGI------D---------------------PALEGSF----- -------------------------------------KLKTV-DGKEIEVMTLLEM----- ----YKIHLRD-YDIDSVV-----------------------------DMTNSPKDLIERL -AKDI-----------ATIKPVAIHYGEGVNHYFHAT-LMNRSYYLPVMLTGNVGYFGS-G ---SHTWAGNYKAANFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFKPNLDPYASAKDLNIKG -RAL------DEEVAYW-----NH---------------SERPLIVNTP-----KYGRKVF -TGKTHMPTP---TKIMWFTNVN-LINNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEITGSIEYADFAFPANSWVEFQEFEITTSCSN-PFIQI----WGKTGITPVY -ESKDDVKILAGMASKLGELL---------------------------------------- ----------------RDKRF--EDNWKF-------------------------AIEG--- --------------------------------RASVYINRLLDGSTTMKGYTCEDIL-NGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEVIEYGENFIVHREGPEATPYL--PNAIVS- -TNPYIR---PDDYGIPENAEH---WDDRTVRNIKKSWEETKKTKNFLWEKGYHFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHIHPQAARDLGIEDGDYVYV -DANPADRPYEGWKPNDAFYKVSRLMLRAKYNPAYPYNCTMMKHSAWISSDKTVQAHETRP -DGRALS-P-SGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -CIN-TVPKETLVKITKAE-NGGMGGKGVW---DPVKTGYTAGN--ENDFMKKFLNGELVK -VDA- ->WP_070066136|Brocadia_sapporoensis -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------IVNKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ERVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGSKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLLDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQGSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDVFSD---YK---------LEDISHG--- ---------------ASYKIQGLHDDQREII---------GDFVVWDAKTNG--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGIF----- -------------------------------------KVKTV-DGKEIEVMSLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIQRL -AHDI-----------AAIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYNGS-G ---SHTWAGNYKAANFQ-SAKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPSAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----RYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITNSCSN-PFVQI----W-KGGIRPVN -DSKDDVVIIAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIV-SGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTIRNIKKSWAETKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQVNINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYDVAMIKHSSWIATERTVKAHETRS -DGRALAAG-TGYQSSFRYGSQQSVT---RDWSMPMHQLDSLFHKSKIGMKFVFGFEGDNH -GIN-TVPKETLVKITKAE-DGGLGGKGLW---DPAKTGYTTGN--ENDFMKKYLSGELIK -IEKA ->RZV59451|Brocadia_sp_BROELEC01 -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------IANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ERVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLLDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQGSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDVFPD---YK---------LEDISHG--- ---------------ASYKIQGLHDDQREII---------GDFVVWDAKTNG--PKTIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGIF----- -------------------------------------KVKTV-DGKEIEVMSLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIQRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYSGS-G ---SHTWAGNYKAANFQ-SAKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPSAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----RYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEITGSIEYADFAFPANSWMEFETHEITNSCSN-PFVQI----W-KGGIRPVN -DSKDDVVIIAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIV-SGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQVNINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYDVAMIKHSSWIATERTVKAHETRS -DGRALAAG-TGYQSSFRYGSQQSVT---RDWSMPMHQLDSLFHKSKIGMKFVFGFEGDNH -GIN-TVPKETLVKITKAE-DGGLGGKGLW---DPAKTGYTTGN--ENDFMKKYLSGELIK -IEKA ->OHB44699|Planctomycetes_bacterium_GWE2_41_14 -----------------------------------------------MKLTRRTFLQIAGA -TGATFT--------IANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -DQYRY------DRTFTFVCS-PNDTHGCRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGALGIIGKYGMYRFNN-MLSLVDSHHRGVGA -DKALGGRNWSNYTWHGDQAPGHSFSHGLQASDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSSQKADYWIPIKCN-TDTALFLGVTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQPKDIFPD---YK---------LEDISHG--- ---------------ASYKIQGLHDDQREIV---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLVAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEVEVMPLFEM----- ----YKIHLRD-YDIDTVV-----------------------------EITNSPKELIQRL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LMNRSTYLPLMLTGNVGYNGS-G ---SHTWAGNYKAGNFQ-SAKWCGPGFY--------------------------------- -------------------------------GYVAE-----DAFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LINNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEVTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMVLAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYINRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGVPENAEH---WDERTIRNIKKSWSDTKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYGVTMIKHSSWIATERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKITKAE-DGGIGGKGVW---DPVKTGYTTGN--ENDFMKKYLNGELIK -VEKA ->WP_052562588|Brocadia_sinica -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------LANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGILHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKLHGLHDDQREII---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGTF----- -------------------------------------KVKTV-DGKEVEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIIRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYMGS-G ---SHTWAGNYKAGNFQ-SAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPDAPAMDLKIKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSNDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRAKYNSSYPYGVTMIKHSSWIATERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTTGN--ENDFMTKYLNGELIK -VEKA ->OOP57237|Brocadia_caroliniensis -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------VANKAMA--FRLLKP--AVE-VGNPLDAYPDR------TW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGSKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGLGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKIHGLHDDQREIL---------GDFVVWDAKTNG--PQPIT-- --------RDDVGDKLTAKGI------D---------------------PVLDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDVDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYMGS-G ---SHTWAGNYKAGNFQ-SAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFYQI----W-KGGIRPVN -DSKDDVMVIAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYINRLLDGSTTAKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGVPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYDVTMIKHSSWIATEKSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKVTKAE-DGGIGGKGLW---DPAKTGYTTGN--ENDFMKKYLNGELIK -VEKS ->RIK02127|Brocadia_sp -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------VANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDENLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDITHG--- ---------------PSYKLHGLHDDQREII---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLTAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDVDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYKGS-G ---SHTWAGNYKAGNFQ-AAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPSLDPTAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKVMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMVLAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYEVTMIKHSSWISTEKTVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKVCKAE-DGGIGGKGLW---DPAKTGYTTGN--ENDFMKKYLGGELIK -VEKA ->KKO18748|Brocadia_fulgida -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------VANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDENLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDITHG--- ---------------PSYKLHGLHDDQREII---------GDFVVWDAKTKG--PKPIT-- --------RDDVGDKLTAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDVDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYKGS-G ---SHTWAGNYKAGNFQ-AAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPTAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKVMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMVLAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYEVTMIKHSSWISTEKTVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKVCKAE-DGGIGGKGLW---DPAKTGYTTGN--ENDFMKKYLGGELIK -VEKA ->OQZ00558|Brocadia_sp_UTAMX2 -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------VANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDENLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDITHG--- ---------------PSYKLHGLHDDQREII---------GDFVVWDAKTKG--PKPIT-- --------RDDVGDKLTAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDVDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYKGS-G ---SHTWAGNYKAGNFQ-AAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPTAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKVMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMVLAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYEVTMIKHSSWISTEKTVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKVCKAE-DGGVGGKGLW---DPAKTGYTTGN--ENDFMKKYLGGELIK -VEKA ->TLD40744|Candidatus_Jettenia_ecosi ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------MLRCKYNPAYPYGVTMMKHSAWISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RNWSMPMHQLDSLFHKSKTSMKFIFGYEADNH -GIN-TTPKETLVKITKAE-DGGLGGKGLW---DPAKTGYTAGN--ENDFMKKYLSGELIK -VEKA ->TLD41279|Candidatus_Jettenia_ecosi ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------------------------MKHSACISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMKKYLSGELVK -MEKA ->WP_007220240|Jettenia_caeni -----------------------------------------------MKLTRRTFLQVTGA -TGATFT--------LANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -EQYRY------DRTFTYCCS-PNDTHACRVRAFVRNEVLMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGARKL-LDQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-SLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLVIQTGKNLIENKMPEAH -WLTQVFERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITRILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKIHGLHDDQREII---------GDFVVWDAKTKS--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LMNRSTYLPLMLTGNIGYPGS-G ---SHTWAGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPDAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSNDIEMTGSIEYADFAFPANSWAEFETHEITTSCSN-PFIQI----W-KGGIKPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDMRF--HDVWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTTKGYSFVDII-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQGYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPEDAEH---WDERTVRNIKKSWAETKKTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHMNPEAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMKKYLSGELIK -VEKA ->WP_007222969|Jettenia_caeni -----------------------------------------------MKLTRRTFLQVTGA -TGATFT--------LANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -EQYRY------DRTFTYCCS-PNDTHACRVRAFVRNEVLMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGARKL-LDQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-SLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLVIQTGKNLIENKMPEAH -WLTQVFERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITRILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKIHGLHDDQREII---------GDFVVWDAKTKS--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYPGS-G ---SHTWSGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPDAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSNDIEMTGSIEYADFAFPANSWAEFETHEITTSCSN-PFIQI----W-KGGIKPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDMRF--HDVWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTTKGYSFVDII-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQGYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPEDAEH---WDERTVRNIKKSWAETKKTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHMNPEAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RNWSMPMHQLDNLFHKSKTSMKFVFGYEADNH -GIN-TTPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMKKYLNGELIK -VEKA ->NxrA_planctomycete_KSU_1_ZP_10101005 -----------------------------------------------MKLTRRTFLQVTGA -TGATFT--------LANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -EQYRY------DRTFTYCCS-PNDTHACRVRAFVRNEVLMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGARKL-LDQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-SLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLVIQTGKNLIENKMPEAH -WLTQVFERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITRILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKIHGLHDDQREII---------GDFVVWDAKTKS--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYPGS-G ---SHTWSGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPDAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSNDIEMTGSIEYADFAFPANSWAEFETHEITTSCSN-PFIQI----W-KGGIKPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDMRF--HDVWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTTKGYSFVDII-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQGYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPEDAEH---WDERTVRNIKKSWAETKKTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHMNPEAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RNWSMPMHQLDNLFHKSKTSMKFVFGYEADNH -GIN-TTPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMKKYLNGELIK -VEKA ->WP_052561322|Brocadia_sinica -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------LTSKAMA--FRLLKP--AVE-VGNPLDVYPDR------AW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITRKYSGEEGAKKL-IGQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-TLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRADTLKRLQAKDIFPD---YK---------PEDISHG--- ---------------PSYKIHGLHDDQREMI---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGTF----- -------------------------------------EVKTV-GGKVIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPRELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNVGYKGS-G ---SHTWSGNYKAGNFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVSE-----DVFNPNLDPYAPATDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDLRF--RDYWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTLKGYTFEDIV-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNVIAS- -TNPYIR---PDDYGIPEGAEH---WDERTVRNIKKSWGEVKLTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHESRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TTPKETLVKITKAE-DGGMGGKGLW---EPAKTGYTPGN--ENDFMRRYLNGELIK -IEKE ->KXK29028|Brocadia_sinica -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------LTSKAMA--FRLLKP--AVE-VGNPLDVYPDR------AW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWIYAAKGIIHITRKYSGEEGAKKL-IGQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-TLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------PEDISHG--- ---------------PSYKIHGLHDDQREMI---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGTF----- -------------------------------------EVKTV-GGKVIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPRELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNVGYKGS-G ---SHTWSGNYKAGNFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVSE-----DVFNPNLDPYAPATDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDLRF--RDYWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTLKGYTFEDIV-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNVIAS- -TNPYIR---PDDYGIPEGAEH---WDERTVRNIKKSWGEVKLTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHESRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TTPKETLVKITKAE-DGGMGGKGLW---EPAKTGYTPGN--ENDFMRRYLNGELIK -IEKE ->OOP55454|Brocadia_caroliniensis -----------------------------------------------MKLTRRTFLQVAGA -TGATFS--------LADKTMA--FRLLKP--AVE-VGNPLDAYPDR------TW-ESVYR -DQYRY------DRSFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGFTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-TLALVDSHNRGLGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGLTRILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISQG--- ---------------PSFKMHGLHDDQRETI---------GDFVVWDAKTNG--PSPIT-- --------RDDVGDKLTAKGI------D---------------------PVLDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPRELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYKGS-G ---SHTWSGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPYAPATDLKVRG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKVMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEVTGSIEYADFAFPANSWAEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DSRDDVMILAGMAAKLGDLL---------------------------------------- ----------------RDMRF--RDYWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTLKGYTFDAIV-NGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATPYL--PNVIAS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAEVKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHINPQAAMDMGINDGDYVYV -DANPADRPYEGWKPSDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHESRP -DGRALSAD-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFIFGYEADNH -GIN-TTPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMRRYLSGELIK -IEKA ->KKO18624|Brocadia_fulgida -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------LADKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVLMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRRGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDEAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-TLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSAQKADYWIPVRCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDVFLN---YQ---------LEDISQG--- ---------------ASFKIHGLHDDQREII---------GDFVVWDTKTNS--PKPIT-- --------RDDVGDKLVGKGI------D---------------------PALDGTF----- -------------------------------------MVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNVGYKGS-G ---SHTWSGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEVTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DTKDDVMILAGMATKLGELL---------------------------------------- ----------------RDMRF--RDYWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIV-NGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRMQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDNYGIPESAEH---WDERTVRNIKKSWSDTKQTRNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRAKYNPSYPYGVTMMKHSAWISTERSVKAHESRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFIFGYEADNH -GIN-TTPKETLVKITKAE-DGGMGGKGVW---DPAKTGYTAGN--ENDFMKRYLNGELIK -IEKA ->WP_070067449|Brocadia_sapporoensis ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------------RGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGITKILMDEKLY----D -------ADYVKKFTDFPMLVRTDTLKRLQAKDIFPN---YQ---------LEDISQG--- ---------------VSYKIHGLHDDQREII---------GDFVVWDTKTNG--PKAIT-- --------RDDVGDKLVAKDI------D---------------------PALDGIF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYKGS-G ---SHTWSGNYKAANFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLRNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DTKDDVAILAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIM-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNVIVS- -TNPHIR---PDDYGIPENAEH---WDERTVRNIKKSWSDTKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQVNINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRAKYNSSYPYGVTMMKHSAWISTEKSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TVPKETLVKITKAE-DGGMGGKGLW---DPAKTGYTTGN--ENDFMKKYLNGELIK -IEKA ->RZV56287|Brocadia_sp_BROELEC01 -----------------------------------------------MKLTRRTFLQVTGA -AGATFT--------IANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRAFKGRGGMGLLGVIGKYGMYRFNN-MLSLLDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGITRILMDEKLY----D -------ADYVKKFTDFPMLVRTDTLKRLQAKDIFPN---YQ---------LEDISQG--- ---------------VSYKIHGLHDDQREII---------GDFVVWDTKTKG--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PALDGIF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYKGS-G ---SHTWSGNYKAANFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DTKDDVAILAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIM-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATPYL--PNVIVS- -TNPHIR---PDDYGIPESAEH---WDERTIRNIKKSWSDTKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQVNINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRAKYNSSYPYGVTMMKHSAWISTEKSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TVPKETLVKITKAE-DGGMGGKGLW---DPAKTGYTTGN--ENDFMKKYLNGELIK -IEKA ->OQZ04816|Brocadia_sp_UTAMX1 -----------------------------------------------MKLTRRTFLQVTGA -AGATFT--------IANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRAFKGRGGMGLLGVIGKYGMYRFNN-MLSLLDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLVENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGITKILMDEKLY----D -------ADYVKKFTDFPMLVRTDTLKRLQAKDIFPN---YQ---------LEDISQG--- ---------------VSYKIHGLHDDQREII---------GDFVVWDTKTKG--PKAIT-- --------RDDVGDKLVVKGI------D---------------------PALDGIF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYKGS-G ---SHTWSGNYKAANFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DTKDDVAILAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIM-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATPYL--PNVIVS- -TNPHIR---PDDYGIPENAEH---WDERTVRNIKKSWSDTKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRVKYNSSYPYGVTMMKHSAWISTEKSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TVPKETLVKITKAE-DGGMGGKGLW---DPAKTGYTTGN--ENDFMKKYLNGELIK -IEKA ->KRT68888|NC10_bacterium_CSP1_5 -----------------------------------------------MEITRRTFLKAAAT -GATAF---------LADDAWA--LRLLQP--AVE-VGNPLSEYPDR------GW-ERIYR -DQYGY------DRTFTFVCS-PNDTHACRLRAYVRNGVVMRIEQNYDVSRYADLYGNKAT -PHWNPRGCLKGYTLHRRVYGPYRVKYPLVRKGWKR----------WAD----------DG -FPDLT-PANKTKYRFDSRGTDELMRISWDDAYSYIAKGMIQIARRYSGEEGVRRL-REQG -YPEEMIRET------HGAGTRTFKCRGGMGLLGVIGKYGMYRFAN-TLALLDVHVRGVGP -DQALGGRTWSNYTWHGDQAPGHPYSHGLQGSDVDLNDFRFSKLHIQCGKNLIENKMPESH -FFNELMERGAKIVVITPEYSPPAAKADYWIPIRPN-TDTALFLGLTKILMEERHY----D -------AAFVKRFTDFPLLVRTDTLKRLRAHEVFPG---YR----------GRLPEN--- --------------GPSFTIQGLTKEQYEKL---------GDFVVFDAKSQS--LKPLT-- --------REDVGDRLAQQGT------D---------------------PTLDWQG----- -------------------------------------KVKLA-DGTEVEAMTLWAM----- ----YTIHLKD-YDLDTVH-----------------------------EITHSPKELIQRL -ARDI-----------ATIKPVAIHIGEGINHWFHAT-LSNRAFYLPLMLTGNIGVPGA-G ---SHTWAGNYKAALFQ-GSSWSGPGFK--------------------------------- -------------------------------GWVAE-----DPFNPNLDPNAPGQAVKVKG -YTK------DEEPAYW-----NH---------------GDLPLIVNTP-----KYGRKVF -TGLTHMPTP---TKVMFFNNVN-LINNAKHVYE----------------MLKNVN--PRV -EMIISVDIEMTASIEYADFALPANSWMEFQTPEITASCSN-PFLQI----W-KGGIKPLY -DSKDDVTILAELAQKLGAIV---------------------------------------- ----------------NDHRF--AAYWRF-------------------------ALEG--- --------------------------------RPEVYIQKLLDTSSTTAGYRVDEIM-AGK ------YGEPGACLMLFRT----Y-PRVPFW----EQVHDSD--PFYTDT----------- --------------------GRLHAYCDIPEAIEYGENFIVQREGPEATPYL--PNVIVS- -TNPYIR---PEDYGISPDAMH---WDERTVRNIKMAWADAKRTTNPLWEKGYRFFFLTPK -TRHRVHSQWSVCDWNQIWDSNFGDPYRMDKRMPGVGDHQLHMNPQAAKDLGINDGDYVYL -DANPADRPYIGWKPSDPFYRVSRCMVRVRYNPAYPYQVVMMKHAPYIATERTVKAHETRP -DGLALSE--TGYQANLRYGSQQSLT---RNWHMPMHQTDTLFHKAKATMSFLFGGEADNH -ALN-TVPKETLVKVTKAE-DGGMRGKGIW---EPARTGFTPGN--ESDFMKRYLAGEIVQ -IKKR ->OGW90704|PVC_group_Omnitrophica_bacterium_RIFCSPHIGHO2_02_FULL_63_14 ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------MIWDSNFGDPYRMDKRTPWVGENQLHINPQAGKALGINDGDYVYV -DANPADRPYIGAKPEDPFYKVARLMLRAKYNSAYPYHIVMMKHAPNIATERSVKAHETRP -DKRALS-E-LGYQSNFRYGSQQSIT---RNWHMPMHQTDSLFHKAKVFMGFLFGGEADNH -AVN-TVPKETLVRVTKAE-DGGLGGKGVW---APATTGYTPGA--ESEAMRKYIDGGFVS -T--- ->OGW87506|PVC_group_Omnitrophica_bacterium_RIFCSPLOWO2_01_FULL_45_10b -----------------------------------------------MNESRRDFLKISAV -TAVTLA--------LSNKPFL--LWALEP--VAN-VENPLAYYPNR------DW-EKIYR -DQYRY------DRTFSWVCS-PNDTHACRALAYVRNGIIIRSGSEYNYETYGDLYGNKAT -QNWNPRQCAKGFTFHRLMYGPYRLKYPLVRRGWRE----------WAD----------AG -FPDLT-PENKTKYKFDSRGTDQLEKATWDEAYTYIANGIMSIAKRYSGVEGKRKL-LAEG -YPEEMLAPM------KGAGTRTMKFRGGMGLLGVFGKYGMYRLAN-TMALLDVNIRGVSE -EGAMGGRAWSNYTWHGDQAPGHPWVHGLQNADCDFNDLRFSKLIIQDGKNLVENKLTDSH -WFIECMERGAKLVTISPEYSPPASKSDYWIPIRPQ-TDAALFLGITRLMIDQGWY----D -------KEFVAQFTDFPLLVRTDNLKRLRAADIFPD---YK---------LGLSKNG--- ---------------PSFKYQGLKQEQYEKL---------GDFVVWDETKGA--PVAIT-- --------RDDVGKNLSKKGI------N---------------------PALEGSY----- -------------------------------------KVKTV-DGKEIEVTTLFSL----- ----YKIHLRD-YDLDSVV-----------------------------EITKAPKDLIEQL -AKDI-----------AAIKPVAIHQGEGINHWFHAT-EMNRAAYLPLMLTGNIGQKGA-G ---AFGWAGNYKAALFQ-GSAWTGPGFK--------------------------------- -------------------------------GWVAE-----DPFHPNLDPQTPGKAINAHA -YFR------DEEPAYW-----NH---------------GDRALIVDTP-----AEGKKVF -TGSTHMPTP---TKAMLFTNVN-LINNAKHTYD----------------MLKNVN--PNV -EMILSIDIQMTASIEYADIALPANTWMESEGLEVTASCSN-PFLQI----W-KGGIPPIF -DSKDDLVILSEIAAKLGDLT---------------------------------------- ----------------GDARF--RDYWKF-------------------------ALEG--- --------------------------------KREVYIQRLLDSSTTTTGYKLDDIM-KGK ------YGPPGGALMLFRT----Y-PRIPFW----EQVHEDQ--PFYTDH----------- --------------------GRLQAYTDVPEAIEYGENFIVHREGPEATPYL--PNVIVS- -SNPYIR---PKDYGIPLDAEH---WDERTIRNVKLPWSEVKNTKNFLWEKGFQFFCLTPK -SRHRVHSLWSNVDWHQIWDSNFGDPYRMDKRTPGVGEQQIHLNPQAAKDLGINDGDYVYV -DANPADRPYRGAKPGDPFYKVARLMLRAKYNSAYPYHVAMMKHGTYIATEKSVKAHETRA -DKRALSEG-GAYQANFRYGSQQSVT---RNWHMPMHQTDTLFHKAKVFMSFIFGGEADNH -AVN-TVPKETLVRISKAE-DGGLGGKGLW---EPVKTGYTPAH--ENDVMKQYLHGGFIK -T--- ->KRT77589|Armatimonadetes_bacterium_CSP1_3 ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------MDFNELRHARLHIQVGKNLIENKMPESH -FFNELMERGAKIAVITPEYSPPAAKADYWMPIRPQ-TDAALFLGITRLMMDRRWY----D -------EAFVKQFTDFPLLIRKDTLKRLRAAEVFPG---YK----------PGLDPD--- --------------GPSFKRHNLKLDQYEKL---------GDFVVFDRKTRK--LQAIT-- --------RDQVGERLAQAGL------D---------------------PDLRWRG----- -------------------------------------KVKLI-DGREVECLTLWEA----- ----HRDHLRD-YDLDTVA-----------------------------EITQTPRAMIERL -ARDI-----------ATIKPVSIHIGEGINHWFHAT-LANRAFYLPLMLTGNIGKPGA-G ---CHTWAGNYKAGIFQ-GSPWTGPGIT--------------------------------- -------------------------------GWLFE-----DPFHAALDPATSGTEIKVKK -YLK------DEEPAYW-----DH---------------GDVPLIVNTP-----KAGRRVF -TGTTHMPTP---TKVMWYNNVN-IINNAKWAYG----------------VIKHVN--PNV -ELIINQDIEMTASAEYADIILPANSWVEFETPELTASCSN-PFLQI----W-KGGIKPLF -DTKDDGVIIAEVAAQLTAQT---------------------------------------- ----------------GDRRF--RDYFKY-------------------------LLER--- --------------------------------RPEVYIQRILDSSTSTVGYRVADVV-NGK ------YGEPGAALMLFRT----Y-PRIPFY----EQVHDSE--PFYTDT----------- --------------------GRLNSYCDIPEAIEYGENFIVHREGPEATPYL--PNVIVT- -TNPLVR---PEDYGIPLDALH---WDQRTVRNVKLAWRDVKKTKNPLWEQGYRFYLLTPK -TRHRVHSSWSTVDWNMIWDSNFGDPYRLDKRAPGVGEHQLHIHPQAARDLGINDGDYVYV -DAYAADRPYIGWKPSDPFYRVARCMVRVRFNPAYPYSVLMMKHAPFMATEKSVRAHETRP -DKLARSAD-TGYQANLRYGSQQSVT---RDWLMPMHQTDTLFHKSKGTMAFIFGGEADNH -AVN-TVPKETLVKITKAE-DGGIGGKGLW---EPARTGFSPGR--EGDFMKRYLAGTLVK -VTKR ->OUC07869|Chloroflexi_Litorilinea_aerophila ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------EITASCSN-PFLQI----W-KGGIPPLY -NTRDDARILAEVSAALADEI---------------------------------------- ----------------GEPRL--RDYWRF-------------------------ILEG--- --------------------------------RPEIYIQRLLDSSLTTSGYRVEDII-AGK ------YGEPGAALMLFRT----Y-PRIPFW----EQIHDSV--PFYTDT----------- --------------------GRLNSYCDIPEAIEYGENIISHREGPEATPYL--PNVIVT- -RSRFVR---PEDYGIPADHMG---WEERTVRNIALPWNQVKETKNPLWAQGFHFYCLTPK -TRHRVHSSWSTVDWTIILDSNFGDPYRADKRLPGPGDHQLHMNPQAAKDLGIEDGDYVYV -DANPADRPYIGWKPDDPFYKVARLMLRVKYNPAYPYHIVMLKHGPFMATEKSVKAHETRP -DGLAKSEG-TGYMANLRYGSQQSVT---RDWSMPMHQTDTLFHKQKTGMQFIFGGEADNH -ALN-TVPKETLVRIVKAE-DGGLDGKGPW---EPTKTGYTPAH--ENEFMLRYLAGETIE -VTT- ->RCK74665|Chloroflexi_Anaerolineae_bacterium ----------------------------------------------MSHLSRREFLKLSSV -AALGTV--------INDLD----WKLLDP---IQ-VDNPLAAYPSR------DW-EAVYR -NQYRY------DSSFTFVCS-PNDTHACRLRAFVRNGIILRAEQNYDVERYSDLFGNTAT -AHWHPRGCKKGQTFHRRLYGPHRLKGPLMRKGWKE----------WAD----------AG -FPELD-EENKTKYKFNARGQDELLPVSWETAYDYIARGMIAIARRYSGEEGARLL-RKQG -YPEEMIQAM------SGAGTRTFKCRGGMGLLGVIGKYGMYRFAN-MLALLDVHVRNVPP -EEAKGGRTWSNYTWHGDQAPGIPFVTGLQASDEDLNDLRNSRLHIQCGKNLVENKMAESH -FFIEAMERGAKIVTITPEYSPPATKSDYWIPIRPA-TDTALFLGLARWIIENQKY----D -------EQFVKRFTDFPTLVRADTLKRLRADEVFSN---YQ---------PGLDPQG--- ---------------ASFTLQGLKPEQYEKL---------GDYVVINEKTGR--PQAIT-- --------RDQVGEVMDKAGI------Q---------------------PLLDWKG----- -------------------------------------KLRLV-DGSEVEVLTVWSM----- ----YLEHLKD-YDLETVL-----------------------------EITHVPKDLFLRL -AEDI-----------TTLSPVALHIGEGINHWFHAT-LANRAQFLPLMLTGNIGKPGA-G ---LYTWAGNYKAALFQ-GSAQSGPGFK--------------------------------- -------------------------------GWVGE-----DPFAPNLDENASGKEIKVHA -YTK------DEEPAYW-----NH---------------SERPLIVDTP-----KYGRKVF -TGQTHMPTP---TKVQFFTNVN-LLNNAKHHYE----------------MIKNVN--PNV -ELIISVDIEMTSTVEYADFALAANTWAEFETYEITASCSN-PFLQI----W-KGGIPPLY -DSRDDARILGELAARLGELL---------------------------------------- ----------------EDNRF--RDYWKF-------------------------ILEG--- --------------------------------RPEVYIQRLLDSSITTSGYRFTDII-EGK ------YGEPGAALMLFRT----Y-PRIPFW----EQIHDSI--PFYTDT----------- --------------------GRMNTYCDIPEAIEYGENLISHRESPEATPYL--PNVIVT- -SSRFVR---PEDYGIPPDATG---WEERTVRNLKMPWSEVKNTRNFLWEAGYHFYCLTPK -TRHRVHSSWSTVDWTLILDSNFSDPYRVDRRQPGVGEHQLHINPQAAKDLGLEDGDYVYV -DANPADRPYIGWKAEDPFYRVARLMLRVKYNPAYPYHIVMLKHGPFMATEKSVLAHETRP -DGLARSAD-TGYQANLRYGSQQSIT---RDWSMPMHQTDSLFHKQKTAMQFIFGGEADNH -ALN-TVPKETLVRIVKAE-DGGIEGKGIW---EPAKSGYTPAH--ENEFMSLYLQGKTIE -IKR- ->GCA_001803565_00046|MHDQ01000004unannotatedprotein --------------------------------------------MSFDRVSRRQFLETLAA -TATAAL--------VSKPAIGLALEKLQP--IPE-IKNPLEHYPPR------EW-EKIYR -DIYNP------DSSYIFACT-PNDTHNCYLRAYIKNGIVTRIGPSQRYRDATDIYETKAS -ARWDPRICNKGVAMVGRFYGDRRVKYPTVRKGFKE----------WVE----------KG -FPRD--ENGQPPLKYFKRGEDQWEKVSWDEAYTIVAQSMIDTVKTYSGTKGAELL-QKQG -YDAKMIEKM------MGAGTQAMKFRGGMPLLGVIKLFGLYRMAN-SMALLDSYIRGVGP -DKAIGGIGFDNYSWHTDLPPGHPMVTGQQTIDFDLVNAEYANIILCWGMNWICTKMPDGH -WLSEARLKGAKVVTITTDYNSTSSKADEIVIIRPG-TDPAFALGLAQVIINERLY----D -------EEFVEGFTDLPFLVRMDTRELLRAHEIISG---YN---------NAELKYT--- -RVIKKEEKPPPPFATNLGMPAVSSDMRQEW---------GDFVVWDSNAKK--ATPVS-- --------RDDTGERFTNKGV------K---------------------PALEGEF----- -------------------------------------EISLT-NGEKIKVRPIFDI----- ----IKQHLEDTWNVDSTS-----------------------------KITWAPKEAIINL -AREI----------AANKEKVLFTVGMGPNQLFNAD-QKDRAIFLVAALTRNVGFFGG-N ---VGSYAGNYRAALFN--------GMP--------------------------------- -------------------------------QYIAE-----DPFNIILDPTKPA---KVKP -YFK------MQSAHFY-----AH---------------GDTPLKVHDI----------YF -NGETHMPTP---TKFFWFAASNSILGNSKGMYD----------------VVMNLLRNRKI -EAVVVNEWWWSASCEYADVVLPADSWGEYNVHDMTASVTN-PFVMV----MPLTGVSRIW -DTKSDSETYAGVSEKLGELT---------------------------------------- ----------------GDSRF--KDYWRF-------------------------IADG--- --------------------------------KAKPYLQRIIDHSNTMKGYQIDNLISKAK ------DGIP--ALLMSRT----Y-PKFIGY----DQSVESA--PWYNKT----------- --------------------GRLEFYREEPEFLDYGENLPVHREPVDATFYE--PNVIVAK -GHPLIKPKTPTDYGWPMDDLS---GETRQVRNVVYTPDELLNTKHPLRKEGFTHIYLTPK -FRHAVHTFGVDLDLLSIWFGPFGDMYRRDKRKPWVNEGYVEINPDDARELGIEDGDYIWV -DPDPKDRPFKGWQDKPADYKVARCLLRARYHPNLPKGITRTWFNMYQATHGSVRGHESRK -DGLARNPD-TNYQSMYRYGGHQSST---RSWLRPTLLTDTLVRKNLMGQMIGKGFEPDVH -CAN-GAPRESFVKFTRAE-DGGESGKGKW---RPAVLGFRTGY--ENVAMKKYIKGGFIS -KGGK ->SPS06998|Nitrotoga_fabula ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRLGFKA----------WCD----------AG -YPRTG-ANGFPDPKFLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGVKTMKFRSGMAALGVLRIYTLKRFAQ-GLALLDAYVRNVGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMAYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGAHIVDISIDYHATANKADDVIILRPG-TDPALGLGVCHYLIKHNYY----D -------EDYLRANTDMPLLVRTDNWKNLKASDIIPN---YE---------LAELTHH--L -KVMKPGEKPTQPVAFQ-ATAFVAEDVRKFW---------GDNVVWDLNTNK--AVPLT-- --------RDECGARYAAKGV------K---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTPENTS-----------------------------IMTGVPVEAIVDL -SNLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLAALTDNVGHVGGCS ---YGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QFLME-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPMRRVQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADFFKF-----------------VGTNPAGNPSDR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENITVYRTPIDSSHYE--PNVIVGH -CRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRIYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ENKQMRTYLQGAFTR -R--- ->SPS06751|Nitrotoga_fabula ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRLGFKA----------WCD----------AG -YPRTG-ANGFPDPKFLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGVKTMKFRSGMAALGVLRIYTLKRFAQ-GLALLDAYVRNVGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMAYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGAHIVDISIDYHATANKADDVIILRPG-TDPALGLGVCHYLIKHNYY----D -------EDYLRANTDMPLLVRTDNWKNLKASDIIPN---YE---------LAELTHH--L -KVMKPGEKPTQPVAFQ-ATAFVAEDVRKFW---------GDNVVWDLNTNK--AVPLT-- --------RDECGARYAAKGV------K---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTPENTS-----------------------------IMTGVPVEAIVDL -SNLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLAALTDNVGHVGGCS ---YGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QFLME-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPMRRVQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADFFKF-----------------VGTNPAGNPSDR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENITVYRTPIDSSHYE--PNVIVGH -CRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRIYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ENKQMRTYLQGAFTR -R--- ->RFC37636|Nitrotoga_sp_CP45 ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAD----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSMKRFAQ-GLALLDAYVRNIGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATSNKADDVIILRPG-TDPALGLGVCHLLIKNNHY----D -------ENYLRANTDLPLLIRTDNWKNLKASDIIAD---YK---------LADLTHH--L -KVMKPGEHPTMPPAFQ-ATAFVAEDVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTAENTS-----------------------------IMTGVPVEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATNHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GSPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLKGGFIS -R--- ->RFC33776|Nitrotoga_sp_LAW ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAD----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSMKRFAQ-GLALLDAYVRNVGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATSNKADDVIILRPG-TDPALGLGVCHLLIKNNHY----D -------ENYLRANTDLPLLIRTDNWKNLKASDIIAD---YK---------LADLTHH--L -KVMKPGEHPTMPPAFQ-ATAFVAEDVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTAENTS-----------------------------IMTGVPVEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NF---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATNHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLKGGFIS -R--- ->RFC30723|Nitrotoga_sp_MKT ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAD----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSMKRFAQ-GLALLDAYVRNVGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATSNKADDVIILRPG-TDPALGLGVCHLLIKNNHY----D -------ENYLRANTDLPLLIRTDNWKNLKASDIIAD---YK---------LADLTHH--L -KVMKPGEHPTMPPAFQ-STAFVAEDVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTPENTS-----------------------------IMTGVPVEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NF---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATNHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLKGGFIS -R--- ->RFC31618|Nitrotoga_sp_SPKER --------------------------------------------------------KLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAE----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSLKRFAQ-GLALLDAYVRNIGA -DEASGAKVLDSYSWHTDLAPGCPMVTGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATSNKADDVIILRPG-TDPALGLGVCHLLIKNNHY----D -------ENYLRANTDMPLLIRTDNWKNLKASDIIPD---YK---------LAELTHH--L -KVMKPGEGPTMPPAFQ-STAFVSEEVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGEY----- -------------------------------------EVTLV-DGKKIKVTPVFQL----- ----QKEYLEE-YTAENTS-----------------------------IMTGVPSEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KMAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTALT---------------------------------------- ----------------GDQRF--ADFFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--TIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGH -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GSPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLQGGFIS -R--- ->BBJ23760|Nitrotoga_sp_AM1 ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAE----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSLKRFSQ-GLALLDAYVRNIGP -DEASGAKVLDSYSWHTDLAPGCPMVTGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATANKADDVIIIRPG-TDPALGLGVCHLLIKNNQY----D -------ENYLRANTDMPLLIRTDNWKNLKASDIFPD---YK---------LAELTHH--L -KVMKPGENPTQPVAFQ-STAFVSEEVRKFW---------GDNVVWDRKTNK--AVPLT-- --------RDECGARYAAKGV------D---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVTTVFQL----- ----HKEYLEE-YTAENTS-----------------------------IMTGAPMEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTALT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGVP--TIFMART----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GSPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLQGGFIS -R--- ->BBJ23368|Nitrotoga_sp_AM1 ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAE----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSLKRFSQ-GLALLDAYVRNIGP -DEASGAKVLDSYSWHTDLAPGCPMVTGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATANKADDVIIIRPG-TDPALGLGVCHLLIKNNQY----D -------ENYLRANTDMPLLIRTDNWKNLKASDIFPD---YK---------LAELTHH--L -KVMKPGENPTQPVAFQ-STAFVSEEVRKFW---------GDNVVWDRKTNK--AVPLT-- --------RDECGARYAAKGV------D---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVTTVFQL----- ----HKEYLEE-YTAENTS-----------------------------IMTGAPMEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTALT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGVP--TIFMART----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GSPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLQGGFIS -R--- ->BBJ23476|Nitrotoga_sp_AM1 ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRAGFKA----------WVE----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYAGDKGAALL-TRQG -YDPEMIASM------HGCGCKVMKFRAGMAALGVLRIYSLKRFAQ-GLALLDAYVRNIGS -DEASGAKVMDSYSWHTDLAPGCPMVSGHQQLDYEFMAYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATANKADDVIIIRPG-TDPALGLGVCHLLIKNNQY----D -------ENYLRANTDMPLLIRTDNWKNLKASDIFPD---YK---------LAELTHH--L -KVMKPGEEPTQPVAFQ-ATAFVSEEVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGEY----- -------------------------------------EVTLV-DGKKIKVAPVFQL----- ----QKEYLEE-FTAENTS-----------------------------IMTGAPMEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTALT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGVP--TIFMART----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HVAAKGYRPTY--ESLQMRTYLQGGFIS -R--- ->blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1348658_11 rank: C; deu:DBW_2564 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------KEIGIVDNDWV-- ----------------EAYNDHGVTVTRAIVSARIPSGICILYHAPE-------------- ---RTISVPKSPMRGNKRAGGHNSPT---RVHLKPSLMVGGYGQ---------FTYSFNYW -GPT-GVNRDTFILVRKLP------GKPEF------------------------------- ----- ->CRI68048|Thiocapsa_sp_KS1 ------------------------------------------------------------- -------------------MSK--TKDDNG--NGG-SRWFRELDEPR------KW-EDFYR -RRWQY------DKSVRTSHS-VNCSGSCSWEVFVKNGMITWELQKTDWPQI-----NDET -PNYEPRGCQRGISASWYPYSPVRPKYPYVRAVLLDFWRAERAAGKDPI----------AA -WGAIVENPERSKAYRNARGKAGWRRTTWDEATEIIAAAKIYTIKEH-------------- ----------GADHLASFSPIPAMSMVSFLSGHRL-------------------------- -SNLLGGTMLSFYEWYHDLPHVMPMIWGDQTDVHESADWYQSAYWIVMGSNLPMTRTADAH -FASEHKYNGGKLVNLSPDYSDVTKFADLWVPVRPG-TDTAFILSCIHVILQEFHV----N -RRSEYFHSYVAQYTNLPFLVILD-----QEGDHFASGRFLR---------ASDVAAY--- ---------------------AD--EELADW----------KLPCFD-KEGE--LRLPGGT -LGFRWEEKNTGRWNLKNEDAVTAQPFD---------------------PLLTLMDGEFEE -VIVEYADFTHTFNVEFGTTALRGEKARKSLRGVPSRVLTKK-DGTK---VRVATA----- ----YDLLLAS-FGVNRGLSGSGYPKDYDDASEAYTPAWQE-------QETGVDRNLAIRV -AREW------ADTAEKTKGKCLFITGSGILHWYHGGSLTYRSEAVMGILTGCQGRNGG-G ---FAHYVGTEKIRNMA---AIGTIGNAADWGNVGRQQNSTSYFYFHTDQWR-YDGMSLDP -LWAPRAKEMPARANHAADMNAVAVRNGWLPFFPQF-----DERNPTDVMQDARKAGCKSL -EDVK-----TWVAQQF-----KE---------------RKLKFALPNVDAPK-NHPKVLW -IYRGNLIGT---SMRGHELNLKHMLGTHNNVLGGETRA----KDMVNEIDWTENAPLGKL -DLIYNVNLRMDSSANYSDIVLPTAHWYEKFDLTCTD--LH-SFLHP----F-TPAHDPAY -ESKHDWEAFRLIAEKISELAKVHLPDPIEDLVMTALSTDTPDEMAQPM---GELRDWWKG -ESEPIPGKTFPNVSVVTRDY--TKIHDMYTTLGPAVTKPNSYGAKGIKGDLAEVYEQMKE -SYLVGEKQGRPNMETAAKVCEVILRISPESDGELSY-----------QIFKNLEKR---- ------CGVPLAHIVEPER----E-TAYHYP-DLISQPRRALTSPHWSAIETKGRTYSPWT -LNIEALKPFHTLT------GRQEIYYDHRMFRDLGEDFPVYKPPVDMV--S--IGDVAQ- -------------------------KDIKMKGAKLFRF-------------------ITPH -QKWGIHSMFGDSWQMQNMFR---------------GGPTVWINDDDARDIGVKDNDWV-- ----------------EIFNENGIQVARAVVSHTVPRDMSIVYHQTERH-------VNVP- ---FSSLAR-ERGASDLRGGNNNATT---RIMMNPATMVGGYANWTYWLNYQGTS------ -----PSERDCVVLIRKKP-METRGRKVIY---QESQL--------NVGA----------- ----- ->NASQAN2011_330_B_bin.17_k121_430440_3 rank: A; amyy:YIM_22320 narG; Nitrate reductase alpha subunit; K00370 (db=kegg) -----------------------------------------------------MFHNASLG -HTATMGRTDDVPNGTEEALIK--FGRFFAGGEVSKDLLSVTKAGGR------EG-DVFYR -DRWSH------DKVVRSTHG-VNCTGSCSWKVYVKDGIITWETQQTDYPSVG-----PDS -PEYEPRGCPRGAAFSWYTYSPTRIRFPYIRSVLLE---------MYREAKGRL-GDSVLA -WADVVDNSENRQRYHRARGKGGLVRVSWSEVSEIIAAAHVHTIKKY----GPDRI-FGFS -PIPAMSMAS------HAAGARFISL----------------------------------- ----MGGSMLSFYDWYADLPVASPQVFGDQTDVPESADWFNASYLIMWGSNVPVTRTPDAH -FMTEARYKGQKVIAISPDYADNTKFADEWVAPHPG-TDGALGMAMGHVILKEFFV----D -KQVPRFQDYVKKFTDLPYLVSLRK----KDGSWVPDKFLVASD-------LGDVSEG--- -----SRFKTVVLDSSTGETFVPNGSLGHRY-------NDSSTGKWNLDLEGVDPLLSV-- --------YGKKGAVSAPVLM----------------------------PRFDQGQ----- -------------------------------------EVSES-GGVLARGVPVIEIAGKTV -TTVYDLMLAQ-YGVAREG--------LDGDWPEGYDDRSPYTPSWQEEITSVPAVQAIRI -AREF------AQNAIDSEGRSMILLGAGTNHWFHSD-TMYRTFLALVTLTGCQGVNGG-G ---WAHYVGQEKCRPVT---GWAQLAFGADWSRPARQMIGTAFWYVSTDQWRYDALGSDLL -------ATPLGEGRFKDMTAIDVIAQSARMGWMPS-----YPSLN-RNSLDLVDEAREKG -VDPA-----QHVINEL-----KS---------------GDLQFAIENPDAPE-NWPRVLT -VWRANILGS---SSKGNEYFLKHLLGTDNSVRA----NENEPDARPKDVKWHEDAPEGKL -DLLVSVDFRMTSTGLFGDILLPAATW--YEKHDLSSTDMH-PFVHA----F-TPAINPPW -ETKTDYEIFQMLGRQVSEQAKGHLGER-EDLVVVPLLHDTPDAMATPG---GVVLDWKKG -EVEPIPGVTMPKLVVVKRDY--SQIGEKMAALGPLIDTLGTNTKGVPVSVLPEIELL--- -------RHSNGVASTGVGAGRPSLARDVDACEAILALSGTTNGRVAVAGFRALEKR---- ------TGQKLTDLALDNE----G-KRITFA-DTQARPVPVITSPEWSGSEHGGRRYTAFA -INVERLKPWHTLT------GRQHFFIDHDWMSELGEQLPVFRPPLNMHRIF--GS----- -------------------------QGDGVAKEVTVRY-------------------LTPH -SKWSIHSEYQDNLFMLSLSR---------------GGQEIWMSVEDAEIIGVKDNEWI-- ----------------EAYNRNGVVVARACISHRMPSGTVFMYHAKD-------------- ---RVVDVP-LAETSGKRGGIHNSLT---RLVIKPTHLIGGYAQ---------LTFAFNYL -GPT-GNQRDEVTVIRRRS--------------------------QDVEY----------- ----- ->GCA_003453735_00577|DMNE01000186unannotatedprotein ------------------------------------------------------------- --------------------MG--------------WIKDIFDPKAR------LW-EEFYR -SRWQY------DKKVRSTHG-VNCTGGCSWEVYVKDGIITWEMQETDYPLLE-----PGL -PHYEPRGCQRGITFSWYIYSPLRIKYPYIRGVLLD---------LWRKAKSIH-TDTVAA -WESVVENEESRRSYQKARGKGGLRRTTWEEALEIIAASTIYTAKKY----GPDRV-IGFT -PIPAMSMLS------YASGTRFLQL----------------------------------- ----FGGVALSFYDWYADLPPASPEVWGEKTDVAESADWYNSKYIVAMGANLSMTRTPDVH -FVAEARNNGTKLVVLSPDFSQVSKYADWWLPVTAG-HDGAFWMAVDHVILKEFFV----D -RQVQYFSDYLKRYSDAPFLVEIE-----GGEGSLRAGRFLR---------ANTLSRY--R -DAENGEWKLLVFDGKAKEPRMPNGSVGFRW--------QERKGQWNLEM----------- --------KDGADDTIIQPLLSLFEDRD---------------------AAVSINF----- ---------------------TEFASGRTFKRAVPVKYLQTE-KGR----VLVATV----- ----FDLLMAQ-MGVGRGL--------EGDFAEDYNDAERPYTPAWQEQFTGVSRDTLVCF -AREW------AVTAEKTKGKCTIIVGSGVNHWYHSN-LNYRAGITALILCGCVGVNGG-G ---MNHYTGQEKVAPEA---SWKSIAFALDWIKPPRLQNTPSFHYVHSDQWRYAE------ --------PENGIKVLEYMHPMDVLVNAVRMGWLPF-----YPQFN-RNPIDLVREAEESG -AKS------EQEIIEWLVLQLKD---------------KKIRFAVEDPDAPE-NWPRVWY -IWRGNAILA---SMKGHEYVLKHYLGTSTNAVA-----DEIVSASIKEVHSKGSAPEGKL -DLVIDINFRMDTSALFSDIILPAATW--YEKDDLNTTDLH-SFIHP----L-SAAVPPCW -EAKNDWDIFKEIALKISQLAPAHFSEPFREIVATPLMHDTRQEISQPQ-----VKDWHKD -KCQAIPGKTMPKFSVVERDY--TNLFKQFISYGHKEKEEGMGERGIQWKIGDMYDEF--- --------MKGVPVEQWGGERYPSLSEARDAANVILHFAPETNGEIAYRGFKALEEI---- ------TGMPLSDLAERQR----S-VRTIFP-DLLDQPKRILTSPCWSGITNGGRAYAPYC -INVERLMPWRTLTGRQHXAGRQHFYLDHEGYISFGENLPTFKSRVLLQN----------- ----------SGDIG----------KSTAIEKSLVLNF-------------------LTPH -GKWHMHTTYYDNLLMLTLSR---------------GVEPFWLNSKDAEDIGVKDNDWV-- ----------------EVYNDNGVVVTRAVVSARTPAGVGIFYHAPERT------------ ----ISFPK-SPLRNMKRGGGTNSLT---RIRLKPVLMVGGYAQ---------FSYAFNYW -GPI-GPDRDTYAYVHKLD------GKPVF------------------------------- ----- ->sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_391728_1 rank: A; deu:DBW_2564 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ---------------MRGALLD-------------------------------LW-QEARR -QH-------------------------------------------------------PDD -PV--------------------------------------------------------AA -WASITDDPARRKRYQEARGKGGFRRVSWSEAQELIAAANLHTVKKY----GPDRL-VGFS -PIPAMSMIS------YAAGARFLQL----------------------------------- ----MGGLCLSFYDWYCDLPPASPEIWGEQTDVAESADWFHSKFIATVGSNVLMTRTPDAH -FLVEARHKGAKVVVFSPDFSQTSKVADEWIPINQG-SDTAFWMAVNHVILREFHA----E -RSVPYFQTYLRENTDAGFLVVMKA----DAQGNYRPGSLLR---------ASQLAET--Q -GEENAEWKSFVLD-TQGNLRVPVGQVGHRW--------QKSKGQWNIKQED--ARTGE-- --------AFEAALTLRDSAT----------------------------GAVKAVF----- ------------------DDFSEGRTDRVRVREVPVREVQTV-EGP----VYVTTV----- ----YDLHLAQ-HGVNRGF--------GGDWPTGYADDTHPFTPAWQEQYTGIKAETVINF -ARQW------ATTAEKSQGKCTVIIGAGVNHWYHNN-LIYRACINALIYCGCVGRNGG-G ---LNHYVGQEKLVPQA---SWGPIAFGTDWSAPPRLQNAPSFHYMHSDQWRYDRKFDEMC -------PVADKSHLMASGHTADKQALAVRSGWLPC-----YPQFTEHN-FKLVQEAEDRG -ADPV-----QHVVGRL-----KD---------------RSLKFAMEDVDNPA-CFPRVWY -IWRGNAIQA---SAKGHEYFLKHYLGTHHNSIA-----VEHAREDVKEVTWHDKLELGKM -DLIVDVNFRMDTSALYSDIVLPTASW--YEKDDLSSTDMH-SFIHP----L-QAAVPPCW -EAKSDWKIFRGIAEETSRMAQRYLPEPVKDFVCTPLMHDTPAEIAQPT-----VKDWAKG -ECEAIPGKTMPNMKVVERDY--TKIFQKYITLGRNFRNNGLGIHGTTYPVDDLYDAY--- --------LQDHPVEEVDGERYPSLRADRSVCEAILHFAAETNGELAYRAYEAESHK---- ------TGIDHTHLAAPTR----G-VRYNFA-DLCTQPRRSLTTPFWTGITNGSRTYSAYC -QNVEERIPWRTLT------GRQHLYFDHEAYVAYGEHLPTFKPRADLRTTR--DLDMTG- ----------------------------VESGALVLNY-------------------LTPH -GKWHIHSTFGDTLRMETLSR---------------GIEPFWMNEQDAGLLGIHDNDWI-- ----------------EVLNDHGTVVTRACVSARIPRGICFIYHATERT------------ ----IGNPK-SKHRGMRRAGGHNSLT---RARLKPLFMIGGYAQ---------FTYAFNYW -GPQ-GVNRDTFVVVKKLD-------KPEW------------------------------- ----- ->blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1581374_9 rank: A; deu:DBW_2564 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ---------------------------------MN-WIEEISNPHAR------QW-EEFYR -NRWQH------DRVVRSTHG-VNCTGSCSWMIYVKDGIVTWELQALDYPVLN-----NGL -PPYEPRGCQRGISFSWYQYSPIRVKHPYMRGVLMD---------LWRKAKETH-QDPVEA -WTAVVEDEAARKSFHQARGKGGFRRASWDEVTEIIAASTMYTIKKY----GPDRI-IGFS -PIPAMSMLS------YAGGSRLMQL----------------------------------- ----LGAVSMSFYDWYSDLPPASPETWGEQTDVAESADWFNSKYIVSVGSNMSMTRTPDVH -FAAEARHNGTKLVVFAPDFNQVAKYADWWVPVNAG-QDGAFWMAVNHVIMNEFHY----Q -NPTPYFLDYMKRYTDSPFLVELN-----EVDGKFVPGRMVR---------AGQVERT--K -DVENGEWKFLVWDELSNAPRMPQGSLGFRW--------QQQKGQWNLEPKD--G------ --------LDGSEIRPQLTFL---GATD---------------------EQLSVSF----- ---------------------AEFGEGKSFQRNIPVRTIETA-NGK----VAVATI----- ----YDLLMAQ-YGVGRGL--------EGDYPASYDDENLSYTPAWQERYTGIDRQTVIQF -AREW------ATTAEKTEGKCMIIIGAGVNHWYHNN-LIYRACIGALMLTGCVGRNGG-G ---LNHYVGQEKLAPAA---PWASIAFALDWQKPPRQMNSPSFHYINSDQWRYERTYTEPQ ---PVSRPDSESHRDMTQEHTLDANIRAVRMGWLPS-----YPQFN-VSSLEIIRKAEQAG -AKS------DAEIRQWVVNQLKS---------------GELKFAVQDPDAPE-NWPRLWF -IWRGNALNA---SAKGQEYFFKHYLGTHHQIIS-----EEVDKSHFNEVTYRDEAPEGKF -DLVVDINFRMDTSALYSDIVLPTASW--YEKDDLNSTDMH-SFIHP----L-QMAVPPSW -ESKSDWDIFKILAEKFSELAPTHFPEPVRDLVAMPLQHDTPAEMAQAH-----IRDWAKG -ECEPIPGVTMPNFIVTERDY--VNLGKRFVSLGPKVEKEGFAIHGIHMEVGDLYREL--- --------LKSKPTVTWNGQTYPSLTVARDAANIILNLAPETNGEVAYRAFKAEEER---- ------IGLKLTDLAEPTR----A-VRTDFK-DVVRQPRRLLNSPIWTGIMTDGRPYAAYT -LNVERLVPWRTLT------GRQHFYLDHEGYLAYGEHLPTYKPRPD-------------- ----------PLAFGDLEKSHS-------EGKTIQLNY-------------------LTPH -AKWHIHSNYFDNDRMLTLSR---------------GLEPLWISEKDAKEIGIVDNDWV-- ----------------EAYNDHGVTVTRAIVSARIPSGICILYH----------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->gunnisonriver_2019_sw_WHONDRS-S19S_0062_A_bin.22_Ga0451722_0001801_3 rank: A; htq:FRZ44_42870 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------ILDKLMF--FKAGTE--RFA-DGYGAVTEESR------AW-EDGYR -QRWQY------DKVVRSTHG-VNCTGSCGWQVYVKSGFVTWETQVLDYPLTR-----PDL -PNHEPRGCARGASASWYLYSSNRIKYPLMRRQLMD---------LWREARRRH-KDPVEA -WRSIVETPELARRYKQARGRGGFVRAEWDEANELIVASNTYTIKEY----GPDRV-VGFS -PIPAMSMVS------YSAGSRYLSL----------------------------------- ----LGGVCLSFYDWYCDLPPASPQTWGEQTDVPESADWYNSNFLIVWGSNVPQTRTPDAH -YFAEVRYKGTKTVVVTPDFSEAAKFADLWLDPKQG-TDAAMAMAMGHVILKEFHA----D -NPEPYFRDYCQQYSDLPFLVRL-----VKQGEHYVPERFVR---------ASDFADG-QG -QDNNPEWKTLGFDELTDELVVPNGSIGFRW---------GEDGRWNLEQKD--A------ --------RSGVAAKLRLSLL------EAPSEAPGPKSERSTQVANVAFPYFGGRH----- -----------------HEFFESSPQDEIQVRNVPARTLALK-DGE----YLVATV----- ----FDLMLAH-YGIDRGL---------GGVAASSYDDDVPYTPAWQERITGVSRDKVIAV -ARGF------ADNAAKTRGRSMVIIGTGVNQWFNND-MTYRAVINMLILCGTVGRSGG-G ---WAHYVGQEKLRPQP---GWQTLAFALDWSRPPRLMNGTSFWYAHTDQWRYEKVQASEL -------LSPTREQGDWDVSLIDYNVRSERMGWLPS-----APQLE-KNPLRLGREIHEQK -LDAP-----TAVAHQL-----ET---------------RTLRLSCEDPDNPR-NFPRNLF -VWRSNLLGS---SSKGHEYFLKHLVGAKHGVLG--ADLKELGERLPTEVDFHDEAPEGKL -DLLVTIDFRMSSNCMYSDIVLPTATW--YEKNDLSTTDMH-PFIHP----L-TGAVDPLW -ECKSDWEIFRGFAEKFSEVCEGHLGTE-YDVVLQPLQHDAPGELGQAL----GVVDWKKG -ECRAIPGKTMPNVQLVERDY--PATYKRFVSLGPLVNSLGMSTKGLKWDATEEVELL--- ------KEKNGEVAEAGVGHGRPRIQTDLHACETILALSPETNGRVAVKAWKALEVR---- ------TGRQHAHLAEGRA----A-ERITFD-DVVAQPRKVITSPTWSGAESEKVTYSAGY -INVEEQVPWRTLT------GRQQTYQDHPWMRAFGEHFPSYKPPIDTK--T--VGTLLR- -------------------------SQENGNPQLVLNF-------------------LTPH -QKWGIHSSFTDTQMMLTLSR---------------GGPNIWVSEQDARRLGISDNDWI-- ----------------EAYNSNGALVARAVVSQRIKAGCAFMYHSQD-------------- ---KTVNAP-GTETTGTR-GIHNSIS---RIVVKPTHMIGGYAH---------QSYGFNYY -GTV-GANRDDFVVIRKVR-----------------NLDFMDGTPVRILAPAVSVGGAE-- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001351_7 rank: A; ddz:DSYM_27970 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLKF--FERVQS--TFS-GGHGIVTNEDR------KW-EDAYR -NRWRH------DKIVRSTHG-VNCTGGCSWKIFVKNGLVAFEMQQTDYPRTR-----DDL -PNHEPRGCQRGASFSWYLYSPHRIKHPLVRGRLLD----------LYRAERKSGKDPVEA -WEAIQADPAKRIQYTAVRGLGGFVRTNWDEVTEIAAAANVYTIKKW----GPDRI-YGFS -PIPAMSMLS------YAAGSRYLSL----------------------------------- ----IGGACGSFYDWYCDLPAASPQTWGEQTDVPEAADWYNSTYLIICGANLPMTRTPDAH -FATEVRYKGAKVVSMAPDYAEFVKFADLWMPVKQG-TDSAAFLAMGHVALKEFHV----K -RQDPYFQEYIRKYTDLPMLVMLR-----KTDDGYASDRTLR---------ASDFTGN-LG -ESNNPEWKTIVYDEKTKSYVAPNGSVGFRW---------GEEGKWNLLPKNAANQEEILA -ELTCIDSRDDV----ASVGF----------------------------PHFNAGE----- --------------------------PGLLYRNVPVRKLKLA-SGEDVLVSSV-------- ----YDLQVAQ-YGIDRGL-------GGGNVTDSYEDDKVAYTPAWAEKVTGVKRADLIRT -GREF------AENASKTKGKSMVIMGAAINHWYHND-LSYRAIMNLLHMCGCVGQSGG-G ---WAHYVGQEKLRPQA---GWAPIAFATDWHRPPRHMNSTTFWYFQTDQWRYEKVSADGL -------LADNAKSKYKGYQLADYNVVSQRLGWLPS-----APHFN-KNPIDIVTEAEKAG -ATD------EASIAKHMVEQLKS---------------GKLYFASEDVDAPE-NFVRNLF -VWRSNLLGC---SAKGHEYFLKHLIGAQNGVLQ-----EGVEGRACKEIKWHENGPTAKL -DLMVDINFRLNSTGAYSDIILPTATW--YEKHDLNTTDMH-PFVHP----L-SEAVSPGW -ESKSDWQIFQNIAKAFSKLAEKHLGTK-KDVVALPMQHDSPFELAQAM----GVKDWKKG -ECEPIPGKTLPLLKVVSRDY--PNTLKKFQAIGPLLNKLGNNVKGIDWNTDQELNEL--- ------KSLNGEILEDGISKGMPSIAADIAACDAVLRMAPETNGEVAHKSWSALSKK---- ------TGIDHHHLYAGRH----E-DKITFR-DIQAQPRKIITAPTWSGIESETVSYTAGY -TNIHEHIPFRTLT------GRAQFYQDHEWMLDFGEGFCAFRPGLDMKAIEATPKSVLA- ------------------------------KPHLVLNW-------------------ITPH -SKWGIHSSYQDNLRMLNLFR---------------GGPYFWIAEDDAKSIGLEDNDWV-- ----------------EAVNGNGATVARVVVSQRVPRGMALMYHAQE-------------- ---KIVNVP-GSPTTGKRGGILNSVT---RVVVKPTNMVGGYAQ---------LSYGFNYY -GTV-GTQRDEFVVVHKIE-----DKDVDW-----LERPLTPER--EGKLNPPGVGPR--- ----- ->NASQAN2011_286_B_bin.1_k121_764018_13 rank: A; sdf:ACG33_10925 nitrate reductase alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ---------------MSNLLNR--LNFLKPAAVPFSDGHGATRDDDR------GW-EDAYR -QRWQY------DKIVRSTHG-VNCTGSCSWKVYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRVKYPLMRSALLK---------LWRE--ARKTLAPVDA -WGSIVQDQTKAKSYKSKRGMGGFVRVDWDEANELIAASNLYTTKTF----GPDRV-IGFS -PIPAMSMVS------YAAGARYLSL----------------------------------- ----LGGACLSFYDWYCDLPPASPQVWGEQTDVPESADWYNSRYIIAWGSNVPQTRTPDAH -FFTEARYNGTKTVSITPDYSEVAKLTDHWLHPKQG-TDAALAFAFGHVILREFHL----D -NPSEYFTDYCRQYSDMPMLVRLDP----RDDGSYATSRYLR---------ASDLDGA-LG -EANNPEWKTLAFDENSGGLVVPHGSVGFRW---------GEKGRWNIEERD--------- --------SQGRDTRLVLSLK------D-----------AHDGFVNVCFPYFGGVE----- -----------------HEGWTSSPREDILKRHIPTRKIMQA-DGSEVLVASV-------- ----YDLLLAQ-YGLDRGF--------GGEHVAGSFDDDVPGTPAWQERITGVPRAEVIEI -AREF------ARTADKTRGRSMIIVGAAMNHWYHND-MNYRGLINMLVMCGCIGQTGG-G ---WAHYVGQEKLRPQS---GWAPLAFGTDWVKPPRQMNGTSFFYFNSDQWRYEKLDVSEI -------ISPLADPKKYSGSLVDFNLRAVRMGWLPS-----APQLN-MNPLAFVRDAEAKG -LDPV-----KHAVDQF-----KS---------------GGLDFAYADPDAPE-NFPRNMF -IWRSNLFGS---SGKGHEYMLKHLLGTRHGLQG--KDLGQRGAVKPQDVKWRDEATEGKL -DLVVTLDFRMCTTALYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWDIFKGIARTVSALAPGVLGVE-KDLVLTPVLHDTPNELAMPF----GVTDWKKG -ECEAIPGKTMPSMTVVERDY--PNLYKKFTSLGPLLDKQGNGGKGMSWDTQDEVDFL--- ------TQLNHPVLAEGISKGRPQIESAIDACEVILHLAPETNGHVAVKAWESLGTF---- ------TGRDHTHLAVGKE----H-EAIRFR-DVQAQPRKIISSPIWSGLEDEHVSYNAGY -TNVHELIPWRTLT------GRQQFYMDHEWMLAFGEGFMGYRPPVNTKTIA--P--MLG- -------------------------AKPNGNKEIVLNW-------------------ITPH -QKWGIHSTYSDNLIMQTLSR---------------GGPIVWLSEDDAKRAGIEDNDWI-- ----------------ELFNVNGAIAARAVVSQRVMSGMAMMYHAQE-------------- ---RIINTP-GAEITGTRGGIHNSVT---RVVVKPTHMIGGYAQ---------FSYGFNYY -GTT-GTNRDEFVIVRKMD-------KVEWHDGEPVPNNVEVAR----------------- ----- ->NASQAN2011_286_F_bin.29_scaffold_54_27 rank: A; sdf:ACG33_10925 nitrate reductase alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ---------------MSNLLNR--LNFLKPAAVPFSDGHGATRDDDR------GW-EDAYR -QRWQY------DKIVRSTHG-VNCTGSCSWKVYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRVKYPLMRSALLK---------LWRE--ARKTLAPVDA -WGSIVQDQTKAKSYKSKRGMGGFVRVDWDEANELIAASNLYTTKTF----GPDRV-IGFS -PIPAMSMVS------YAAGARYLSL----------------------------------- ----LGGACLSFYDWYCDLPPASPQVWGEQTDVPESADWYNSRYIIAWGSNVPQTRTPDAH -FFTEARYNGTKTVSITPDYSEVAKLTDHWLHPKQG-TDAALAFAFGHVILREFHL----D -NPSEYFTDYCRQYSDMPMLVRLDP----RDDGSYATSRYLR---------ASDLDGA-LG -EANNPEWKTLAFDENSGGLVVPHGSVGFRW---------GEKGRWNIEERD--------- --------SQGRDTRLVLSLK------D--------AHDGFVNVCF---PYFGGVE----- -----------------HEGWTSSPREDILKRHIPTRKIMQA-DGSEVLVASV-------- ----YDLLLAQ-YGLDRGF--------GGEHVAGSFDDDVPGTPAWQERITGVPRAEVIEI -AREF------ARTADKTRGRSMIIVGAAMNHWYHND-MNYRGLINMLVMCGCIGQTGG-G ---WAHYVGQEKLRPQS---GWAPLAFGTDWVKPPRQMNGTSFFYFNSDQWRYEKLDVSEI -------ISPLADPKKYSGSLVDFNLRAVRMGWLPS-----APQLN-MNPLAFVRDAEAKG -LDPV-----KHAVDQF-----KS---------------GGLDFAYADPDAPE-NFPRNMF -IWRSNLFGS---SGKGHEYMLKHLLGTRHGLQG--KDLGQRGAVKPQDVKWRDEATEGKL -DLVVTLDFRMCTTALYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWDIFKGIARTVSALAPGVLGVE-KDLVLTPVLHDTPNELAMPF----GVTDWKKG -ECEAIPGKTMPSMTVVERDY--PNLYKKFTSLGPLLDKQGNGGKGMSWDTQDEVDFL--- ------TQLNHPVLAEGISKGRPQIESAIDACEVILHLAPETNGHVAVKAWESLGTF---- ------TGRDHTHLAVGKE----H-EAIRFR-DVQAQPRKIISSPIWSGLEDEHVSYNAGY -TNVHELIPWRTLT------GRQQFYMDHEWMLAFGEGFMGYRPPVNTKTIA--P--MLG- -------------------------AKPNGNKEIVLNW-------------------ITPH -QKWGIHSTYSDNLIMQTLSR---------------GGPIVWLSEDDAKRAGIEDNDWI-- ----------------ELFNVNGAIAARAVVSQRVMSGMAMMYHAQE-------------- ---RIINTP-GAEITGTRGGIHNSVT---RVVVKPTHMIGGYAQ---------FSYGFNYY -GTT-GTNRDEFVIVRKMD-------KVEWHDGEPVPNNVEVAR----------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_201_6 rank: A; thes:FHQ07_07000 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSY--------FLDRLNF--FKPAPE--PFA-DGHGAARREDR------SW-EDSYR -RRWQY------DKIVRSTHG-VNCTGSCSWKVYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRVKYPLIRAALLK---------LWREARKS--KSPVEA -WASIVSDPVKAKSYKQKRGMGGFVRSTWDEVNEIIAASNLYTVKEF----GPDRV-VGFS -PIPAMSMVS------YAAGARYLSL----------------------------------- ----LGGGCLSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSRYIIAWGSNVPQTRTPDAH -FFTEARYNGTKTVAITPDYSEVAKLTDHWLHPKQG-TDAALAFAFGHVILREFHV----D -QPSQYFTDYCRQYSDMPMLVRLER----RADGRLVPERYLR---------AADLGGL--G -ETNNPEWKTLAIDDNSGDITVPNGSVGFRW---------GEKGKWNIEEKD--------- --------SAGRETRLRLSLK------D--------HADGVESVSF---PYFGGIE----- -----------------NEYWTESKFSDVLERNVPVKRLNLA-DGKEWVVASV-------- ----YDLLLAQ-YGVDRGL--------GGGNVASSYDDNVPGTPAWQEKITGVPRAEVIQI -AREF------ARTADKTHGRSMVIVGAAMNHWFHND-MNYRGLINMLVMCGCVGQTGG-G ---WAHYVGQEKLRPQS---GWAPIAFGTDWSKPPRQMNGTSFFYFNSSQYRYEKLGVEEI -------LSPLADKSKYSGSLADYNLRAVRMGWLPS-----LPQLN-TNPMKLVREAEAAG -VAPV-----DYAVGKL-----KD---------------GSLDFAFADPDAPE-NYPRNLF -IWRSNLLGS---SGKGHEYMLKHLLGTRHGLQG--KDLGERGAAKPEEIKWRDEAPEGKL -DLLVTLDFRMCTTALYSDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWEIFKGIARTVSQLAPGVLGIE-KDLVLVPTLHDTPNEIAMPY----GVTDWKKG -ECDLIPGKTAPSMVVVERDY--PNLYKKFTSIGPLLDTQGNGGKGMNWDTTHEIEFL--- ------GKLNHEVLEAGVSHGRPQLETAIDCAEAIMHLAPETNGHVAVKAWASLETF---- ------TGREHQHLAVGKE----H-EAIRFR-DIQAQPRKIISSPIWSGLEDENVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHEWMRDFGEGFMQYRPPVDTKTIK--P--IIG- -------------------------KKPNGNREIVLNW-------------------ITPH -QKWGIHSTYSDNLIMQTLSR---------------GGPIVWLSEDDAKSAGIEDNDWI-- ----------------ELFNVNGAIAARAVVSQRMMNGIAMMYHAQE-------------- ---RILNTP-GSEITGTRGGIHNSVT---RVVVKPTHMIGGYAQ---------LAYGFNYY -GTV-GTNRDELVVVRKMN-------KVDW---LDGEPVPATKEAAR-------------- ----- ->NarG_Escherichia_coli_NP_415742 -----------------------------------------------SK------------ ---------------FLDRFRY--FKQKGE--TFA-DGHGQLLNTNR------DW-EDGYR -QRWQH------DKIVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRLKYPMMRKRLMK---------MWREAKALH-SDPVEA -WASIIEDADKAKSFKQARGRGGFVRSSWQEVNELIAASNVYTIKNY----GPDRV-AGFS -PIPAMSMVS------YASGARYLSL----------------------------------- ----IGGTCLSFYDWYCDLPPASPQTWGEQTDVPESADWYNSSYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAVTPDYAEIAKLCDLWLAPKQG-TDAAMALAMGHVMLREFHL----D -NPSQYFTDYVRRYTDMPMLVMLE-----ERDGYYAAGRMLR---------AADLVDA-LG -QENNPEWKTVAFN-TNGEMVAPNGSIGFRW---------GEKGKWNLEQRD--GKT---- --------GEETELQLSLLGS------Q----------DEIAEVGF---PYFGGDG----- -----------------TEHFNKVELENVLLHKLPVKRLQLA-DGSTALVTTVYDL----- -------TLAN-YGLERGL--------NDVNCATSYDDVKAYTPAWAEQITGVSRSQIIRI -AREF------ADNADKTHGRSMIIVGAGLNHWYHLD-MNYRGLINMLIFCGCVGQSGG-G ---WAHYVGQEKLRPQT---GWQPLAFALDWQRPARHMNSTSYFYNHSSQWRYETVTAEEL -------LSPMADKSRYTGHLIDFNVRAERMGWLPS-----APQLG-TNPLTIAGEAEKAG -MNPV-----DYTVKSL-----KE---------------GSIRFAAEQPENGK-NHPRNLF -IWRSNLLGS---SGKGHEFMLKYLLGT-EHGIQGKDLG-QQGGVKPEEVDWQDNGLEGKL -DLVVTLDFRLSSTCLYSDIILPTATW--YEKDDMNTSDMH-PFIHP----L-SAAVDPAW -EAKSDWEIYKAIAKKFSEVCVGHLGKE-TDIVTLPIQHDSAAELAQPL----DVKDWKKG -ECDLIPGKTAPHIMVVERDY--PATYERFTSIGPLMEKIGNGGKGIAWNTQSEMDLL--- -------RKLNYTKAEGPAKGQPMLNTAIDAAEMILTLAPETNGQVAVKAWAALSEF---- ------TGRDHTHLALNKE----D-EKIRFR-DIQAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHELIPWRTLS------GRQQLYQDHQWMRDFGESLLVYRPPIDTRS----VKEVIG- -------------------------QKSNGNQEKALNF-------------------LTPH -QKWGIHSTYSDNLLMLTLGR---------------GGPVVWLSEADAKDLGIADNDWI-- ----------------EVFNSNGALTARAVVSQRVPAGMTMMYHAQE-------------- ---RIVNLP-GSEITQQRGGIHNSVT---RITPKPTHMIGGYAH---------LAYGFNYY -GTV-GSNRDEFVVVRKMK-------NIDW---LDGE---------GNDQVQESVK----- ----- ->NarG_Halomonas_maura_gb_AAT47523 ------------------------------------------------------------- ----MSH--------FIDRLNF--FRKARE--PFA-NDHGEVRDESR------GW-EDGYR -QRWQH------DKVVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRLKHPLVRKPLLK---------LWREALEEK-GDPVDA -WASIVEDPAKTKQYKRARGMGGFVRADWNELNELIAASNVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNSGYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVSVTPDYAEVSKLTDEWLSAKQG-TDAALAMAMGHVILKEFHL----D -RPSAYFTDYVRRYTDMPCLVELEA----REDGSYVPGKQLR---------ASDFEAS-LG -QDNNPEWKTVAWDETRDQLVVPRGSIGFRW---------GEEGKWNLEPRD--------- --------AEGAEIKTRLSLA------E--------AHDDVARVAF---PYFGGIA----- -------------HEHFDHVKSGGASDELLFHSLPAKRLTLA-DGREILAVTVFDL----- -------MCAN-YGIDRGF-RSQEGKEGEDDGATAYDQVKPYTPAWQEKITGVPAEQCLRI -AREF------ADNADKTHGRSMIIVGAGMNHWYHMD-MNYRGLINMLVMCGCIGQSGG-G ---WSHYVGQEKLRPQT---GWLPLAFGLDWQRPPRHMNSTSFFYNHSSQWRYXKLEIKEI -------LSPLAKPADYSGSLIDFNVRSERMGWLPS-----APQLA-TNPLSLAGKAAEAG -QSTA-----DYVVDQL-----KA---------------GGLRFAAEDPDDPQ-NFPRNMF -IWRSNLLGS---SGKGHEYLLKYLLGT-RHGIQGKDLG-EDGGQKPEEVVWHEAAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-TAATDPAW -ESRSDWDIYKGIARAFSKACVGHLGEE-TDLVTLPLQHDSPAELAQPE-----VKDWKRG -ECEPIPGKTMPALVEVKRDY--PATYERFTSVGPLLDSLGNGGKGIGWKTEKEVELL--- -------GKLNYVKTEGPAKGRPRIESAIDAAEVILTLAPETNGQVSVKAWEALSKI---- ------TGRDHRHLAEPKE----E-EKIRFR-DVVAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHELIPWRTVS------GRQQFYQDHAWMRAFGESLLVYRPPIDTKAAV--SL----- ----------ADDKG-------------NGNPEIALNW-------------------ITPH -QKWGIHSTYSDNLLMQTLSR---------------GGPIVWLSKDDARSIGVEDNDWI-- ----------------ELYNANGAIAARAVVSQRVKNGMAMMYHAQE-------------- ---RILNMP-GSEVTGTRGGIHNSVT---RVCPKPTHMIGGYAQ---------LAYSFNYY -GTV-GSNRDEFVIVRKMK-------KIDW---LDGE---------GNDYEQEAVK----- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0001905_7 rank: C; this:HZT40_10960 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLTF--FKQRKT--PFA-QGHGAVTHEKR------DW-EDGYR -QRWQH------DKIVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASFSWYIYSANRLKYPLIRKPLME---------LWRSAKARH-TDPVVA -WESIVENPLSTNDYKTKRGLGGFIRSSWEEVNELIAAANVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGTCMSFYDWYCDLPPASPMIWGEQTDVPESADWYNSSYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAITPDYAEVAKHADQWLNPKQG-TDAALALAFGHVILKEFHL----D -KPSTYFTDYVRRYTDWPNLVLLEK----RDDGSYQAGRFAR---------ASDFVEG-LG -ESNNPDWKTVAIDEATGEIIAPNGSIGYRW---------GENSKWNIQQKHG-------- --------TDQQEVTLALSLI---------------------------------------- ------------------------------------------------------------- ----------------------------------------------------KQHDQIVEL -CLPY--------------------FGGVPSDYFKGN------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------VLKDVL----- ----------------------------RYQLPARQVTLAD-------------------- ------------------------------------------------------------- ----------------GTTGL---------------------------------------- --------------------------------LVTVYDLNMAN------------------ -----------------------Y------------------------------------- --------------------GISRGLGADDSAQDFNDA---------TAPYT--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------------PAWQEAI------------------------- ------------------------------------------------------------- ----- ->king_2019_sw_WHONDRS-S19S_0016_B_bin.5_k121_1281127_1 rank: A; gpb:HDN1F_13240 narG; Nitrate reductase, alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLQF--FNKVKS--TFA-DGHGAVVNEDR------GW-ENAYR -SRWQY------DNIVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCQRGASYSWYLYSANRLKYPMMRKPLLE---------LWRE--ARKSLSPVDA -WESIVENPVKSKAYKTKRGLGGFIRVDWEEANELVAAANIYTAKKY----GPDRI-NGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGTCLSFYDWYCDLPPSSPQTWGEQTDVPESADWYNSTFLMLWGSNVPQTRTPDAH -FYTEVRYKGAKSVVITPDYSEAAKFADLWLAPKQG-TDAALAMAFGHVVLKELHL----D -NPSEYFTEYCRKTTDMPHLVMLKT-----RGNAFVADRFLR---------ASDLSDN-LQ -QSNNPEWKTLVINENTNEMVVPNGSIGFRW---------GEDGKWNIQATDS-------- --------ADGSDIKARLSLI------E-----------NADQVVSVEFPYFGNLN----- -----------------HPHFTHTEHAEILERNVPARRIQLA-DGSDAYVVTVFDL----- -------LVAN-YGIDRGL--------GGENVAKSFDDDQPYTPAWQERITGVKREHVITV -ARQF------AENAHKTHGKSMVILGAGLNHWYHMD-MNYRGIINLLMMCGCIGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWHRPPRHMNGTSFFYNHTSQWRHEKLDVREI -------LSPLADKTAWSGSLLDYNVRAERMGWLPS-----APQLN-VNPLELTKAAAAAG -QSPV-----DYAVENL-----KS---------------GKLAFACEDPDNPV-NFPRNLF -VWRSNLLGS---SGKGHEYFLKYLLGTTHGVQG--KDLGEMGAPKPEEVVWHEQGAEGKL -DLLVTLDFRMSTTCMYSDVVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -ESRSDWDIYKGIARKFSELSVGHLGVE-KDLVLVPTLHDTPSELGQAV----GVKDWKKG -ECEPIPNKTLPNMVVVERDY--PNTYKKFTALGPLLDKLGNGGKGISWNTQSEVEQL--- ------RDLNYRVTEEGVSKGLPRIESDIDACEVVLMLAPETNGQVAMKAWAALSKI---- ------TGRDHTHLALPRE----D-DKIRYR-DVQAQPRKIISSPTWSGLESEHVSYNAGY -TNVHEMIPWRTLT------GRQQFYQDHLWMLGFGESLCVYKPPIDTKTIA--P--LLN- -------------------------QRSNGNGEVVLNF-------------------ITPH -QKWGIHSTYTDNLLMLTLSR---------------GGPCVWMSETDAKKVGIEDNDWI-- ----------------EAFNLNGALVARAVVSQRVPEGMVMMYHAQE-------------- ---KIVNVP-ASEITKTRGGIHNSVT---RTCPKPTHMIGAYAQ---------QSYGFNYY -GTV-GSNRDEFVIVRKLS-------KVDW---LDTPVAQA-------------------- ----- ->NarG_Pseudomonas_fluorescens_gb_AEV63780 ------------------------------------------------------------- ----MSH--------LLDQLRF--FNRKQG--EFS-DGHGETRKESR------DW-ENVYR -SRWQY------DKIVRSTHG-VNCTGSCSWKIYVKNGLITWETQQTDYPRTR-----NDL -PNHEPRGCPRGASYSWYIYSANRLKYPKIRKPLLK---------LWRE--ARQTLPPVEA -WASIVEDKAKADSYKSKRGMGGFIRSNWEEVNEIIAAANVYTVKEH----GPDRV-VGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPASPMVWGEQTDVPESADWYNSNYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAITPDYSEVAKLTDLWLNPKQG-TDAALAQAFNHVIFKEFHL----D -KPSAYFTEYAKRYTDLPVLVMLKPMLGAAPGAGYQPDRFLR---------ASDLTDN-LG -QDNNPEWKTIALD-AAGELVSPQGSIGYRW---------GEKGKWNILPREG-------- --------GEGREIDLKLSLI-------------------GGDVAEVAFPYFAGEA----- -----------------QEYFQHVAGDAVQFRRVPVHSVVLA-DGSVAKVATVFDL----- -------SAAN-LAIDRGL-------GGANVAKDYNDASVPGTPAWQEQITGVSREKAIQI -AREF------ADNADKTRGRSMIIVGAAMNHWYHMD-MNYRGLINMLMLCGCVGQTGG-G ---WAHYVGQEKLRPQC---GWLPLAFGLDWNRPPRQMNGTSFFYGHSSQWRHEKMSMHDV -------LSPLADKSQFPEHALDYNIRAERAGWLPS-----APQLN-TNPLHICRDAAAAG -MEPK-----DYVVKSL-----QD---------------GSLRFACEQPDSPV-NFPRNMF -IWRSNLLGS---SGKGHEYMLKYLLGTKNGVMN--EDIGHSTECKPTEAEWVDEGAIGKL -DLVTTLDFRMSSTCVYSDIVLPTATW--YEKDDMNTSDMH-PFIHP----L-SAAIDPAW -ESRSDWEIYKGIAKAFSAMSVGHLGVE-KDLVTVPLMHDSVGELAQPF----GGTDWKSA -GVAPVPGKNAPNLQVVERDY--PNIYKQFTSLGPMLEKLGNGGKGINWNTDTEVKFL--- ------GELNHKEVEAGISQGRPKIDSAIDAAEVILSLAPETNGHVAVKAWAALSEF---- ------TGIDHSHLAISKE----H-EAIRFR-DIQAQPRKIISSPTWSGLEDDHVSYNAGY -TNVHESIPWRTIT------GRQQFYQDHPWMQAFGEQLMSYRPPVNTRTIA----GVKG- -------------------------KRSNGETEIVLNW-------------------ITPH -QKWGIHSTYSDNLLMLTLSR---------------GGPIVWLSEIDAKRAGIEDNDWI-- ----------------ECFNVNGALTARAVVSQRVKEGMVMMYHAQE-------------- ---RIVNVP-GSETTKTRGGHHNSVT---RVVLKPTHMIGGYAQ---------QAYGFNYY -GTV-GCNRDEFVVVRKMV-------KVDW---LDGSSGDDLPRPLPTDIEEN-------- ----- ->NarG_Pseudomonas_stutzeri_gb_AAZ43099 ------------------------------------------------------------- ----MSH--------LLDQLRF--FNRKQG--EFA-DGHGETRIESR------DW-ENVYR -SRWQY------DKIVRSTHG-VNCTGSCSWKIYVKNGLITWETQQTDYPRTR-----NDL -PNHEPRGCPRGASYSWYIYSANRLKYPKVRKPLLK---------LWREARRN--MTPVDA -WASIVEDKAKAESYKSKRGMGGFIRSSWDEVNEIIAAANVYTVKQY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPASPQIWGEQTDVPESADWYNSNYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAITPDYAEVAKLTDLWLNPKQG-TDAALAQAFAHVIFKEFHL----E -KPSEYFRDYAKRYTDLPVLVRLN-----EKDGSYIADRFLR---------ASDLADN-LG -QENNPEWKTIAVDGSTGELVSPLGSIGYRW---------GEKGKWNIEARE--G------ --------KDGRDVDLSLTQI------E---------GGETAEVAF---PYFGGIL----- -----------------HEHFQHAEGESIQLRRVPVRTITLA-DGSTTKVATVFDL----- -------MAAN-LGIDRGL-------GGGNVASSYDDASVPGTPAWQEVITGVSREKAIQI -AREF------ADNADKTHGRSMIIVGAAMNHWYHMD-MNYRGLINMLMLCGCVGQTGG-G ---WAHYVGQEKLRPQC---GWLPLAFGLDWSRPPRQMNGTSFFYNHSSQWRHEKMSIHEV -------LSPLADKSQFPEHMLDYNIRAERAGWLPS-----APQLN-RNPLQICRDAEAAG -MSPV-----DYVTQSL-----KD---------------GSLKFACEQPDNPD-NFPRNMF -VWRSNLLGS---SGKGHEYMLKYLLGTKNGVMN-EDLGKRADGFKPTEAEWQDEGAIGKL -DLVTTLDFRMSSTCVYSDIVLPTATW--YEKDDMNTSDMH-PFIHP----L-SAAIDPAW -EAKSDWEIYKGIAKAFSKMAEGQLGVE-KDLVTVPLLHDSPGELAQPF----GGTDWKTA -GVDPQPGKNCPNMAVVERDY--PATYKKFTSLGPLLDKLGNGGKGINWNTQDEVDFL--- ------GELNYKVRDEGVSQGRPQIESAIDAAEVILSLAPETNGHVAVKAWAALSEF---- ------TGRDHSHLALPKE----H-EAIRFR-DIQAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHEYIPWRTIT------GRQQFFQDHPWMQAFGEQLMSYRPPINTR------------ -TIDYVK-------GKKSNGNP----------EIVLNW-------------------ITPH -QKWGIHSTYSDNLIMLTLSR---------------GGPIVWMSEVDAKKAGIEDNDWI-- ----------------ECFNANGALTARAVVSQRVMEGMVMMYHAQE-------------- ---RIVNVP-GAESTKTRGGHHNSVT---RVVLKPTHMIGGYAQ---------QAYGFNYY -GTV-GCNRDEFVVVRKMA-------KVDW---LDGPNGNDLPQPLPQDI----------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_1186915_16 rank: A; ocm:CBP12_03810 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------ETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYIYSANRVKYPKVRKALLK---------LWRE--ARKNLKPVEA -WASIVEDPVKAQSYKSKRGLGGFVRSSWDEVQELIAAANVYTTKTY----GPDRV-VGFS -PIPAMSMIS------YASGARYLSL----------------------------------- ----MGGACLSFYDWYCDLPPSSPMVWGEQTDVPESADWYNSNYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAITPDYSEVAKLTDLWLNPKQG-TDAALAQAFNHVIFKEFHL----E -KPSEYFTDYVRRTTDFPMLVLLD-----EHGEGYKTGRFLR---------ASDLTGQ-LG -QDNNPEWKTIALDELSGELVSPLGAIGYRW---------GEKGKWNIEAREG-------- --------SKGADTKLKLSLI------D------------EGQVAEVAFPYFGGDL----- -----------------HDHFQHVEGDNLQYRRIPVREVQLA-DGRSAKVATVFDI----- --------TAGGLAIDRGL-------GGKNVASSYDDASIPGTPAWQEQITGVTREKAIQI -AREF------ADNADKTKGRSMIIVGAAMNHWYHMD-MNYRGLINMLMMCGCVGQTGG-G ---WAHYVGQEKLRPQT---GWTPVAFGLDWHRPPRHMNGTSFFYNHSSQWRYEKMNMHDI -------LSPTANKAEFPEHALDYNIRAERAGWLPS-----APQLN-RNPLQICRDAKAAG -LSPK-----DYAVKAL-----QE---------------GSLRFSCEQPDNPV-NFPRNMF -VWRSNLLGS---SGKGHEYMLKHLLGAEKHGVI---GDETAAGFTPKDVDFSQEGARGKL -DLVTTLDFRMSSTCVYSDIVLPTATW--YEKDDMNTSDMH-PFIHP----L-SAAIDPAW -EARSDWEIFKGIAKKFSELSVGHLGVE-QDLVTIPMQHDSVGELAQPF----GGLDWKTT -GEPLVPGKNAPNMVVVERDY--PNTYKKFTSLGPLLNTQGNGGKGISWNTDDEVEFL--- ------GDLNHRVLDEGVSEGRPQMLSAIDAAECVLSLAPETNGHVAVKAWAALSEF---- ------TGRDHSHLAVGKE----H-ESIRFR-DIQAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHELIPWRTIT------GRQQFYQDHPWMQAFGEQLMSYRPPVSTRSIE----KVQG- -------------------------KMSNGNPEIALNW-------------------ITPH -QKWGIHSTYTDNLLMLTLSR---------------GGPIVWMSEVDAQKVGIEDNDWV-- ----------------ECFNANGALTARAVVSQRVKEGMIMMYHAQE-------------- ---RIVNVP-GAESTKTRGGHHNSVT---RVVLKPTHMIGGYAQ---------QAYGFNYY -GTV-GCNRDEFVVVRKMN-------KVDW--LEGSDTDDLPQPLPQNI------------ ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_2341297_11 rank: C; pbm:CL52_03700 narZ; nitrate reductase; K00370 (db=kegg) ------------------------------------------------------------- ----MSR--------LLDQLRF--FKRKQD--EFA-DGHGETRIENR------EW-ENGYR -ARWQY------DKIVRSTHG-VNCTGSCSWKIYVKNGLITWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYIYSANRLKYPKVRKPLLK---------LWRE------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0000931_1 rank: A; reu:Reut_B5002 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLRF--LSRTKE--TFS-DGHGAVVDEDR------SW-ENAYR -GRWQH------DKIVRSTHG-VNCTGSCSWKVYVKNGLITWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYVYSAQRVKYPLVRGRLME---------MWRE--ARQTMSPTDA -WESISQDPVKAKRYKSVRGQGGFVRASWDDVSEIIAAANAFTIKEF----GPDRV-LGFS -PIPAMSMVS------YAAGARYLSL----------------------------------- ----IGGACLSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSTYLMVWGSNVPQTRTPDAH -FYTEVRYKGTKTVAVSSDFGEMVKFGDIWLAPKQG-TDAALAMAMGHVILKEWHT----S -AQSDYFTRYVKQYTDLPMLVILK----LGKSGQLVPDYFLR---------ASHLSLA--E -QANNPEWKTLLIDCASGELIAPNGSIGFRW-----GESGDKVGRWNLELKDGGSARAIDP -CLS----LIDSHDDIVEVGF----------------------------DYYGGKD----- -------------------------ADDVLLRRVPAKRVKLA-DGSEALVTTVFDL----- -------TMAN-YGVDRGL--------GGGNVAMSYDDDVPYTPAWQERHTGVKRNLVIQV -AREF------AQNAHDTQGKSMVIVGAALNHWYHND-MIYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTPLAFAGDWVRPPRHMNGTSFFYNHTSQWRHEKLALDEI ------LAPTADAGPYSKLALLDLNAKAERLGWLPS-----APQLE-TNPLDIVDAADSKN -MDPV-----KYAVEEI-----KA---------------GRLNFSCDEPENPK-NFPRNLF -VWRSNILGS---SGKGHEYFLKYLLGTQNALFG------DERDGIKPGEVKAGEAVEGKL -DLLTVLDFRMSTTCLYGDIVLPSATW--YEKDDLNTSDMH-PFIHP----L-SEAVQPLW -QSKSDWEIYKTIAKKFSEIAGPYLGTR-KDLVLTPLLHDTPGELGQPF----EPKDWKHG -ECEPIPGKTMPQMTVVERNY--GDVYKKFTSIGPLLEKSGNGGKGIGWNTEHEVKEL--- ------AALNKLVTEPGVSQGRPKLETAIDAAEMILTLAPETNGHVAVKAWDALGKI---- ------TGRDHKHLAEGRD----H-DKIRFR-DVQAQPRKIISSPTWSGLESEEVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHRWMLDFGEGLCIYKPAINTRTIE--P--MLG- -------------------------KHANGNAELVLNW-------------------ITPH -QKWGIHSTYTDNLRMLTLSR---------------GGPHVWVSEIE-------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0004490_1 rank: C; cuh:BJN34_33750 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------K--------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------HAN------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------------GNEELVLN-------------- ------------------------------------------------------------- ---------------------------------------------------W--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------------------------------ITPH -QKWGIHSTYTDNLRMLTLSR---------------GGPHVWVSEIEAKQAGIRDNDWV-- ----------------EVFNVNGTLTARVVVSQRVPVGMCLMYHAQE-------------- ---KIVNVP-GAETSGMRGGIHNSVT---RTVTKPTHMIGGYAQ---------LAYGFNYY -GTV-GSNRDEYVIVRKMK-------KVDW---LEGALKEEGEQA---------------- ----- ->littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_6 rank: A; aql:BXU06_02425 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- -------------------------MAACR------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------DWYCDLPPASPQIWGEQTDVAESADWYNSNYLMVWGSNIPMTRTPDAH -FYTEVRYKGTKTVAVSSDFGEMAKFGDIWLAPKQG-TDAALAMAMGHVIFKEFHL----D -RPSDYFTGYIRQYTDMPMLVMLKQ----DAAGRYLPDYFLR---------ASHLAGN-AD -QAHNPEWKTLVLDETSGNLAVPNGSAGFRW---------DQSGKWNLEEKA--G------ --------INSQPVKAQLSLI------A--------QSDEVVEVGF---PYFGAEH----- --------------------------DELITRRVPVRHIVLA-DGSTARVATVFDL----- -------MAAN-YGIDRGL--------GGGNVACSYLDDVPYTPAWQHKHTGVKPEMVIQV -AREF------AQNADQTHGRSMVIVGAALNHWYHMD-MTYRGIINMLMLCGCIGQSGG-G ---WCHYVGQEKLRPQT---GWAPLAFAGDWNRPARQMNGTSFFYAHTSQWRHEKLGVNEI -------LSPTADGKMANMALIDYNAKAERMGWLPS-----APQLT-TNPLDVTRHAAAAG -QDPI-----TYAVEQL-----KS---------------GQLDMACNDPDNPK-NFPRNLF -VWRSNILGS---SGKGHEYFLKYLLGTQNAVMN-----SEEGCVKPSEITVRPAA-EGKL -DLLVVLDFRMSTTCLYGDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-SEAVQPLW -QAKSDWEIYKGFAKAISEVGGEYLGVQ-QDLVLTPLMHDTPEELGQPF----DPRDWKKG -ECEPIPGKTMPKMTVVERDY--RKIHDKFTSIGPLLEKVGNGGKGIGWQTGHEVDVL--- -------RGLNKTVASGVAAGQPRLDTAIDAAEMILTLAPETNGHVAVKAWAALSKI---- ------TGRDHTHLALPRE----H-DSIRFR-DVQAQPRKIISSPTWSGLESEEVSYNAGY -TNVHEYIPWRTLT------GRQQFYQDHLWMRAFGEGLCLYKPHVDLK--T--TAAILG- -------------------------KKPNGHHEIVLNW-------------------ITPH -QKWGIHSTYSDNLRMLTLSR---------------GGPHVWVSEIDAKKAGIVDNDWI-- ----------------EVFNVNGTLTARAVVSQRVPEGMSLMYHAQE-------------- ---KIINVP-GAETSGKRGGIHNSVT---RTVVKPTHMIGGYVQ---------LAWGFNYY -GTV-GSNRDEFVIVRKMK-------NVDW---LDQPLSEHA------------------- ----- ->littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_7 rank: C; aql:BXU06_02425 nitrate reductase subunit alpha; K00370 (db=kegg) -MEYARLVTHLAESENSRACFFLAPLLSNYPTLPPLPPPRSPSDQWAVCLRLLTIGGIGTG -LSGPANPLEARMSHFLDRLNF--LGKVKS--TFS-DGHGAVVKEDR------KW-EDGYR -QRWQH------DKIVRSTHG-VNCTGSCSWKVYVKNGLITWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYVYSAQRVKYPMVRGVLMQ---------HWRE--LRKKLGPIEA -WQRISQTPEIATQYKTQRGQGGFVRASWDEVNEIIAASNAFTIKNY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------I---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------G ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----GVPRLVL------------------------------------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.15_k121_1272084_2 rank: A; chrm:FYK34_01610 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLKF--MSKVKA--TFS-NGHGAVVKEDR------QW-EDAYR -QRWQH------DKIVRSTHG-VNCTGSCSWKVYVKNGLITWETQQTDYPRTR-----ADL -PNHEPRGCPRGASYSWYVYSAQRVKYPMVRGKLMQ---------MWREARKS--MGAIDA -WESISQNPEKAKEYKSRRGQGGFVRASWDEVNEMVAAANAYTIKNY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVPLSFYDWYCDLPPASPQIWGEQTDVAESADWYNSTYLMVWGSNVPMTRTPDAH -FYTEVRYKGTKTVAVSSDFGEMAKFGDIWLAPKQG-TDAALAMAMGHVIFKEFHL----D -KQSSYFTDYIRRLTDMPMLVRLK-----EEGGRYLPEYFLR---------ASHLEGG-LG -EDNNPDWKTLLIDENTGDIVAPNGSIGFRW-----GQPEGKTGKWNLEHRDGAT------ --------AREIQGQLTLLGQ------Q----------DEVVGVGF---PYFGAEH----- --------------------------DELLTRNVPAKRITLA-DGSTALVATVFDL----- --------MAANYGIDRGL--------GGGNVASSYMDDVPYTPAWQQKHTGVKPEMVIQV -AREF------AQNADQTQGKSMVIVGAALNHWYHMD-MTYRGIINMLMLCGCIGQSGG-G ---WAHYVGQEKLRPQS---GWAPLAFGADWNRPARQMNGTSFFYAHTSQWRHEKLGVNEI -------LCPTADGSMANMSLIDYNAKAERMGWLPS-----APQLS-TNPLDITRQAEAAG -QDPV-----AYTVQGL-----KD---------------GTLDMSCNDPDNPK-NFPRNLF -VWRSNILGS---SGKGHEYFLKYLLGTQNALMS-----DEANCITPTEITVRPAA-EGKL -DLLVVLDFRMSTTCLYGDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-SEAVQPLW -QSKTDWEIYKGFAKAISEVGGDYLGVQ-KDLVLTPLMHDTPQELGQAF----DPRDWKKG -ECEPIPGKTMPAMTVVERDY--KAIYQKFTSIGPLMEKAGNGGKGMAWKTGHEIEKL--- -------RAMNKVVQDGVAKGQPRLDTAIDAAEMILTLAPETNGHVAVKAWESLSKI---- ------TGRDHTHLAIPRE----H-DHITFR-DIQAQPRKIISSPIWSGLESEEVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHQWMRAFGEGLCLYKPPVDLKT----------- -TAAVHR------------------HKPNGNTEILLNF-------------------LTPH -QKWGIHSTYSDNLRMLTLSR---------------GGPHVWISEKDAQEAGIVDNDWI-- ----------------EVFNVNGTLTARAVVSQRIPKGMTLMYHAQE-------------- ---KIVNVP-GAEMSGKRGGIHNSVT---RAVTKPTHMIGGYAQ---------YSYGFNYY -GTV-GANRDEFVVVRKMK-------NVDW---MDQPK----------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_3271_6 rank: C; fpho:SHINM1_007130 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------T -ASHQAMMNSRS-----------------------------------------------NG -NPEIA------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------------LN------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------F------------------------------------- ------------------------------------------------------------- ---------------------------------------------------------ITPH -QKWGIHSTYTDNLIMLTLSR---------------GGPCVWVSEVDATKIGLVDNDWV-- ----------------EAFNANGALCARVIVSQRVPEGMMMMYHAQE-------------- ---KIVNVP-GSEIMNTRGGIHNSVT---RAVVKPTHMIGGYAQ---------LSYGFNYY -GTV-GSNRDEFVILRKMN-------KVDWMDDEASPAGENS------------------- ----- ->nebranchanacostia_2019_sw_WHONDRS-S19S_0081_B_bin.6_k121_1546998_5 rank: A; fpho:SHINM1_007130 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FIDRLKF--LSADKE--HFS-DGHGQTTTENR------AW-EDAYR -KRWQH------DKIVRSTHG-TNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDM -PNHEPRGCARGASYSWYLYSANRVKHPMVRSSLLK---------AWRK--HRQTLSPVAA -WEAVVSDPKTVRRYQSERGKGGFLRTSWDEVNDMVAAANIYTAKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQTWGEQTDVPESADWYNSTYIMMWGSNVPQTRTPDAH -FMAEVRYKGAKVVSVFPDYSEGAKFGDMWLHPKQG-TDAALAMAMGHVILKEFHV----A -GKSEYFDNYCRQYTDMPNLVCL-----VEKDGAYVPDRYVR---------AADLVGA-LG -EANNPDWKTLVIDEASDALTVPVGSIGFRWGQEKDGAPTADKGKWNLKEET--------- --------SDGRQIKPRLSLV------K--------HHDAVVEAAF---PYFGNIA----- -----------------HEHFNSTSHSDVLKRRVPVRKIQTA-QGE----MLVATV----- ----YDLYVAN-YGVDQGL--------GGDNVASSYDDDIPYTPAWQEKITGVPRDQVTQV -AREF------AQNAHDTHGKSMVIIGAAMNHWYHMD-MNYRSIMNMLIMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWNRPPRHMNSTSFFYAHTDQWRYETLRVADL -------LSPLADKGKFSGSLIDFNARSERMGWLPS-----APQLE-RNPLELSREAIAKG -LDPK-----EYVVNQL-----KS---------------GELKFSCEDPDNPK-NFPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTTNGVQG--KDLGHTGEVKPQDVVWHDEAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWEIYKGFAKRFSELS---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------DGYLGVEKDIVAVPIL--HDTAGE- ------------------------------------------------------------- -----IAQPYDTKDWKK-------------------GECEA-IPGKTMPNFVVVERNYSEI -H--------------EKFTSLGPLLDK--------------------------------- -------------------------------------------------------LGNGGK -GIN-------------------------W---NT-------------------------- ----- ->lecontecreek_2019_sw_WHONDRS-S19S_0018_A_bin.2_Ga0451754_0000231_3 rank: A; fpho:SHINM1_007130 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FIDRLKF--LSADKE--HFS-DGHGQTTTENR------SW-EDAYR -KRWQH------DKIVRSTHG-TNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDM -PNHEPRGCARGASYSWYLYSANRVKHPMVRSSLLK---------AWRK--QRQTLSPVAA -WEAVVSDPKTVRRYQSERGKGGFLRTSWDEVNDMVAAANIYTAKKH----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPASPQTWGEQTDVPESADWYNSSYIMMWGSNVPQTRTPDAH -FMAEVRYKGAKVVSVFPDYSEGAKFGDMWLHPKQG-TDAALAMAMGHVILKEFHV----A -GKSEYFDNYCRQYTDMPNLVCM-----VEKDGAYVPDRYVR---------AADLIGA-LG -EANNPDWKTLVIDEESDALTVPVGSIGFRWGQDKDGAPTADKGKWNLKEET--------- --------TDGRKIKPRLSLV------Q--------KHDAVVEAAF---PYFGNIE----- -----------------HEHFNNTSHSDVLKRRVPVRKIQTA-QGE----MLVATV----- ----YDLYVAN-YGVDQGL--------GGDNVAGSFDDDVPYTPAWQEKITGVPRDQVTQV -AREF------AQNAHDTHGKSMVIIGAAMNHWYHMD-MNYRSIMNMLIMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWSRPPRHMNGTSFFYAHTDQWRYETLRVADL -------LSPLADKNKFSGSLIDFNARSERMGWLPS-----APQLE-RNPLDLTREAIAKG -VDPK-----EYVVNQL-----KS---------------GELKFSCDDPDNPK-NFPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTTNGVQG--KDLGQTGDVKPQEVVWRDEAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWEIYKGFAKRYSELSDGYLGVE-KDLVAVPILHDTAGEMAQPY----DAKDWKKG -ECEAIPGKTMPNFVVVERNY--SEIYEKFTSLGPLLDKLGNGGKGINWNTDHEIKLL--- ------GELNYKVRNEGVAHGRPNIDTDIDATEVVLTLAPETNGEVAVKAWAALSEF---- ------TGIDHRHLALTRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESEHVSYNAGY -TNVHELIPWRTLT------GRQQLYQDHEWMRAFGEGFCSYKPPVDLRSHQ--Q--VMN- -------------------------AKPNGNKEIALNF-------------------ITPH -QKWGIHSTYTDNLIMLTLSR---------------GGPIVWLSEVDAQKVGIEDNDWI-- ----------------EAFNSNGALCARAVVSQRVPEGMVMMYHAQE-------------- ---KIVNVP-GSEITQTRGGIHNSVT---RAVLKPTHMIGGYAQ---------LSYGFNYY -GTV-GSNRDEFVVVRKMN-------KVDW---MDGPAQPAMEA----------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_493_9 rank: A; fpho:SHINM1_007130 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FIDRLKF----FVTPTEGFA-DKHGATVDEDR------TW-EDGYR -KRWQH------DKIVRSTHG-TNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDM -PNHEPRGCQRGASYSWYLYSANRVKYPMVRSPLLK---------LWRE--KRKMLAPVDA -WKAITDDHNAVRSYQSQRGLGGFLRTTWDEVNEMIAAANVHTIKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCTSFYDWYCDLPPSSPQMWGEQTDVPESADWYNSTYIMMWGSNVPQTRTPDAH -FMTEVRYRGTKVVSVFPDYAEGSKFGDLWLHPKQG-TDAALALAMGHVIVNEFHV----K -NKSDYFDQYCRQYTDMPNLVKL-----VKQGDYYVPDRLVR---------CSDFTDN-LG -QDNNPDWKTVVIDENTNMLTVPVGSIGFRW----GQKEGEDLGKWNLQEKN--------- --------AAGADIRPRLSLI-----------------GGHDGVVLVASPYFGNQQ----- -----------------HDHFQHTDHANILPHNIAVRKLQSR-DGE----ILVASV----- ----YDLFVAN-YGVDQGL--------GGPNVASSYDDDIPYTPAWQEKITGVKRHLVIQV -AREF------ADNADKTHGKSMVIVGASLNHWYHMD-MNYRSVINMLVMCGCIGQSGG-G ---WAHYVGQEKLRPQI---GWAALAFATDWHRPPRQMNGTSFFYAHTDQWRYETLSVKKI -------LSPLADPKKFSGSLIDFNVRSERMGWLPS-----APQLQ-TNPLQVCRDAQKAG -MSAK-----EYAVAQL-----KS---------------GKLRFSCEDTDHPD-NYPRNMF -IWRSNLLGS---SGKGHEYFLKHLLGTTHGVQG--KDLGQSGGQKPEEVVWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----F-SAAVDPAW -MARSDWEIYKGIAKKFSELTEGHLGVE-QDLVTVPIMHDTPDELGQAF----EPKDWKRG -ECEAVPGKTMPNFVLVERDY--PNTYKKFTALGPLMDKLGNGGKGINWNTQHEVKHL--- ------GELNYLVSEEGVTKGRPKIETDIDATEVILMLAPETNGEVAVKAWDALSKF---- ------TGIDHTHLAKTRE----D-EKIRYR-DIQAQPRKIISAPTWSGIESEHVSYNAGY -TNVHELIPWRTIT------GRQQLYQDHHWMRAFGEALCVYKPPIDTASHQ----AMMN- -------------------------SRSNGNPEIALNF-------------------ITPH -QKWGIHS----------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->logan1_2019_sw_WHONDRS-S19S_0097_B_bin.20_k121_1372227_2 rank: A; aep:AMC99_00129 Respiratory nitrate reductase alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------F-GNLEH -DHFQG----------------------------------------TDHPSVLK----RRV -PVREVQL-KDGKAFVATVFDLFCANYGL-------------------------------- -----------------DRGLGG-----------------EHVARDY-------------- ------------------------------------------------------------- ----------------GAMEPYTPAWA---------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------E--------------------------------- ------------------------------------------------------------- ------------------------------------------------KITGVPADQIITI -AREF------ASNAEVTKGKSMVILGAGLNHWYHMD-MNYRGIINLLVMCGCVGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWNRPPRHMNSTSFFYAHTDQWRYETLGVEEI -------LSPTAPEGDWDASLIDYNARAERMGWLPS-----APQLK-TNPLEVGKAIKASG -KDAK-----DYVAEAL-----QS---------------GALEMSCFDPDDPA-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTAHGVQG--KDLGETGAQKPKEVKWHEEAPKGKL -DLLVTLDFRMSTTCVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-SAAVDPVW -ESRSDWDIYKGIAKKFSEIAPEVLGVE-HDVVLTPIQHDSPNEIAQAY----DVADWGHG -QVEAIPGKTMANVALVERNY--AELYQKFTALGPLMEKLGNGGKGIGWNTDHEVEGL--- ------RKLNGTVAADGPAKGMAQIETAIDAAEVILMLAPETNGEVAVKAWADLGKK---- ------TGLDHTHLALPKE----D-EKIRFR-DIQAQPRKIISSPTWSGIESEHVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHKWMRAFGEGLCVYRPPIDTKAVK--PML---- -------------------------DEAKDAPHVILNF-------------------ITPH -QKWGIHSTYTDNLLMLTLSR---------------GGPIVWMSEVDAAKAGLVDNDWV-- ----------------ETFNSNGALVARVVVSQRMKEGTLFMYHAQE-------------- ---KITNVP-GSPLTGQRGGIHNSVT---RAVLKPTHMIGGYVQ---------LAYGFNYY -GTV-GSNRDEYVIVRKLS-------KVDW---LEGALS-------EGETAA--------- ----- ->lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.6_k121_1211148_1 rank: A; emv:HQR01_12825 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLTF--FRHKKE--QFS-DGHGVTTAEAR------DW-EDSYR -KRWQH------DKIVRSTHG-VNCTGSCSWKIYVKGGIITWETQQTDYPRTR-----PEL -PNHEPRGCPRGASYSWYIYSAQRLKYPLIRKRLIK---------LWRA--ARKDLPPVAA -WASIQADPVKRKSYTAIRGHGGFVRSTWDEVNEIIAAANAYTAKKW----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNSGFLMLWGSNVPQTRTPDAH -FMTEARYRGAKVAVVSPDYAEATKFADLWLNPKQG-TDAALAMAMGHVILREFHL----D -RQVPYFEDYCRRYSDMPMLVRL-----IEQDGRLVPERLLR---------ASDFKGD-LG -EKNHPEWKSVAIDEARDEVVAPTGSAGFRW---------GDKGKWNLEEKD--------- --------GKGAEVKLRMTAI---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------LDKDH---------------------------------------- ------------------------------------------------------------- -----------------------------------DEVVEVA------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_F_bin.6_scaffold_35_30 rank: A; aep:AMC99_00129 Respiratory nitrate reductase alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLTF--FRQKKE--PFS-EGHGVTTAEAR------DW-EDGYR -QRWQH------DKVVRSTHG-VNCTGSCSWKIYVKGGIITWETQQTDYPRTR-----PEL -PNHEPRGCPRGASYSWYIYSAQRLKYPLIRKRLVK---------LWRA--ARKDLPPVAA -WASIQADPVKRKSYTAIRGHGGFVRSTWDEVNEIIAAANAYTAKNY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNSGFLMLWGSNVPQTRTPDAH -FMTEARYRGAKVAVVSPDYAEATKFADLWLNPKQG-TDAALALAMGHVILREFHL----D -RQVPYFEDYCRKYSDMPMLVRL-----VEQDGRLVPERLLR---------ASDFAGG-LG -ETNNPEWKCVAIDETSDEVVAPSGSVGFRW---------GEQGKWNLKEED--------- --------GRGEAVKLRMTAILDKDHDE---------------VVEVAFPYFGNRE----- -----------------HDHFQGTDHPDVLMKRVPVREMQLA-EGRAYVATV--------- ----FDLLCAN-YGLDRGL--------GGQHVARDYADGAPYTPAWAEKITGIPADAIVTT -AREF------AANAEATNGKSMVILGAGVNHWYHMD-MTYRGIINLLVMCGCVGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWNRPPRQMNSTSFFYAHTDQWRYETLGVGEI -------LSPTAPKGDWDASLIDYNVRAERMGWLPS-----APQLK-TNPLEVGRAARASG -LEPK-----DYIAQAL-----KG---------------GDLELSCMDPDDPA-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTAHGVQG--KDLGEMGGQKPREVKWHEEAPQGKL -DLLVTLDFRMSTTCVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-SAAVDPVW -ESKSDWEIYKGIAKTFSEVAPEVLGVE-QDLVLTPIQHDTANEIAQPF----DVADWGHG -EIEAIPGRTMATVALVERDY--PNLYNRFTALGPLMDKLGNGGKGIGWNTAAEVENL--- ------RRLNGVQDAGSPAAGMAKIETAIDAAEVLLMLAPETNGEVAVKAWDALSQF---- ------TGINHRHLALPKE----E-EKIRFR-DIQAQPRKIISSPTWSGLESEHVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHKWMRAFGEALCVYRPPIDTKAVK--PML---- -------------------------DQAEGRPHVVLNF-------------------ITPH -QKWGIHSTYTDNQLMLTLSR---------------GGPIVWMSEVDAAKAGLVDNDWV-- ----------------ETFNTNGALVARVVVSQRMKEGTLFMYHAQE-------------- ---KIVNVP-GSPLTGQRGGIHNSVT---RAILKPTHMIGGYVQ---------QAYGFNYY -GTV-GSNRDEYVIVRKLE-------KVDW------LEGALPEG--ENAA----------- ----- ->lewisrun_2019_sw_WHONDRS-S19S_0014_F_bin.22_scaffold_791_5 rank: A; aep:AMC99_00129 Respiratory nitrate reductase alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLTF--FRQKSE--TFS-DGHGLTTGEDR------HW-EDGYR -KRWQH------DKIVRSTHG-VNCTGSCSWKIYVKGGIITWETQQTDYPRTR-----PEL -PNHEPRGCPRGASYSWYIYSAQRLKYPLIRKRLVK---------LWREARRT--LPPVAA -WASIQADPVKRKSYTAIRGHGGFVRSTWDEVNEIIAAANAYTAKTY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNAGFLMMWGSNVPQTRTPDAH -FMTEARYRGTKVAVVSPDYAEATKFADLWLNPKQG-TDAALALAMGHVILREFHL----D -RQVPYFEDYCRRYSDMPMLVRL-----VEQDGRLVPERLLR---------ASDVKGG-LG -EGNNPEWKCVAIDEASDELVVPSGSAGFRW---------GEKGKWNLEEKD--------- --------GQGREVKLRMTAILDKDHDE---------------VVEVAFPYFGNRE----- -----------------HDHFEGTDHPDVLMKRVPVRQLDLT-EGR----AYVATV----- ----FDLLCAN-YGLDRGL--------GGEHVARDYAAMSPYTPAWGEKITGVPADAIITA -AREF------AANAEATNGKSMVILGAGLNHWYHMD-MNYRGIINLLVMCGCIGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWNRPPRQMNSTSFFYAHTDQWRYETLGVSEI -------LSPTAPKGDWDASLIDYNVRAERMGWLPS-----APQLK-TNPLEVGRAAKASG -MEPK-----DYVAQAL-----KG---------------GDLELSCLDPDDPA-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTAHGVQG--KDLGEMGGQKPQEVKWHDEAPQGKL -DLLVTLDFRMSTTCVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-SAAVDPVW -ESRSDWEIYKGIAKTFSEVAPEVLGVE-QDLVLTPIQHDTANEIAQPF----DVADWGKG -EVEPIPGKTMATVAVVERDY--PNLYKRFTALGPLMDKLGNGGKGIGWNTVTEVDNL--- ------RKLNGTVGDDGPTKGMARIDTAIDAAEVLLMLAPETNGEVAVKAWDALSQF---- ------TGRDHKHLALPKE----E-EKIRFR-DIQAQPRKIISSPTWSGLESEHVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHKWMRAFGEALCVYRPPIDTKAVK--PML---- -------------------------DQAEGRPHVVLNF-------------------ITPH -QKWGIHSTYTDNLLMLTLSR---------------GGPIVWMSEVDAAKAGLVDNDWV-- ----------------ETFNSNGALVARVVVSQRMKEGTLFMYHAQE-------------- ---KIVNVP-GSPLTGQRGGIHNSVT---RAILKPTHMIGGYVQ---------QAYGFNYY -GTV-GSNRDEYVIVRKLE-------KVDW---LEGALS-------EGENAA--------- ----- ->NASQAN2015_010_A_bin.16_Ga0466474_000034_25 rank: A; oca:OCAR_5043 nitrate reductase, alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLLF--FKKKVD--TFS-GTHGVVTNEDR------SW-ESSYR -SRWQH------DKIVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRLKFPMIRGRLVR---------LWRE--ARLSLDPVDA -WASIVEDPLKSAEYKSKRGLGGLVRANWDEVNEIIAAANIYTAKTF----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVSMSFYDWYCDLPPASPQTWGEQTDVPESADWYNAGFLMLWGSNVPQTRTPDAH -FMTEARYKGAKVVVVSPDYSEASKFADLWLHPKQG-TDAALAMAIGHVILKEFHV----E -GQSPYFNGYVRENTDLPFLVMLK-----EQDGYYVQDRFLR---------ASDFSGS-LG -QDNNPDWKTVAYDELNGQIVPPCGSIGFRW---------GESGQWNIEQKT--------- --------SDNQAVKLRLSLI------D-----------IKDEVASVGFPYFGGSE----- -----------------HPHFTHSAHDAIQKRNVPVKKIILA-DGTEVLATTVFDL----- -------LVAN-YGIDRGL--------GGGNVAASYDEDVPYTPAWQEKITGVSRSNVIAV -AREF------AINAEKTKGRSMVILGAGINHWYHMD-MNYRGIMNMLMLCGCVGQSGG-G ---WAHYVGQEKLRPQT---GWLPLAFGLDWKRPPRQMNSTSFFYNHTSQWRYETLKVSEI -------LSPTAKPEDWQGSLIDFNVKSERMGWLPS-----APQLQ-TNPLQVVRDAKAAG -IAPA-----DYVVAGL-----KN---------------GSLKMSCEDPDNPL-NFPRNMF -VWRSNLLGS---SGKGHEYFLKYLLGTQHGIQG---KDLGDDGDKPSEVVWHEKAAEGKL -DLLVTLDFRMSTTCLYSDIILPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -ESRSDWDIYKGIAKKFSELTIGHLGLE-QDIVTVPVLHDTPGELAQPF----EVKDWKKG -ECEPVPGKTMPSLVVVERDY--PNTYKMFTSLGPLLSKIGNGGKGIAWNTETEVKQL--- ------GELNYLVTEEGISKGLPRIASDIDATEVILMLAPETNGHVAVKAWEALSKI---- ------TGRDHTHLAKPRE----D-DKIRFR-DVQAQPRKIISSPTWSGLESEQVCYNACY -TNVHERIPWRTLT------GRQQFYQDHSWMRAFGETLCVYKPPVDTRSIT--P--ILG- -------------------------QKPNGNDELVLNF-------------------LTPH -QKWGIHSTYTDNLLMLTLSR---------------GGPIVWMGEIDAAKVGIKDNDWI-- ----------------EAFNVNGALVARAVVSQRVPEGMCMMYHAQE-------------- ---KIVNMP-GAETTGGRGGIHNSVT---RATLKPTHMIGGYAQ---------LSYGFNYY -GTV-GSNRDEFVIIRKMS-------KVDW---LEEPKPEQA------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0000093_1 rank: A; tun:J9260_09180 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- --------------NMLAMCG---CVGQSG------------------------------- -----------------------------------------------------------GG -WAHYV---------------------------------------------GQEKL----- ------------------------------------------------------------- --------------------------------------------------------RPQTG -WL------------------PLAFALDWSRPPRQM-NSTSFFY----------------- ------------------------------------------------------------- ------------------------------------------------------------- --------SHSNQWRYEKLEL---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------KEILSPL -ANPA------------------RHSGSLIDYNVRSE------------------------ ------------------------------------------------------------- -----------------------------RMGWLPS-----APQLN-TNPLRIAKAAQAAG -MSPA-----EYTVAAL-----KA---------------GKIAFAAEDPDNPQ-NFPRNLF -VWRSNLLGS---SGKGHEYMLKYLLGTQHGVQS--KDLGVMGGAKPEEVKWHDTAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-TAAVDPAW -EARSDWEIYKGIAKAFSKVCEGHLGVE-TDLVTLPLLHDAPAELGQAM----GVKDWKKG -ECELIPGKTAPALVAVERHY--PDTYARFTAIGPLLEKLGNGGKGISWNTETEVAFL--- -------GQLNHQQTTGINEGRPCLNSAIDAAEMILSLAPETNGQVAVKAWQALSKI---- ------TGIDHSHLAIHKE----D-EKIRFR-DVVAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHELIPWRTLT------GRQQFYLDHDWMRDFGESMLVYRPPINTKTIK--P--LLN- -------------------------QRSNGNPELALNW-------------------ITPH -QKWGIHSTYTDNLIMLTLSR---------------GGPIVWMSETDAKTLGIQDNDWI-- ----------------DLFNANGAIAARAVVSQRVMPGMVMMYHAQE-------------- ---KIVNVP-GSVITGHRGGIHNSVT---RVCPKPTHMIGGYAQ---------QAYGFNYY -GTV-GSNRDEFVIVRKMT-------QVEW---LDNE---------GNDYAQEAVQ----- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_1345490_1 rank: C; ops:A8A54_10745 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLN---FLARKNADTFS-DGHGVTTTENR------DW-EDAYR -KRWQH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYMYSANRVKHPLIRSRLLK---------LWRK------------ ------------------------------------------------------------- --------------------ERTIK------------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------------TPIGAWAAIQEN--------- --------PEKRADYMKMRGL---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------G ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_924190_1 rank: A; ops:A8A54_10745 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------FLARKNAGTFS-DGHGVTTTESR------DW-EDAYR -KRWQH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYMYSANRVKHPLVRSRLLK---------LWRK--ERTIKTPIGA -WAAIQENPEKRADYMKMRGLGGFVRATWEEVNEIIAAANAYTVKTY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGVCLSFYDWYCDLPPASPMTWGEQTDVPESADWYNAGFLILWGSNVPQTRTPDAH -FYTEVRYKGAKSVVVSPDYSEAAKFSDLWLHPKQG-TDAALAMAMGHVILREFHL----D -RQADYFEDYCRRYTDMPMLVKLTG----KDGHFIPD-RFVR---------ASDFTGA-LD -ETNNPEWKTVAVDAKTKQFVSPGGSIGYRW---------GEQGKWNLEAKDGKGADVDLA -MSFI---LDGEHDTIANVGF----------------------------PYFGNRE----- -----------------HDYFEGTDHDSVLVRKVPARKVKLA-DGEALVATV--------- ----FDLFVAN-YGLDRGL--------NDPNSAKSYQENLPYTPAWAEKITGVPRDQIIAV -AREF------ASNAEKTNGRSMVILGAGLNHWYHMD-MNYRGIINMLVMCGCVGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWNRPPRHMNGTSFFYAHTDQWRYETLKVDEI -------LSPTAPEGPWDASLIDYNIRAERMGWLPS-----APQLK-TNPLEVSKQAAAAG -KEAK-----DFVAEQL-----KA---------------GALSMSCEDPDDKA-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTKHGVLG--KDLGEEGRQISKEAVWHDEAPEGKL -DLLVTLDFRMSTTCVYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SSAADPAW -DARSDWEIFKGIARKFSEVAPEVLGVE-KDVVLVPTLHDTAGELAQPI----DVKDWKKG -EIEPIPGRTMPTVAVVERDY--PNLYKKFTSVGTLLDTVGNGGKGIAWNTEHEVDLL--- ------ARLNGVVQEEGVTRGRPRIESDIDATEVILSLAPETNGEVAVKAWEALSKF---- ------TGRDHTHLAIPKE----D-EKIRFR-DVVAQPRKIISSPTWSGLESEKVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHLWMRAFGEGFCVYRPPIDTKT----------- -VNPAIR------------------SKADGKPHLVLNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGPVVWISEPDAKRAGIVDNDWV-- ----------------EVYNTNGAIVARAVVSQRMKDGTVFMYHAQE-------------- ---KIVNTP-GSPITGQRGGIHNSVT---RVITKPTHMIGGYAH---------QSYGFNYY -GTV-GANRDEFVVVRKLE-------TVDW---LEGPHTESVAY--NKEAAE--------- ----- ->lecontecreek_2019_sw_WHONDRS-S19S_0018_F_bin.2_scaffold_1_206 rank: A; bprc:D521_0425 Respiratory nitrate reductase, alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLKF--LSADKE--EFS-DGHGVTVGEDR------TW-EDAYR -SRWQH------DKIVRSTHG-TNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYMYSANRVKYPMIRGRLLK---------QWREAKSVA-KSPVDA -WANLVENTAKRKEWMELRGKGGFVRSSWDEVNEIIAAANVYTIKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADIWMHPKQG-TDAAIAMAMGHVILKEFYF----N -KRTEYFDDYVRRYTDMPNLVMLEEKVLDDGRKVLVPGRYAR---------SSDFDGK-LG -QTNGADWKTVAFD-TAGKPVVPNGSIGFRW----GPEGRKDQGKWNLESKE--A------ --------NYGNDVKLKLSLMEDQSIHD------------VVPVGF---PYFGGID----- -----------------TPYFDANKQSDVLVQNIPAKKIILT-ENGVEKEVFVATV----- ----FDLLAGN-YGIDRGL---------GGECAKSYDDNVPYTPAWQESITGVKREQVIAV -ARQF------AENAEKTKGKSMVIIGAAMNHWYHCD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTPLAFALDWIRPPRQQNSTSFFYAHTDQWRYEKLGMEEV -------LSPLANKEEYTGSMIDFNVRAERMGWLPS-----APQLK-TNPLEVVKEALAAG -KDPK-----KYVVDGL-----KS---------------GTLQMSCEDPDHPS-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGADEARPSEVEWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -EARSDWDIYKGFAKKFSEVCVGHLGVE-KEIVMTPLMHDTPAELAQAF----DVQEWKKG -ECDLIPGKTAPQIAVVERDY--PNTYNRFTALGPLMDKVGNGGKGIAWDTKVEVEQL--- -------RELNGRVEHGEMKGMAKISTDIDAAEVVLMLAPETNGHVAVKAWDALSKI---- ------TGLEHAHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNACY -TNVHEYIPWRTLT------GRQQFYQDHKWMRAFGEGFVSYRPPVDLKTII--------- -----------EVKGIKPNGNK----------EIVLNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGPVVWLSEDDAVKAGIVDNDWV-- ----------------ELYNANGAIAARAVVSQRVNPGMVMMYHAQE-------------- ---KIINTP-GSEITGMRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVTVRKMR-------NIDW---LDTENANSVQA----------------- ----- ->whiteclaycreek2_2019_sw_WHONDRS-S19S_0038_B_bin.50_k121_1710496_1 rank: A; pde:Pden_4236 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLNF--LKSTRK-DTFA-DGHGQTTIENR------DW-EDTYR -SRWRH------DKIVRSTHG-VNCTGSCSWKIYVKNGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYLYSANRVKTPLVRGRLMR---------RWRDLRRT--LGPIEA -WTAIQSDPAARADYVKARGRGGFVRASWDEVTEIVAAANAYTAKTW----GPDRV-FGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNAGFLILWGSNVPQTRTPDAH -FYTEARYRGTKSAVVSPDYSEAAKFGDIWLNAKQG-TDAALAIAMGHVILREFHL----D -RQVDYFEDYTRRYSDFPMLVKLEP-----KGDRFVPGRMLR---------AADIDGA-LG -ETNNPDWKTVAIDDASGRLVAPNGSIGHRW---------GEQGTWNLEEKA--------- ---------GAESVRLRTTLI------------LDGQNDGTAGVDF---PYFGGSA----- -----------------TNGWQACDTPDVLTRAIPVRKVALK-DGE----AMVATV----- ----FDLLCAN-YGLDRGL--------GGDWVARDYGSDMPGTPAWAERITGVPADRIIQV -AREF------AANAEKTGGKSMIIIGAAMNHWYHMD-MNYRGVINMLVMCGCVGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWGRPPRHMNSTSAWYAHTDQWRYETVRSDEI ------LSPTAPAGDWSSLSLIDYNIRAERMGWLPS-----APQLR-TNPLQVAAAAKAEG -TEVR-----DYVAREL-----KA---------------GRLEMSCEDPDAPE-NWPRNLF -VWRSNLLGS---SGKGHEYFLKHLLGTDHGVLG--KDLGEEGRRKPVEARWHDKAPEGKL -DLLTCIDFRMSTTAVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-QAAVDPAY -ESKTDWEIFKAIAAKLSEIVPGYLGVE-TDVVQLPLQHDSPGEVAQPR-----VADWKQG -QCDLIPGKTAPAFIAVERDY--PNLYRRFTALGPLMEKAGNGGKGIAWDTKHEVAHL--- ------RALNGTVTDEGPTKGMARIDTAIDAAEVILMLAPETNGEVAVKAWEALSKA---- ------TGREHKHLALPKE----D-EKNRFR-DIAAQPRKIISSPTWSGIESESVCYNAGW -TNVHELIPWRTLT------GRQQLYQDHEWMLAFGEFFLAWRPPVDLKTIT--APATGA- -----------------LGANE---------KHVVLNF-------------------ITPH -QKWGIHSTYSDNLLMLTL------------------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.46_k121_495423_17 rank: A; acis:CBP35_16735 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLSY--FSQPRE--TFS-QGHGQTNGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLK---------HWRA-ALLLAKSPVDA -WANIVENESAKREWQKQRGLGGFVRSTWDEVNQMIAAANVYTIKKH----GPDRI-IGFS -PIPAMSMIS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSSFIIAWGSNVPQTRTPDAH -FLTEVRYKGTKVVSITPDYSEVAKLGDLWMHPKQG-TDAAVAMAMGHVILKEFYFKDGGK -GRSTYFDDYARRYTDLPLLVVLKEKTLPDGRTVMVPDRYVR---------ASDFPGQ-LD -QSNNPDWKTVGYD-ELGQVTLPNGSIGFRW----GADGRADEGLWNLENKE--A------ --------RTGNTVKLKLSVI------E--------DGEQAYDVADVAFPYFGGVQ----- ----------------TPNFTANEQGGDVMVRRVPVSHLELA-GHEAQGRVMVATV----- ----FDLLAGN-YGIDRGL--------PGEEPGGSYDADRPYTPAWQESITGVPREQIIAV -ARQF------ADNADKTHGKSMVIIGAAMNHWYHCD-MNYRGIMNMLMLCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWIRPPRQMNSTSFFYAHTDQWRYEKLGMEEI -------LSPLADKKSYSGSMIDYNVRAERMGWLPS-----APQLK-TSPLQVAKDAAAKG -MDAK-----DYVVQSL-----KD---------------GSLQMSCEDPDHPD-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTTHGVQG---KDLGRDEAKPEEVQWHANAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QAKSDWEIYKGFAKAVSEVSVGHLGVE-KDVVLTPIMHDTAGEMAQPY----GVRDWKKG -DCELIPGKTAPQVTVVERDY--PNLYKRFTALGPLMDKAGNGGKGIGWNTQTEVGQL--- ------GDLNGRVKEEGVTQGMPRIVSDIDATEVVLMLAPETNGHVACKAWEALGKQ---- ------TGRDHVHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYQDHPWMRDFGEGFVSYRPPVHLKALH----EVEG- -------------------------KKPNGNREIALNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGSVVWLSEDDAASAGIVDNDWV-- ----------------ELFNANGAIAARAVVSQRVNPGMVMMYHSQE-------------- ---KIINTP-GSEITGTRGGIHNSVT---RIVLKPTHMIGGYAQ---------YSYGFNYY -GTI-GTNRDEFVLVRKMD-------RVDWLDDEVSDTGAHA------------------- ----- ->lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.30_k121_510322_1 rank: A; hyb:Q5W_04195 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------QG------------------------------------------- ------------------------------------------------------------- -------------------------------------TDAALAMAMGHVVLKEFYFPAN-G -QRSSYFDDYARRYTDLPMLVMLKEQTLPDGSTTLVPDRYLR---------ASDFNGK-LG -QANNPDWKTVAFD-TTGKAVLPNGSIGFRW----GDQGREDAGKWNLESKE--A------ --------RDNGDVKLKLSVL------E-----DGAQDHQVVDVGF---PYFGGQQ----- ----------------TPNFPANAAVGDVNQAKVPAVRLRLG-KAGEERYALVATV----- ----FDLQVAQ-YGIDRGL----------GSGAKNYDDNAPYTPAWQETITGVPRQQVITV -ARQF------ADNADKTHGKSMVIIGAAMNHWYHAD-MNYRGVINLLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWLRPPRQQNSTSFFYAHTDQWRYEKLDVSEI -------VSPLADKAKFGGSMIDYNVRAERMGWLPS-----APQLK-TNPMQVVKDATAAG -MDPK-----DYVVQAL-----RD---------------GSLEMSCEDPDAPQ-NWPRNMF -VWRSNLLGS---SGKGHEYFCKHLLGTENGVQG---KDLGADEAKPTEVKWHKDAPQGKL -DLLVTLDFRMSTTCLYSDIVLPTASW--YEKNDLNTSDMH-PFIHP----L-SAAVDPVW -QSKSDWEIYKGFAKRFSEVCVGHLGVE-KEVVLTPLMHDTAAELAQPF----EVKEWKKG -ECELVPGKTAPQIAVVERDY--PNLYKRFTALGPLMNKLGNGGKGIGWKTEIEVEQL--- ------GQLNGVTREEGVTQGMPRIVSDIDACEVILQLAPETNGHVAVKAWDALGKQ---- ------TGRDHTHLALYRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHPWMVAFGEGFSSYRPPVDLK--T--TDVVQG- -------------------------LRPNGHKEIVLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGTVIWLSEDDAKSAGIQDNDWI-- ----------------ELFNVNGAVAGRAVVSQRVKNGMVMMYHSQE-------------- ---KIINTP-GSEITGVRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMQ-------KVDW---LDTP---------RDDHLVKAVQSQGEN -P--- ->yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_2728883_1 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------LYSANRVKYPLVRGRLLE---------RWRT-ALKTARTPVDA -WATIVENPDARRDYQKVRGMGGFVRSSWDEVNQLIAAANVYTIKKH----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQIWGEQTDVPESADWYNSTYIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAVTPDYSEVAKLADLWLHPKQG-TDAALAMAMGHVALNEFYF----K -QRSPYFDDYARRYTDLPLLVMLKEHILPDGSKTLVPDRYLR---------ASDFNGK-LG -QDNNPEWKTVAFD-AGGRAVLPNGSIGFRW----GAEGRSDAGKWNLENKE--A------ --------RHGAEVKLKLSVI------E--------DGTQAHEVVGVGLPYFGGVS----- ----------------TPHFTANAQQGEVNFVKVPAVRLRLG-KEGEQREALVATV----- ----FDLQVAQ-YGIDRGL----------GSGAKSYDDNAAYTPAWAESITGVPGDQIITV -ARQF------ADNAHKTRGKSMVIIGAAMNHWYHAD-MNYRGVINLLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWIRPPRQMNSTSFFYAHTDQWRYEKLGMEEI -------VSPLADKKLYGGSMIDYNVRAERMGWLPS-----APQLK-TNPLQVVKDATAAG -LDAK-----DYVVRGL-----RD---------------GTLQMSCEDPDAPQ-NWPRNMF -VWRSNLLGS---SGKGHEYFCKHLLGTESGVQG---KDLGKDDARPAEVAWHEHAPEGKL -DLLVTLDFRMSTTCLYSDVVLPTASW--YEKNDLNTSDMH-PFIHP----L-SAAVDPVW -QSRSDWEIYKGFAKAFSEVCIGHLGVE-KEVVLTPIMHDTAGEIAQPF----DVKEWKKG -QCELIPGKTAPQVTVVERDY--PNVFKRFTALGPLMDKLGNGGKGIGWKTGTEVEQL--- ------GQLNGTTQADGPTKGMPQIVTDIDACEVILQLAPETNGHVAVKAWQALGKQ---- ------TGRDHTHLALYRE----D-EKIRYR-DVQAQPRKIISSPTWSGIESETVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHPWMIAFGESMSSYRPPVDLKT----TSGIHN- -------------------------IKGNGNPEILLNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGPVVWLSEDDARLAGVQDNDWV-- ----------------EVFNINGAIAARAVVSQRVNPGMLMMYHAQE-------------- ---KIINTP-GSQITGVRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMS-------KVDW---LDTPR--------DDHLAAAYQAQGENP ----- ->yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_3072591_1 rank: C; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FTLPRE--RSA-DGHGVVTGEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLE------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------------------RWRAALTTARTPVDA -WAT--------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------IVENP------------ ------------------------------------------------------------- ------------------------------------------------------------- -DARRDYQKVRGMG----------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------G---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.19_scaffold_731_2 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FKLPQE--TYS-GRHGVATNEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLE---------RWRA-ALKVAKTPVDA -WALIADDESARRDYQQVRGLGGFVRSSWDEVNQLIASANVYTIKKH----GADRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPSSPQIWGEQTDVAESADWYNSSFIIAWGSNIPQTRTPDAH -FFTEARYKGTKTVAVTPDYSEVAKLSDLWLHPKQG-TDAALAMAMGHVILKEFYFKDGGQ -GRSAYFDDYARRYTDLPLLVMLKEHQLADGSTTLVPDRYLR---------ASDFSGQ-FG -QDNNPEWKTLAFD-TSGNPVLPNGSIGFRW---GEQLDEGELAKWNLESKD--A------ --------RNGQDVKLKLSVV------E--------DGAQPHEIAEVAFPYFGGVE----- ----------------TPNFPANAAQGEINRAKVPTVRLDLVGQGGESRQALVATV----- ----FDLQVAQ-YGIDRGF----------GSGAIDYDDNVPYTPAWQESITGVPRDQVITV -ARQF------ADNADKTHGKSMVIIGAAMNHWYHAD-MNYRGVINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWAPLAFALDWIRPSRQMNGTSFFYAHTDQWRYEKLGVEEV -------LSPLADKAAFGGSMIDYNVRAERMGWLPS-----APQLK-THPMQVVKDASAAG -LDAK-----DYVARAL-----KD---------------GSLQMSCEDPDAPQ-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSNGVQG---KDLGADEAKPTEVKWHAKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTASW--YEKNDLNTSDMH-PFIHP----L-SAAVDPVW -QAKSDWEIYKGFAQAFSEVCVGHLGVE-KEVVLTPLMHDTPAELAQPF----GVQDWKKG -ECALIPGKTAPQVTVVERDY--PNTYKRFTALGPLMNKLGNGGKGIAWKTDLEVTQL--- ------GQLNGVTLEEGVTKGMPKIVTDIDACEVILQLAPETNGHVAVKAWEAQSKA---- ------TGRDHVHLALYRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHEYIPWRTLT------GRQQFYQDHPWMIAFGEGFSSYRPPVDLK-----TTGGLS- -------------------------IKSNGNAEIQLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGTVIWLSEEDATKVGIVDNDWI-- ----------------ELFNSNGAIVGRAVVSQRVKPGMTMMYHSQE-------------- ---KIINTP-GSEITGARGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDWLEEPAGAPASGAGH----------------- ----- ->eastforkpoplarcreek_2019_sw_WHONDRS-S19S_0039_B_bin.13_k121_238651_23 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FKLPRE--AFS-GDHGLTTNEDR------TW-EDAYR -NRWAH------DKVVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLE---------RWRA-ALKVAKTPVDA -WALIAEDDAARRDYQQVRGMGGFVRSSWDEVNQLIASANVYTIKKH----GADRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPSSPQIWGEQTDVAESADWYNSNFIIAWGSNVPQTRTPDAH -FLTEARYKGTKTVAVTPDYSEVAKLSDLWLHPKQG-TDAALAMAMGHVVLKEFYFKDGGK -GRSAYFDDYARRYTDLPLLVMLKEHKLPDGSITLVPDRYLR---------ASDFNGK-LG -QGNNPEWKTVAFD-ADGRAVLPNGSIGFRW---GEKLGEGETPKWNLESKE--A------ --------RHGQDVKLKLSVV------E--------EGEQEHEIAEVAFPYFGGVQ----- ----------------TPNFPANSAQGEINRAKVPAVRLRLG-KEGDERYALVATV----- ----FDLQAAQ-YGIDRGF----------GSGAASYDDNAPYTPAWQEAITGVPRDQVVTV -ARQF------ADNADKTQGRSMVIIGAAMNHWYHSD-MNYRGVINLLMMCGCIGKSGG-G ---WAHYVGQEKLRPQT---GWAPLAFALDWIRPSRQMNSTSFFYAHTDQWRYEKLGMEEV -------ISPLADRKIYDGSMIDYNVRAERMGWLPT-----APQLK-TNPMQVVRDAAAAG -LDAR-----DYVAKAL-----KA---------------GTLQMSCEDPDAPQ-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSNGVQG---KDLGAGDAKPSEVKWHASAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTASW--YEKNDLNTSDMH-PFIHP----L-SAAVDPVW -QSRSDWEIYKGFAKAFSEVCVGHLGVE-KDVVLTPLMHDTPAELAQPF----EVKDWKKG -ECELIPGKTAQQITVVERDY--PNTYKRFTALGPLMNKLGNGGKGIAWKTELEVTQL--- ------GQLNGVTLEEGVTQGMPRIVSDIDACEVILQLAPETNGHVAVKAWDALGKV---- ------TGREHKHLALYRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHEYIPWRTLT------GRQQFYQDHPWMIAFGEGFSSYRPPVDLKT----TAEIAG- -------------------------VKPNGNPEIQLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEEDAAKAGIVDNDWV-- ----------------ELFNVNGAISARAVVSQRVKPGMTLMYHAQE-------------- ---KQINTP-GSEITGMRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDW---LDEPAGTAGSGH---------------- ----- ->cobbmillcreek_2019_sw_WHONDRS-S19S_0090_B_bin.15_k121_168873_1 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FSQPKE--TFS-GDHGLTTGEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPMVRSRLLE---------RWRA-AMKTAKTPVDA -WATIVEDDAARRDYQKVRGMGGFVRSSWDEVNQIIAASNVYTIKKH----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWG--------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->NASQAN2011_265_B_bin.52_k121_959771_6 rank: A; pzh:CX676_21060 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------GEQTDVPESADWYNAGFLMLWGSNVPQTRTPDAH -FYTEVRYRGTKSAVVSPDYSEAAKFGDIWLNPQAG-TDAALAMAMGHVILREYHL----D -RQAEYFEDYARKYTDMPMLVRLE-----DRDGHLVPGRMLR---------AEDFDGK-LG -ETNNPDWKTVAYDEATGQIAVPNGSIGFRW---------GEEGKWNLEQRA--------- ---------KGAEANLRLSQILDGHHDE---------------IVGVDFPYFGGVA----- -----------------TGDFVKCDHPEVLTRNIPARRAKLA-DGSQVLAATVFDL----- -------FCAN-YGLDRGL--------GGKWVSKDFNDDSPYTPAWAEKITGVAREKIIAV -AREF------AGNAEKTHGKSMVILGAGLNHWYHMD-MNYRGIINMLVMCGCIGQEGG-G ---WSHYVGQEKLRPQT---GWAPLAFALDWNRPPRQMNSTSCWYAHTDQWRYETLRAGEI -------LSPTAPEGDWHISLIDYNIRAERMGWLPS-----APQLK-TNPLEVAKAAKAA- ----------GKAIPAYVAEQLKS---------------GALQMSCEDPDAPE-NWPRNLF -VWRSNLLGS---SGKGHEYFLKHLLGTDHGVMG--KDLGEEGGVMPKEAVWHDEAPKGKL -DLLVTIDFRMSTTCVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-QAAVDPAY -ESKSDWEIFKSIARKFSEVAPEVLGVE-TDIVQLPLLHDTPGELAQAH-----VRDWKKG -ECDLIPGKTAPNYIAVERDY--PNLYKKFTSVGPLLEKLGNGGKGINWDTKVEVGHL--- ------RDLNGVVQDEGVSKGMAKLDTAINAAEMILMLAPETNGEVAVKAWEELEKP---- ------TGRHHAHLAEGAH----H-TKIRFR-DVAAQPRKIISSPTWSGIESETVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHLWMRAFGEGFVSYRPPVDLKTI---TKAVNN- -------------------------DAAEGNPHVVLNF-------------------ITPH -QKWGIHSTYTDNLLMLTLNR---------------GGPVVWMSEVDAQKARLVDNDWV-- ----------------EAYNINGALTARVVVSQRIKQGTLFMYHAQE-------------- ---KIVNTP-GSEKTGHRGGIHNSVT---RTTLKPTHMIGGYAQ---------LSYGFNYY -GTV-GSNRDEFVIVRKMK-------KVDWLD-TPATHKVEAAE----------------- ----- ->NASQAN2011_265_B_bin.52_k121_465271_4 rank: C; pzh:CX676_21060 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLNFFQSKELEQ---FS-DGWGQTTRENR------DW-EDVYR -NRWRH------DKIVRSTHG-VNCTGSCSWKIYVKSGIVTWETQQTDYPRTR-----AGL -PNHEPRGCARGASYSWYLYSANRVKNPLIRGALMR---------AWRK--MRPTMTPVAA -WAAIQNDPVLRASYTKTRGKGGFVRATWDEATEIIAAANAYTAKTY----GPDRV-FGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPQTWGEQTDVPESADWYNAGFLMLWGSNVPQTRTPDAH -F----------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.45_k121_975195_1 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLSH--FSAPKE--EFA-DGHGVATGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----ADL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLQ---------HWRA-ALLVAKSPVDA -WASIVENPQARAEWQKQRGLGGFVRSTWEEINQLVASANVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAVAMAMGHVILKEFYF----D -KRSAYFDNYVRRYTDMPNLVQLEERTLPDGRKVMVPGRYLR---------ASDFDGK-LG -QSNNPEWKTVALD-QDDKIVLPNGSIGFRW----GAAEREDLGKWNLENKE--A------ --------RGDTQVTLKLSLM------E----GAKDGSAADYEVGDVGFPYFGGID----- -------------TPNFDANKQSAAVGDVLVRKVPVRRVKLG-KAGEERYALVATV----- ----FDLTVAN-YGVARGL--------PGENAALSYDDDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFA--------------------------------- -----------------------------------------------LDWVRPPRQMNSTS -FFY------------------AH------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------TDQWR--------------------------------- ------------------------------------------------------------- -----------------------Y------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------ERLGVDE------ ------------------------------------------------------------- -------------------------------ILSPL------------------------- --------------ADKSK------------------------------------------ ----- ->NASQAN2015_172_B_bin.54_k121_327740_1 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------IWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAIAMAMGHVILKEFYF----D -KRSAYFDDYVRRYTDMPNLVQLEERTLPDGRQVVVPGRYIR---------ASDFNGK-LG -QDNNPDWKTVALD-QNDKIVLPNGSIGFRW----GAEGRSDEGRWNLENKE--A------ --------RGDGDVKLKLSLM------E--------GEDSEYQVGEVAFPYFGGID----- -------------TPNFHANKQVSAVDDVLVRKVPVRRIKLG-KAGEERYALVATV----- ----FDLTVAN-YGVARGL--------DGETAAKDYEEDVPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNSTSFFYAHTDQWRYEKLGVEEI -------LSPLADKSKFGGSLIDYNVRAERMGWLPS-----APQLQ-TNPMQVVKDAQAVG -MDPK-----EYAIKAL-----QD---------------GSLKMSCEDPDNPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGPEDAKPAEVKWHDKAPEGKL -DLLVTLDFRMSTTCMYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSRSDWEIYKGFAKAFSEVCVGHLGVE-KELMLTPLMHDTPAELAQAF----EVNEWQKG -KCELIPGKTAPQITVVERDY--PSTYKRFTALGPLMAKVGNGGKGIGWNTADEVQQL--- ------GELNGHVRTEGVTKGFPKIETDIDACEVVLQLAPETNGHVAVKAWEALGKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHELIPWRTLT------GRQQFYLDHPWMIAFGEGLTSYRPPVDLKT----VDDMID- -------------------------RKPNGNKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKDAGIVDNDWV-- ----------------ELFNTNGAIAARAVVSQRVNPGMVMMYHAQE-------------- ---KIINTP-GSEISGMRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVIVRKMR-------KIDW---LDNEANNQVQV----------------- ----- ->Yukon_2004-1_F_bin.10_scaffold_678_1 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- -------------------------------------NGKLGQDNNP------EW-KTVAL -DQA--------DRVVL-----PNGSIGFRWGAEGRSD--------------------AGK -WNLEDKEARGG--------NEVKLKLSLM------------------------------- ---------------------------------------------------------EGEG -ADYEVGEVA--------------------------------------------------- ----------------------FPYFGGIDT------------------PNFSANKQASA- -------------------------------------VD---------------------D ------------------VLVR--------------------------------------- ------------------------------------------------------KVPVR-- ------------------------------------------------------------- -------------------------------------RIKLG-KAGEERYALVATV----- ----FDLTAAN-YGVGRGL--------PGEDAAASYDDDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNSTSFFYAHTDQWRYERLGVEEI -------LSPLADKTKFGGSMIDYNVRAERMGWLPS-----APQLQ-TNPMQVVKDAQAQG -MDPK-----EYAVKSL-----KD---------------GSLKMSCEDPDHPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGAEEAKPTEVTWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWEIYKGFAKSFSEVCVGHLGVE-KELLLTPLMHDTPAELAQAF----DVQEWSKG -DCDLIPGVTAPQINVVERDY--PNTYKRFTALGPLLEKHGNGGKGIGWNTDDEVHQL--- ------GELNGKVRAAGVTQGMPKIETDIDACEVVLQLAPETNGHVAVKAWEALGKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYLDHPWMLAFGEGMTTYRPPVDLKT----VDEMLN- -------------------------RRPNGNKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKSAGIVDNDWV-- ----------------ELFNSNGAIAARAVVSQRVNRGMVMMYHAQE-------------- ---KTINTP-GSEITGIRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKML-------KVDW---LDDEAPATVQA----------------- ----- ->cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.17_Ga0451756_0000169_17 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLNY--FSNPKE--AFS-GGHGVTTGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLK---------HWRAALAVA-KSPVDA -WTSIVENPNARLEWQEQRGLGGFVRSTWEEVNQIIASANVYTIKQY----GADRI-IGFS -PIPAMSMIS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAIAMAMGHVILKEFYF----D -KRSAYFDDYVRRYTDMPNLVQLEERTLPDGRKVTVPGRYLR---------ASDFNGK-LG -QDNNPEWKTVALD-QADRMVLPNGSIGFRW----GAEGRSDAGKWNLEDKE--A------ --------RGGNEVKLKLSLM------E--------GEGADYEVGEVAFPYFGGID----- -------------TPNFSANKQASAVDDVLVRKVPVRRIKLG-KAGEERYALVATV----- ----FDLTAAN-YGVGRGL--------PGEDAAASYDDDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNSTSFFYAHTDQWRYERLGVEEI -------LSPLADKTKFGGSMIDYNVRAERMGWLPS-----APQLQ-TNPMQVVKDAQAQG -MDPK-----EYAVKSL-----KD---------------GSLKMSCEDPDHPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGAEEAKPTEVIWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWEIYKGFAKSFSEVCVGHLGVE-KELLLTPLMHDTPAELAQAF----DVQEWSKG -DCDLIPGVTAPQINVVERDY--PNTYKRFTALGPLLEKHGNGGKGIGWNTDDEVHQL--- ------GELNGKVRAAGVTQGMPKIETDIDACEVVLQLAPETNGHVAVKAWEALGKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYLDHPWMLAFGEGMTTYRPPVDLKTV----DEMLN- -------------------------RRPNGNKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKSAGIVDNDWV-- ----------------ELFNSNGAIAARAVVSQRVNRGMVMMYHAQE-------------- ---KTINTP-GSEITGIRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKML-------KVDW---LDDEAPATVQV----------------- ----- ->cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.23_Ga0451756_0000618_5 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLNY--FSNPKE--PFS-GGHGVTTGEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----ADL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLK---------HWRA-ALAVAKSPVDA -WASIVQNEDARREWQQQRGLGGFVRSTWDEVNQLIASANVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWGEQTDVPESADWYNSTYIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAIAMAMGHVILKEFYF----D -KRSAYFDDYVRRYTDMPNLVQLEERTLPDGRKVTVPGRYLR---------ASDFNGK-LG -QDNNPEWKTVALD-QNDRVVLPNGSIGFRW----GAEGRSDAGKWNLENKE--A------ --------RGDSEVKLKLSLM------E--------GEGSEYEVGEVAFPYFGGID----- -------------TPNFSANKQASAVDDVLVRHVPVRRIKLG-KAGEERYALVATV----- ----FDLTAAN-YGVARGL--------PGENAATSYDHDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNSTSFFYAHTDQWRYERLGVEEI -------LSPLADKSKFGGSMIDYNVRAERMGWLPS-----APQLQ-TNPMQVVKDAQAQG -MDPK-----DYAVKAL-----KD---------------GSLKMSCEDPDHPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGAEDAKPTEVTWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWEIYKGFAKAFSEVCVGHLGVE-KELMLMPLMHDTPAELAQAF----DVKEWSKG -ECELIPGKTGPQISVVERDY--PNTYKRFTALGPLMEKAGNGGKGIGWNTTDEVHQL--- ------GELNGKVRAEGVTQGMPNISTDIDACEVVLQLAPETNGHVAVKAWEALSKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYLDHPWMQAFGEGMTSYRPPVDLKT----VDEMID- -------------------------RRPNGNKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKNAGIVDNDWV-- ----------------ELFNSNGAIAARAVVSQRVNPGMVMMYHAQE-------------- ---KTINTP-GSEITGIRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMR-------KVDW---LDGEAPATVQA----------------- ----- ->NASQAN2011_028_B_bin.24_k121_53788_5 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLNY--FTNPKE--PFS-GRHGVTTGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----ADL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLQ---------HWRA-ALAVAKSPVDA -WTSIVQNEDARREWQQQRGLGGFVRSTWDEVNQLIASANVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWGEQTDVPESADWYNSNFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAIAMAMGHVILKEFYF----D -KRSAYFDDYVRRYTDMPNLVQLEERNLPDGRKVMVPGRYLR---------ASDFNGK-LG -QDNNPEWKTVALD-QNDRVVLPNGSIGFRW----GAEGRSDAGKWNLENKEA-------- --------RGDNEVKLKLSLM------E--------GEGSDYEVGEVAFPYFGGID----- -------------TPNFSANKQASAVDDVLVRHVPVRRVKLG-KAGEERYALVATV----- ----FDLTAAN-YGVARGL--------PGENAATSYDHDTPYTPAWQEKITGVKQDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTPLAFALDWVRPPRQMNSTSFFYAHTDQWRYERLGVEEI -------LSPLADKSKFGGSMIDYNVRAERMGWLPS-----APQLQ-TNPMKVVKDALAQG -MDPK-----DYAVKSL-----KD---------------GSLKMSCEDPDHPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGIEDAKPTEVHWHDQAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWEIYKGFAKAFSEVCVGHLGVE-KELMLTPLMHDTPAELAQAF----DVKEWKKG -ECELIPGKTAPQISVVERDY--PNTYKRFTALGPLMEKAGNGGKGIGWNTADEVHQL--- ------GELNGKVRAEGVTKGMPNISTDIDACEVVLQLAPETNGHVAVKAWEALSKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYLDHPWMLAFGEGMTSYRPPVDLKT----VDEMID- -------------------------RKPNGHKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKSAGIVDNDWV-- ----------------ELFNSNGAIAARAVVSQRVNPGMVMMYHAQE-------------- ---KTINTP-GSEITGIRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMR-------KIDW------------------------LDGEAPA -TVQA ->NASQAN2015_227_F_bin.21_scaffold_4919_3 rank: C; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLNY--FTNPKE--PFS-GRHGVTTGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----ADL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLQ---------HWRAALAVA-KSPVDA -WTSIVQNEDARREWQQQRGLGGFVRSTWDEVNQLIASANVYTAKQY-------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->Yukon_2004-1_F_bin.10_scaffold_25058_1 rank: C; rfr:Rfer_2792 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLSY--FSQPRE--SFS-GDHGVTTGEDR------TW-EDAYR -TRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPLVRGRLLK---------LWRE--ARLSMQPVDA -WASIAQSDEKRREYQTVRGLGGFVR------------SNVYTIKKH----GPDRI-VGFS -PIPAMSMVS------YGAGSRYLSL----------------------------------- ----IGGVPLSFYDWYCDLPPASPQVWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAVTPDYSEVAKLSDIWMKPKQG-TDAAVAMAMGHVILKEFYF----P -DGGKPRSAY---FDDMPMLVMLKEHQLPNGDTVMVPDRYVR---------ASDFNGK-LG -AANNPDWKTVAFD-ESGKVVLPNGAIGFRW----GPDGRADEGQWNLEAKE--A------ --------RHGTEVKLKLSVM------E--------GDNPSLETAKVGFPYFGGIV----- -------------SEHFPNNATGDAAKDVLVRTVPVQRISLG-KEGDKREALVATV----- ----FDLQVAN-YGVARGL--------PGELAAKDFNDDTPYTPAWQERITGTPREQLITV -ARQF------AENADKTHGKSMVIIGAAMNHWYHAD-MNYRGVINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNGTSFFYAHTDQWRYEKLGMDEV -------LSPLADKKLYGGSMIDYNVRAERMGWLPS-----APQLK-TNPFQVVKDAEAAG -MSPV-----DYTVKSL-----KD---------------GSLAMSCEDPDHPN-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTTHGVQG--------------------------- --------------------------------KDLGADEAK-------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------PTEVVW------------------------------ -----------------------------------------HKEAPEGKLAL--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----VVTLD---------------------------------------------------- -----------------------------F------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4056_4 rank: C; buq:AC233_31260 narZ; nitrate reductase; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --WRSNILGS---SGKGHEYFLKHLLGTSNGVQG---KDLGPQDAKPTEVKWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SAAVDPAW -QSRSDWEIYKGFAKKFSEVCVGHLGVE-QEVVLTPLMHDSPAELGQPM----GVQDWKRG -DCELIPGKTAPQITVVERDY--PNVFKRFTALGPLMNKVGNGGKGIAWNTQVEVTQL--- ------GQLNGLVREEGVTKGMPKIDTDIDACEVVLQLAPETNGHVAVKAWEALSKA---- ------TGRAHKHLALYRE----D-EKIRFR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHAWMLAFGEGFGSYRPPVDMKA----TALMHN- -------------------------QRPNGQPEILLNF-------------------ITPH -QKWGIHSTYTDNVLMLTLSR---------------GGPIVWLSEDDAKSAGIVDNDWV-- ----------------ELFNVNGAIAARAVVSQRVKPGMVMMYHAQE-------------- ---KIINTP-GSEITHVRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMD-------KIDW---LDTPVG-------AERVTRVQAQGENA- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4528_3 rank: C; metr:BSY238_1272 nitrate reductase, alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLSY----FSQPTEPFS-NEHGITTGEDR------TW-ENAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCQRGASYSWYLYSANRVKHPMVRARLLK---------HWRE--ARLHHDPVDA -WASIMANETKRRDYQQVRGLGGFVRSSWDEVNEIIAAANVHTIKKH----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQIWGEQTDVPESADWYNSSYIIAWGSNVPQTRTPDAH -FFTEVRYKGCKTVAVTPDYSEVAKLADLWMHPKQG-TDAALAMAMGHVILKEFYF----D -RRAAYFDDYARRYTDLPMLVMLREQTLDNGRTVLVPDRLLR---------ASDFNGK-LG -QANNPDWKTIAFD-TTGKAVAPNGSIGFRW----GPEGRADAGRWNLEDKD--A------ --------RTGADTKLKLSVL------EDEHGEGAAQAHEIVEVGF---PYFGGVV----- ----------------NPHFTGNDQGGDVRRIHVPAVRLRLG-KAGEERHALVATV----- ----FDLQAGQ-YGIDRGL----------GTGAKNFDDDAPYTPAWQEAITGVPREQVIAV -ARQF------AENAEKTEGRSMVIIGAAMNHWYHAD-MNYRGVINMLMMCGCIGKSGG-G ---WAHYVGQEKLRPQT---GWTALAFA--------------------------------- -----------------------------------------------LDWIRPPRQQNSTS -FFY------------------AH------------------------------------- ---------------------------TDQWRYE--------------------------- -----------------------------------------------------KLGMDEVL -SPLADKAAFKGSAIDFK------------------------------------------- ------------------------------------------------------------- --------------------------------APQLNVNPIQVAKA--------------- -------------------------ARAA-------------------------------- --------------------G---------------------------------------- ------------------------------------------------------------- ------------------------------------------VDPKDYTVQGLKNGS---- --------------------------------------IDLACHDPDAP------------ -----------------------------QNW----------------------------- -------PRNMFV----------------W------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.3_scaffold_11088_2 rank: A; metr:BSY238_1272 nitrate reductase, alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ----------------------S-------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------D ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------MNYRGVINMLMLCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWIRPPRQMNSTSFFYAHTDQWRYEKLGMDEI -------LSPLADKKAYAGSMIDYNVRAERMGWLPS-----APQLK-TNPLKVVRDASAAG -MDPK-----DYTVKGL-----KD---------------GTLKMSCEDPDHPD-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGRDEAKPSEVVWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWDIYKGFAKKFSEVCVGHLGVE-REMVLSPMMHDSPGELAQPL----DVKDWKRG -EVDLIPGKTAPNMVVVERDY--PNVYKRFTALGPLMNKVGNGGKGIAWNTQTEVKQL--- ------GELNGLITEQGVTCGMPRIDSDIDACEVVLQLAPETNGHVAVKAWQALGKQ---- ------TGIDHTHLALYRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHELIPWRTLT------GRQQFYMDHPWMIAFGEGFTSYRPPVDLKTT---------- ----------AGIHGIKSNGNP----------EILLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKRAGIVDNDWV-- ----------------ELFNINGAIAARAVVSQRVNNGMTLMYHAQE-------------- ---KIINTP-GSEITGIRGGIHNSVT---RVVLKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDW---LDTPADASNPA------------GSHA- ----- ->NASQAN2016_164_F_bin.17_scaffold_8891_2 rank: A; rfr:Rfer_2792 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTY--FSQPRE--SFS-GDHGVTTGEDR------TW-ENAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPLVRGRLLK---------LWRE--ARLSQDPVDA -WASIAQSDAKRKEYQSVRGLGGFVRSSWDEVNEMVAAANVYTIKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQIWGEQTDVPESADWYNS----------------DAH -FFTEVRYKGTKTVAVTPDYSEVAKLSDIWMKPKQG-TDAAVAMAMGHVILKEFYFPDGGK -ARSTYFDDYVRRYTDMPMLVMLKEQTLPSGEVVMVPDRYLR---------ASDFNGK-LG -AANNPEWKTVALD-ESGKVVLPQGAIGFRW----GPDGRADEGQWNLQAKE--A------ --------RHGNDVKLKLTVM------E-----GEQASLETAKVGF---PYFGGIE----- -------------SEHFPNNATGAGANNVLVRTVPVQRIALG-KAGDTREALVATV----- ----FDLQVAN-YGVARGL--------PGELAAKDFNDDTPYTPAWQERITGTPREQLITV -ARQF------ADNADKTHGKSMVIIGAAMNHWYHAD-MNYRGVINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFGLDWIRPPRQMNSTSFFYAHTDQWRYEKLGMEEV -------LSPLADKKAFGGSMIDYNVRAERMGWLPS-----APQLK-TNPLQVVRDAQAAG -MEPK-----DYAVKGL-----KE---------------GTLSMSCEDPDHPD-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSNGVQG---KDMGHDEAKPEEVVWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->NASQAN2015_227_B_bin.17_k121_559871_7 rank: A; rfr:Rfer_2792 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTY--FSQPKE--AFS-GEHGVSTGEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPLVRGRLLK---------LWREARLS--MDPVDA -WASIAQDDAKRKEYQSVRGLGGFVRSGWDEVNEMVAAANIYTIKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYC-------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.12_scaffold_10959_2 rank: A; aon:DEH84_18240 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- --------------------AA-------------------------------DW-VRPSR -QQN--------STSFFYAHT---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------DQWRYEKL----------------- --------------GVNEVLSPLADKAKF-------------------------------- ------------------------------------------------------------- ----------------------------------------GGSMI---------------- ---------------------------D--------------------------------- ------------------------------------------------------------- ----YNVRAER-------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------MGWLPS-----APQLQ-TNPLNLVKEAQAKG -MDAK-----DYAVQSL-----KD---------------GSLKMSCEDPDNPA-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTTHGVQG---KDLGPNDAKPQEVQWHNQAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SAAVDPAW -EARSDWEIYKGFAQKFSEVCVGHLGAE-REVVMTPIMHDTAAELAQPF----GVQEWKKG -EIDLIPGKTAPQIAVVERDY--PNTFKRFTSLGPLMNKLGNGGKGIGWNTQDEVHAL--- ------GELNGTVREEGVSQGMPKIVSDIDASEVVLMLAPETNGHVAVKAWEALGKQ---- ------TGRDHTHLALHRE----D-EKIRYR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHELIPWRTLT------GRQQFYMDHPWMIAFGEGFVSYRPPVDLKT----LDDIKG- -------------------------VKPNGNKEIALNF-------------------ITPH -QKWGIHSTYTDNLLMLTLNR---------------GGPVIWLSEDDAKSAGIVDNDWV-- ----------------ELFNTNGAIAARAVVSQRVNNGMVLMYHAQE-------------- ---KIVNTP-GSEITGTRGGIHNSVT---RVVLKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDWLDDESSNQGVHA------------------- ----- ->NASQAN2016_164_F_bin.17_scaffold_1152_1 rank: C; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- -----------------VTCG---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------------MPKI- ------------------------------------------------------------D ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------TDIDAC------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------EVVLQLAPETNGHVAVKAWKALGKQ---- ------TGLDHTHLALYRE----D-EKIRFR-DIQAQPRKIISSPTWSGIESETVSYNA-- --------------------GYTNVHEMIPWRTR--EGFTTYRPPVDLKT----TAGIQN- -------------------------IKPNGNKEIALNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGSVVWLSETDAKSVGIEDNDWI-- ----------------EVFNINGAIAARAVVSQRVNPGMTLMYHSQE-------------- ---KIINTP-GSEITGMRGGIHNSVT---RIVLKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDW--------------------LEEEAQGENA- ----- ->NASQAN2015_227_F_bin.21_scaffold_2406_1 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------VSYNAGYTNVHEMI---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------PWRTL-------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------T------------------------------------- --------------------GRQQFYMDHPWMTAFGENFSSYRPPVDLKT----TAGIQN- -------------------------IKPNGNKEIALNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGSVVWLSEDDAKSAGIEDNDWI-- ----------------EVFNINGAIAARAVVSQRVNPGMTLMYHSQE-------------- ---KIINTP-GSEITGVRGGIHNSVT---RIVLKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMA-------KVDWLDDEGSSTEPTATHN---------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.10_scaffold_7566_1 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FSSPKE--SFS-DGHGVTTGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTRD-----DL -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLQ---------HWRA-ALAVSKSPVDA -WANIVENTAARSEWQKQRGLGGFVRSTWEEVNQLIASANVYTAKKY----GPDRV-MGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSNFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYSEVAKLADLWMHPKQG-TDAAVAMAMGHVILKEFYF----N -KRSAYFDDYVRRYTDMPNLVQLEERTLPDGRKVMVPGHYLR---------ASDFNGK-LG -QDNNPEWKTVAID-ENDKIVLPNGSIGFRW----GAEGRSDMGKWNLESKEA-------- --------RGDAEVKLKLSLM------E--------GATPDYEVGDVGFPYFGGID----- -------------TPNFNANKQGEAVDDVLVRKVPVRRIKLG-KAGEERYALVATV----- ----FDLTVAN-YGVARGL--------AGENAALSYDDDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTKGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNGTSFFYAHTDQWRYEKLGVEEI -------LSPLADKSKFGGSLIDYNVRAERMGWLPS-----APQLE-TNSFQVVKDAQAAG -MDTK-----DYVVKSL-----KD---------------GSLKMSCEDPDNPK-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTTNGVQG---KDLGAEEAKPTEVQWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSRSDWEIYKGFAQAYSEVCVGHLGVE-KEVVLTPLMHDTPSELAQAF----DVKEWKKG -ECDLIPGKTAPTIAVIERDY--PNTFARFTALGPLMEKAGNGGKGIGWDTKVEVQQL--- ------QSLNGKVHTEGVSKGMAKIVTDIDAAEVILQLAPETNGHVAVKAWEALSKI---- ------TGRDHTHLAIHRE----D-EKIRFR-DVQAQPRKIISSPTWSGI----------- ----------------------------ESETVSYNAGYTNVHE----------------- ----------------------------------MIPWRTLT------------------- ------------------------------------GRQHFYL------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_237162_4 rank: C; deu:DBW_2564 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- --------------------------------TLT-------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------GRQHFYLDHDAYIAFGEHLSTYKPSPT-------------- ----------PEAYGDLRKT-----VNDGHAKMLN---------------------CLTPH -GKWHIHSTYGDTLRMLTLSR---------------GNEPCWLSEEDAAELGIKDNDHV-- ----------------EVYNDHGVYVARACVSARIPKGVCIVYHAVERTYNIP-------- ---KSQIRR-GEHGEPRRGGMNNSFT---RVHLKPNLMCGGYGQ---------FTYHFNYW -GPV-GVNRDTHVLVRKMH-------VVEY------------------------------- ----- ->sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_397025_1 rank: C; mox:DAMO_0778 narG; Nitrate reductase, alpha chain; may be more similar to a nitrite oxidoreductase; K00370 (db=kegg) ------------------------------------------------------------- --------------------MG--------------WIQDLFAPEQR------SW-EDFYR -NRWAH------DKVVRTTHG-VNCTGSCSWNVYVKQGVVTWEMQALDYPTID-----RSI -PNYEPRGCQRGISTSWYIYSPLRVKHPYMRGALLD------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------LWQEARRE--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------------------------HP------------------ ----------DDPVAAW-------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------ASIT----------------------------------- ------------------------------------------------------------- ----- ->AFN37208|Nitrolancea_hollandica_Lb ------------------------------------------------------------- ----------------------------------------------R------QW-EEFYR -NRWQH------DNITRSTHG-VNCTGGCSWMVFVKDGIVTWEMQATDYPLLE-----PSL -PPYEPRGCQRGISASWYVYSPIRVKYPYMRGPLMD---------FWREARAQH-SDPIQA -WASIVQDEQKRQRWQRARGKGGFRRATWDECLELVASSLLYTAKKY----GPDRV-VAFA -PIPAYSYLS------FGAGTRFIQL----------------------------------- ----FGGFTLSFYDWYADLPNSFPEVWGDQTDVCESADWYNSKFIVANGANMNMTRTPDVH -FISEARHNGTKFVVIAPDFSQVAKYSDWWLPVKAG-QDQALWMGIDHVILKEFYI----D -RQVPYFIEYQKRYTDGPMLVKVHP----TKGGAYSMGQFLR---------ANRINRY--K -DVENGNWQLLVWDKQSG-PRLPKGCIGYRW-------AKKETGKWNITMED--A------ --------MDNTPLDPLLSFL---GQHD---------------------AVAEVEF----- ---------------------DIFGTGKVSRRAVPIKYLETS-EGKVAVTTA--------- ----FDLLLAQ-FAVGRPG--------LTGDYPKSYDDDMPYTPAWQEPYTGIGRDTVIRF -AREF------AGNAEATQGRSMVITGASLNHWYNNG-LCYRGPITALILCGCCGRNGG-G ---LNHYVGQEKLTLVA---AWSCWALGKDWVPTSRLQQSSSWHYAHSDQWRYEGDFTEYA --------PIPRETRWAKGHAMDLLASAVRMGWMPS-----YPQFN-RNPLDVVKQAEAAG -AKT------DEQIVKWVVEQVKS---------------KQLKFAIEDVDAPE-NWPRTWL -IWRGNALQS---SAKGAEFFLRHYLGTHDNAIA-----EEHAKGRVKDVTFREPAPRGKM -DLLCQLNFRMDTTATYCDVVLPTAFW--YEKNDLNTTDLH-TFIHP----L-GAATPPAW -ESKTDYEIFKAIAKKVSELAPSVFQGPVKDIVMTPLAHDTPDELSQDYQAGMKVLDWGKG -EIEMIPGKTAPHFKVVERDY--ANIYNQWITFGPKARENGIVGNGEHIDIKPFYDELLEN -PIDAQPDVRHMRCRVWGGQRYPGLEFAEEAANLLLHLSPESNGEVSYHAFKEGEHQ---- ------VGLPLADLAEGVR----G-VRMTYF-DLTRQVRRTLISPCWTGMVNDGRAYAAWC -LNVERLIPWRTLS------GRQHHYMDHPYYIDYGEQLMTHKPKLDPRK----TGDIV-- -------------------------RSPVDDESVVLNY-------------------ITPH -GKWHIHSTYYDNHRLLTLSR---------------GIEPCWLNDKDAARIGVKDNDWV-- ----------------EVYNDNGVMVTRAAVSARVQMGTCMIYHAPE-------------- ---RTISIPKSQVRGNRRGGAHNSLT---RIRINPMQMAGGYAQ---------WTYAWNYW -GPIGIMTRDTHVAVR--------------------------------------------- ----- ->AFN37205|Nitrolancea_hollandica_Lb ------------------------------------------------------------- -----------------------------------------------------QW-EEFYR -NRWQH------DNITRSTHG-VNCTGGCSWMVFVKDGIITWEMQATDYPLLE-----PSL -PPYEPRGCQRGISASWYVYSPIRVKYPYMRGPLMD---------FWREARAQH-SDPIQA -WASIVQDEQKRHRWQRARGKGGFRRATWDECLELVASALLYTAKKY----GPDRV-VAFA -PIPAYSYLS------YGAGSRFIQL----------------------------------- ----FGGFNLSFYDWYADLXNSFPEVWGDQTDVCESADWYNSKFIVSNAANMNMTRTPDVH -FISEARHNGTKFVVLAPDFSQVAKYSDWWIPVKAG-QDQALWMGADHVILKEFYI----D -RQVPYFIEYQKRYTDGPMLVKVHP----TKGGAYSMGQFLR---------ANRINRY--K -DVENGNWQLLVWDKQSG-PRLPKGCIGYRW-------AKKETGKWNITMED--A------ --------MDNTPLDPLLSFL---GQHD---------------------AVAEVEF----- ---------------------DIFGTGKVSRRAVPIKYLETS-EGK----VAVTTA----- ----FDLLLAQ-FAVGRPG--------LTGDYPKSYDDDMPYTPAWQEAYTGIGRDTVIRF -AREF------AGNAEATQGRSMVITGASLNHWYNNG-LCYRGPITALILCGCCGRNGG-G ---LNHYVGQEKLTLVA---AWTCWALGKDWIPPSRLQQTSTWHYANSDQWRYEGDFTDYA --------PIPRETRWAKGHAMDLLASAVRMGWMPS-----YPQFN-RNPFEVVKQAEAAG -AKT------DEQIVKWVVAQLKS---------------KQLRLAIEDVDAPE-NWPRTWL -IWRGNAMQS---SAKGAEFFLRHYLGTHDNAIA-----EEHAKGRVKDVVVREPAPRGKM -DLVCQLNFRMETTATYSDIVLPTAFW--YEKNDLNTTDLH-TFIHP----L-GAATPPAW -ESKTDYEIFKAIAKKVSELAPSVFQGPVKDIVMQPLAHDTPDELSQDYLAEMKVLDWGKG -EVDLIPGKTAPHFKIIERDY--ANLYNQWTSFGPKARENGIVGNGEHIDIKPFYDELLEN -PIDAQPDVRHMRCRVWGGQRYPGLEFAEEAANLLLHLSPESNGEVSYHAFKEGEHQ---- ------VGLPLADLAEGVR----G-VRMTYF-DLTRQVRRTLISPCWTGMVNDGRAYAAWC -LNVERLIPWRTLS------GRQHHYMDHPYYIDYGEQLMTHKPKLD--PRK--TGDIVR- ---------------SPVDDES-----------VVLNY-------------------ITPH -GKWHIHSTYYDNHRMLTLSR---------------GIEPCWLNDKDAARIGVKDNDWV-- ----------------EVYNDNGVMVTRAAVSARVQMGTCMVYHAPERT------------ ----ISIPK-SQVRGNRRGGAHNSLT---RTRINPMQMAGGYAQ---------WTYAFNYW -GPIGIFTRDTHVA----------------------------------------------- ----- ->AFN37207|Nitrolancea_hollandica_Lb ------------------------------------------------------------- ----------------------------------------------R------QW-EEFYR -NRWQH------DNITRSTHG-VNCTGGCSWMVFVKDGIITWEMQATDYPLLE-----PSL -PPYEPRGCQRGISASWYVYSPIRVKYPYMRGPLMD---------FWREARAQH-SDPIQA -WASIVQDEQKRQRWQRARGKGGYRRATWDECLELVASALLYTAKKY----GPDRC-AAFA -PIPAYSYLS------YGAGSRFFQL----------------------------------- ----FGGFNMSFYDWYADLPNSFPEVWGDQTDVCESADWYNSKFIVSNAANLNMTRTADVH -FVSEARHNGTKFVVIAPDFSQVAKYSDWWIPVKAG-QDQALWMGADHVILKEFYI----D -RQVPYFIDYQKRYTDGPMLVKVHQ----TKGGAYSMGQFLR---------ANRINRY--K -DVENGNWQLLVWDKQSGP-RLPKGCVGYRW-------ATKETGKWNISMED--A------ --------MDNTPLDPLLSFL---GQHD---------------------EVAQVEF----- ---------------------DIFGTGKVARRGVPIKYLETS-EGK-VAVTTAFDL----- -------LLAQ-FAVGRPG--------LTGDYPKSYDDDMPYTPAWQEAYTGIGRDTVIRF -AREF------AGNAEATQGRSMVITGASLNHWYNNG-LCYRGPIEAPILTGCCGRNGG-G ---LNHYVGQEKLTLVA---AWTTWALGRDWIPPSRLQQSPVWHYAHSDQWRYEGDFTDYA --------PIPRETRWAKGHAIDLLASAVRMGWMPF-----YPQFN-RNPLEIVKQAEAAG -AKS------DEQIVKWVVGQLKS---------------GNLRYAIEDIDAPE-NWPRTWV -IWRGNAMQS---SAKGAEFFLRHYLGTHDNAVA-----EEHAKGRVKDVVLRDPAPRGKM -DLVCDINFRMETTALYSDMVLPTAMW--YEKNDLNTTDLH-SFIHP----L-GAAVPPVW -EAKTDYEIFKAIAKKVSELAPSVFPQPVKDIISNPLIHDTPDELAQDYLSEMKVLDWGKG -EIDLIPGKTGPHLKIVERDY--VNLYNRWISFGPKARENGISGNGVHIDIKPFYDELLEN -PLDAQPDVRHMRCIEWGGGRYPRLEFAEEAANLLLHLSPETNGEVCYHAFKEEEKQ---- ------IGMPLADLAESIR----G-VRMNYF-DLTRQVRRTMISPCWTGMINDGRAYAAWC -LNVERLVPWRTLS------GRQHHYMDHPYYIDYGEQLMTHKPKLDPRKTG--DIVRSP- ----------VDDES------------------VVLNY-------------------ITPH -GKWHIHSTYYENHRMLTLSR---------------GIEPCWINDKDAARIGIKDNDWV-- ----------------EVYNDNGVMVTRAAVSARVQMGTCMIYHAPERT------------ ----ISIPK-SQVRGNRRGGAHNSLT---RTRINPMQMAGGYAQ---------WTYMFNYW -GPIGIFTRDTHVAVR--------------------------------------------- ----- ->AFN37206|Nitrolancea_hollandica_Lb ------------------------------------------------------------- ----------------------------------------------R------QW-EEFYR -NRWQH------DNITRSTHG-VNCTGGCSWMVFVKDGIITWEMQATDYPLLE-----PSL -PPYEPRGCQRGISASWYVYSPIRVKYPYMRGPLMD---------FWREARAQH-SDPIQA -WASIVQDEQKRQRWQRARGKGGYRRATWDECLELVASALLYTAKKY----GPDRV-TAFA -PIPAYSYVS------FGAGARFIQL----------------------------------- ----FGGFHLSFYDWYADLPNSFPEVWGDQTDVCESADWYNSKFIVSNAANLNMTRTADVH -FVSEARHNGTKFVVLAPDFSQVAKYSDWWIPVKAG-QDQALWMGADHVILKEFYI----D -RQVPYFIEYQKRYTDGPMLVKVHQ----TKGGAYSMGQFLR---------ANRINRY--K -DVENGNWQLLVWDKQSGP-RLPKGCIGYRW-------AKKETGKWNITMED--A------ --------MDNTPLDPLLSFL---GQHD---------------------AVAEVEF----- ---------------------DIFGTGKVSRRAVPIKYLETS-EGK----VAVTTA----- ----FDLLLAQ-FAVGRPG--------LTGDYPKSYDDDMPYTPAWQEGYTGIGRDTVIRF -AREF------AGNAEATQGRSMVITGASLNHWYNNG-LCYRGPITALILCGCCGRNGG-G ---LNHYVGQEKLSLVS---AWQSWALAKDWFPPSRVQQSSTWHYAHSDQWRYEGDFTDYA --------PIPRETRWAKGHAMDLLASAVRMGWMPM-----YPQFN-RNPLELVKQAEAAG -AKS------DEQVVEWVVGQLKS---------------GNLRYAIEDVDAPE-NWPRVWL -IWRGNAFQS---SAKGAEYFLRHYSGTHDNAVA-----EEHAKGRVKDVVFREPAPRGKF -DLLCDLNFRMDTTALYSDIVLPTAMW--YEKNDLNTTDLH-TFIHP----L-GAAVPPVW -EAKSDYEIFKSLAKKVSELAPSVFPQPVKDIVSNPLAHDTPDELSQDYLAEMKVLDWGKG -EIEMIPGKTAPHFKIVERDY--VNFYNRWISYGRKARENGIVGNGVHIDIKPFYDELLEN -PLDAQPDVRHMRCIEWGGQRYPRLEFAEEACNLIMFLAPESNGEVCYHAFKEEEKQ---- ------LGLPLADLAEAVR----G-VRMNFF-DLTRQVRRTLISPCWTGMVNDGRAYSAWC -LNVERLIPWRTLS------GRQHHYMDHPYYIDYGEQLMTHKPKLD--PRK--TGDIVR- ---------------SPVDDES-----------VVLNY-------------------ITPH -GKWHIHSTYYDNHRMLTLSR---------------GIEPCWLNDKDAARIGIKDNDWV-- ----------------EVYNDNGVMVTRAAVSARVQMGTCMIYHAPERT------------ ----ISIPK-SQVRGNRRGGAHNSLT---RTRINPMQMAGGYAQ---------WTYMWNYW -GPIGILTRDTHVAVR--------------------------------------------- ----- ->WP_005004540|Nitrococcus_mobilis ------------------------------------------------------------- --------------------MG--------------WIQDLINPKTR------RW-EEFYR -NRWQH------DNIFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLGRGEGGRGI -PPYEPRGCQRGISASWYVYSPIRVKYPYGKGVLLD---------FWREARSSH-NNPVEA -WSSIVTDENKRKRWQKARGKGGYRRTTWDELLELIASACLYTAQKY----GPDRV-MGFS -PIPAMSMLS------YAAGSRFLQL----------------------------------- ----FGGVNMSFYDWYADLPNSFPEIWGDQTDVCESADWYNSKFIVSMASNLNMTRTPDVH -FISEARHEGAKFVVLAPDFSQVSKYADWWIPVKKG-EDLGLWMAAGHVIYTEFYV----K -RQVPYFIDYVTRYTDMPFLVKLE-----KDGDGYRPGRYLT---------SEEVKKY--K -KQENAAWKQLVFDRKSNEARCPKGQIGHRH---------GKHGQWNLKMEDG-------- --------LDNSPIEPVLSFL--GESDD---------------------VAMVQFY----- ----------------------EFASQTVYKRGVPAKKIDTG-SGSVLVATV--------- ----YDLNMGQ-YAVNRGL---------PGDYPESYDDLKPYTPAWQEQFSGIGRQTVIRF -AREF------AGTAEKTKGRSMVIVGASANHWYHNN-HIYRAAINCLIACGCCGRNGG-G ---MNHYVGQEKLAIVA---PWNALALAGDWGIKPRLQQSPVWHYVNSDSWRYEGSFEEYA --------PSPPNAKWAKGHSVDLVAKSVRMGWMPH-----YPQFN-RSPLEVAREAEKAG -AKD------DKGMADYVVQALKK---------------KNLSFSVDDPDAPE-NWPRVWF -IWRGNAMQS---SAKGAEFFLRHYLGTHDNAVA-----EERAKPHVKHVKFREPAPRGKF -DLVVDINFRMDSTALYSDIVLPTAFW--YEKNDLNSTDLH-SFIHP----L-GQAVPPVW -ESKSDWDIFKAFAKKISEMAPSVFSEPFKDVVAAPLTHDTPDEIAQRD-----VKDWLEG -ECEPIPGKTMPHFRVVERDY--SLLYNKYISLGSAIRENGISGNGCSFPITKQYDELTNQ -PVGGSPDPRHRRAVEWGGKRYPCVEDALDAANVLLYLAPETNGEVAYQAFKSEQEH---- ------CGVPLTDLAEPYR----G-HQVTFY-DLTRQPRRLLCSPVWTGNCGDGRAYSAWT -LQIDRLVPFRTLT------GRQHIYIDHPWYMDFGEHLCTYRPKLDYKKIHDLDNSPID- ------------------------------DKTLILNY-------------------ITPH -GKWNIHSTYKDNHRMLTLSR---------------GMDPVWINDKDAARVGLKDNDWV-- ----------------EVYNDNGVIVTRANVSRRVQSGMCLYYHAVE-------------- ---RTIYIPKSQIRGGRRAGGHNSVT---RTRINPVYLAGGNAQ---------FTYLFNYW -GPTGIMTRDTHVAVRKLE-------KLEW------------------------------- ----- ->Nitrococcus_mobi_EAR23355 ------------------------------------------------------------- --------------------MG--------------WIQDLINPKTR------RW-EEFYR -NRWQH------DNIFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLGRGEGGRGI -PPYEPRGCQRGISASWYVYSPIRVKYPYGKGVLLD---------FWREARSSH-NNPVEA -WSSIVTDENKRKRWQKARGKGGYRRTTWDELLELIASACLYTAQKY----GPDRV-MGFS -PIPAMSMLS------YAAGSRFLQL----------------------------------- ----FGGVNMSFYDWYADLPNSFPEIWGDQTDVCESADWYNSKFIVSMASNLNMTRTPDVH -FISEARHEGAKFVVLAPDFSQVSKYADWWIPVKKG-EDLGLWMAAGHVIYTEFYV----K -RQVPYFIDYVTRYTDMPFLVKLE-----KDGDGYRPGRYLT---------SEEVKKY--K -KQENAAWKQLVFDRKSNEARCPKGQIGHRH---------GKHGQWNLKMED--G------ --------LDNSPIEPVLSFL--GESDD---------------------VAMVQFY----- ----------------------EFASQTVYKRGVPAKKIDTG-SGS----VLVATV----- ----YDLNMGQ-YAVNRGL---------PGDYPESYDDLKPYTPAWQEQFSGIGRQTVIRF -AREF------AGTAEKTKGRSMVIVGASANHWYHNN-HIYRAAINCLIACGCCGRNGG-G ---MNHYVGQEKLAIVA---PWNALALAGDWGIKPRLQQSPVWHYVNSDSWRYEGSFEEYA --------PSPPNAKWAKGHSVDLVAKSVRMGWMPH-----YPQFN-RSPLEVAREAEKAG -AKD------DKGMADYVVQALKK---------------KNLSFSVDDPDAPE-NWPRVWF -IWRGNAMQS---SAKGAEFFLRHYLGTHDNAVA-----EERAKPHVKHVKFREPAPRGKF -DLVVDINFRMDSTALYSDIVLPTAFW--YEKNDLNSTDLH-SFIHP----L-GQAVPPVW -ESKSDWDIFKAFAKKISEMAPSVFSEPFKDVVAAPLTHDTPDEIAQRD-----VKDWLEG -ECEPIPGKTMPHFRVVERDY--SLLYNKYISLGSAIRENGISGNGCSFPITKQYDELTNQ -PVGGSPDPRHRRAVEWGGKRYPCVEDALDAANVLLYLAPETNGEVAYQAFKSEQEH---- ------CGVPLTDLAEPYR----G-HQVTFY-DLTRQPRRLLCSPVWTGNCGDGRAYSAWT -LQIDRLVPFRTLT------GRQHIYIDHPWYMDFGEHLCTYRPKLDYKKIH--DLD---- -------------------------NSPIDDKTLILNY-------------------ITPH -GKWNIHSTYKDNHRMLTLSR---------------GMDPVWINDKDAARVGLKDNDWV-- ----------------EVYNDNGVIVTRANVSRRVQSGMCLYYHAVERT------------ ----IYIPK-SQIRGGRRAGGHNSVT---RTRINPVYLAGGNAQ---------FTYLFNYW -GPTGIMTRDTHVAVRKLE-------KLEW------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_1443778_1 rank: C; mox:DAMO_0778 narG; Nitrate reductase, alpha chain; may be more similar to a nitrite oxidoreductase; K00370 (db=kegg) ------------------------------------------------------------- ---------------------------------MS-WIEDIISPNTR------KW-EEFYR -NRWQY------DKVVRSTHG-VNCTGGCSWAIHVKDGIVVWEMQQLDYPQFN-----KDV -PPYEPRGCQRGISYSWYLYSPIRVKYPIIRGALID---------LFRE------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------E ------------------------------------------------------------- ------------------------------------------------------------- --------KKKCG------------------------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------G ------------------------------------------------------------- -----------------------------------------DPVLA--------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------------------------W--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------------ANLQADDTK------------ ---------------------------RKRYQRA--------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->Nitrobacter_winogradskyi_gb_ABA05326 ------------------------------------------------------------- ---------------------------------MS-WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRVKYPYIRGPLAD---------LWHEAKASY-PDPVQA -WASLVEDEEKRNRIQKARGKGGFRRAKWEELIELIAASCLYTARKH----GPDRV-MGFS -PIPAMSMLS------FAAGTRFLSL----------------------------------- ----FGGGLMSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMASNMNMTRTPDVH -FISEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYI----D -RQVPYFIDYVKRYTDLPFLVELEP-----NGNTYKTGRLLR---------SNRVARY--K -DVENGEWKMLVLDTATGEPRAFKGQVGDRW--------GSTHGKWNLSAED--T------ --------LDNSPIDPVLSFI------D--------QSDGVVQVGFD--DFVNGSV----- -----------------------------VSRGVPVKRIATD-KGE----VLVTTG----- ----FDIMMSQ-FGHSRGL--------EGSFATSYDDEDAPYTPAWQERHTGIGRETAIRF -AREF------ATNAELTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWSTVAMALDWNKPPRVVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPRWAKGHAIDLEAKSVRCGWMPF-----TPNFH-RNPIEVVAEAERAG -AKS------TADIATYVADQVAS---------------KKLDLAINDPDAEE-NWPRVWF -IWRANAIQS---SAKGHEFFLRHYLGAHDNVIA-----EERAKGKTTTVKYRDTAPQGKY -DLVVDINFRMNTTGLYSDIILPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWEIFKLIAKKVSELSPLAFSKPVRDIVLQPLMHDTPDELAQPE-----ILDWAEG -ECKLVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGISAVGVNIPIKKQYDQMLEN -PIMPMPDSRHMRCVEWGGKRYPSLEDVLDACNVVLLCAPVANGEVSYQGFVNEEQH---- ------VGLPLADIAEPTR----G-VSSTFY-DLTRQPRRILTSPCWTGLVNDGRAYSAWC -MNIERLVPWRTLT------GRQSLYLDHQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- --------------------------SRVDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRLLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RIRINPLFLAGGYAQ---------FTYGWNYW -GPTGIFTRDTHVVVRKME-------KVEW------------------------------- ----- ->WP_011314088|Nitrobacter_winogradskyi ------------------------------------------------------------- ---------------------------------MS-WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRVKYPYVRGPLYD---------LWKEAKASH-PDPVQA -WASLVGDEQKRSRIQKARGKGGFRRAKWEELVELIAAAALYTARKY----GPDRV-MGFS -PIPAMSMLS------YAAGSRFLQL----------------------------------- ----FGGVNMSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMAANMNMTRTPDVH -FISEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYI----D -RQVPYFIDYVKRYTDLPFLVELEP-----NGNTYKTGRLLR---------SNRVARY--K -DVENGEWKMLVLDTATGEPRAFKGQVGDRW--------GSTHGKWNLSAED--T------ --------LDNSPIDPVLSFI------D--------QSDGVVQVGFD--DFVNGSV----- -----------------------------VSRGVPVKRIATD-KGE----VLVTTG----- ----FDIMMSQ-FGHSRGL--------EGSFATSYDDEDAPYTPAWQERHTGIGRETAIRF -AREF------ATNAELTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWNTIAMALDWTKPPRVVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPRWAKGHAIDLEAKSVRCGWMPF-----TPHFN-RNPIELAAEAERAG -AKS------TADIVTHVVDQVAS---------------KKVNFAIDDPDAEE-SWPRMWF -IWRGNAIQS---SAKGHEFFLRHYLGAHDNSIA-----EDRAKGKTQRVKYRDTAPRGKY -DLVVDLNFRMNTTSLYSDIVLPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWEIFKLISKKVSELSPLAFSKPVRDVVVQPLMHDTPDELAQPE-----ILDWAEG -ECKPVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGVSAVGVNIPIKKQYDQMLDN -PIMPMPDARHMRCVEWGGKRYPSLEDVLDACNTLLMCAPEANGEVCYQGFHNEEHH---- ------VGLPLVDIAEPTR----G-VSSTFY-DLTRQPRRILTSPCWTGLTNDGRAYSAWC -MNVERLVPWRTLT------GRQSLYLDHQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- --------------------------SRVDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRMLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RTRINPLFLAGGYAQ---------FTYGFNYW -GPTGIFTRDTHVVVRKME-------KLEW------------------------------- ----- ->Nitrobacter_sp_Nb_311A_ZP_01048070 ------------------------------------------------------------- ---------------------------------MS-WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRVKYPYIRGPLYD---------LWREAKASH-PDPVQA -WASLVGDEQKRLRMQKARGKGGFRRAKWEELVELIAAAALYTARKW----GPDRV-MGFS -PIPAMSMLS------YAAGSRFLQL----------------------------------- ----FGGVNMSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMAANMNMTRTPDVH -FIAEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYI----D -RQVPYFIDYVKRYTDLPFLVELEP-----NGNTYKTGRLLR---------AKRVARY--Q -DVENGDWKMLVLDSKTGEPRAFKGQVGDRW--------GSTHGKWNLSAED----TLDNS -PIDPVLSFIDQSDGVVQVGF------D---------------------DFVNGSV----- -----------------------------VSRGVPVKRIATD-KGEVLVTTG--------- ----FDIMMSQ-FGHSRGL--------EGSFATSYDDENAPYTPAWQERHTGIGRETAIRF -AREF------ATNAELTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWNTIAMALDWTKPPRVVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPRWAKGHAIDLQAKAVRSGWMPF-----TPHFN-RNPIELAAEAERAG -AKS------TDDIVTHVVDQVAS---------------KKVNFAIDDPDAEE-SWPRMWF -IWRGNAIQS---SAKGHEFFLRHYLGAHDNSIA-----EDRAKGKTQRVKYRDTAPRGKY -DLVVDLNFRMNTTSLYSDIVLPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWEIFKLIAKKVSELSPLAFSKPVRDVVVQPLMHDTPDELAQPE-----ILDWAEG -ECKPVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGVSAVGVQIPIKKQYDQMLDN -PIMPMPDPRHMRCVEWGGKRYPSLEDVLDACNTLLMCAPEANGEVCYQGFHNEEHH---- ------VGLPLVDIAEPTR----G-VSSTFY-DLTRQPRRILTSPCWTGMTNDGRAYSAWC -MNVERLVPWRTLT------GRQTLYIDSQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- --------------------------SRVDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRMLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RTRINPLFLAGGYAQ---------FTYGFNYW -GPTGIFTRDTHVVVRKME-------KLEW------------------------------- ----- ->A_Nitrobacter_hamburgensis_YP_578638 ------------------------------------------------------------- --------------------MS--------------WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRVKYPYIRGPLLD---------MWREAKASS-ADPVQA -WGALIGDEQKRSRIQKARGKGGFRRAKWEELVELIAAASLHTARKH----GPDRI-MGFS -PIPAMSMLS------FAAGTRFLSL----------------------------------- ----MGGSLMSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMASNMNMTRTPDVH -FISEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYV----D -RQVPYFVDYIKRYTDLPFLVELES-----NGNTYKTGRLLR---------SNRVPRY--K -DVENGDWKMLLLDANSGELRAPKGQVGDRW--------GSVHGKWNLSGED----TLDNS -PLDPVLSFIDRSDDVVQVGF------D---------------------DFANGRI----- -----------------------------VSRGVPVKRVATD-KGEILCATG--------- ----FDIMMSQ-FGISRGL--------EGAFATSYDDEDAPYTPAWQERHTGIGRETAIRF -AREF------ATNAELTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWATVALALDWAKPPRLVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPKWAKGHAIDLEAKAVHNGWMPF-----TPHFN-RNPIEVAAEAERSG -AKN------VQDIETYVVDQVVS---------------KKLQMAIDDPDAAE-NWPRMWF -IWRGNAIQS---SAKGHEFFLRHYLGAHDNAIA-----EDRAKGKAQVVKYHETAPRGKY -DLVIDLNFRMNTTSLYSDIVLPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWEIFKLIGKKVSELAPLAFSKPVRDVVLQPLMHDTPDELAQPE-----ILDWSLG -ECKAVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGISAVGVQIPIKKQYDQMLDN -PIMPMPDPRHMRCVEWGGKRYPSLEDVLDACNTVLLCAPEANGEVCYQAFHNEEHH---- ------VGLPLVDLAEPNR----N-VAATFY-DLTRQPRRIITSPCWTGMVNDGRAYSAWC -MNVERLVPWRTLT------GRQSLYLDHQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- -----SR---------------------VDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRMLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RTRINPLFLAGGYAQ---------FTYGWNYW -GPTGILTRDTHVVVRKME-------KLEW------------------------------- ----- ->B_Nitrobacter_hamburgensis_YP_578186 ---------------------------------------------------------MTTG -LAAGQR--------TEETQMS--------------WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRIKYPYVRGPLLD---------MWREAKASS-ADPVQA -WGALVGDEQKRARMQKARGKGGYRRAKWEELVELIAAASLHTARKH----GPDRI-MGFS -PIPAMSMLS------FAAGTRFLSL----------------------------------- ----MGGSLLSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMASNLNMTRTPDVH -FIAEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYV----D -RQVPYFIDYVKRYTDLPFLVELEP-----NGTTYKTGRLLR---------ARHVPRY--K -DVENGDWKMLLLDANSGELRAPKGQVGDRW--------GSVHGKWNLSGED----TLDNS -PLDPVLSFIDRSDDVVQVGF------D---------------------DFANGRI----- -----------------------------VSRGVPVRRIATD-KGEILCATG--------- ----FDIMMSQ-FGISRGL--------EGAFATSYDDEDAPYTPAWQERHTGIGRETAIRF -AREF------ATTAEYTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWASIALALDWSKPPRVVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPRWAKGHAIDLEAKAVRSGWMPF-----TPHFN-RNPIEVAAEAERAG -AKS------TEDIATHVIDQVAS---------------KKLNLAIEDPDAAE-NWPRLWF -IWRGNAIQS---SAKGHEFFLRHYLGTHDNAIA-----EDRAKGKTHTVKYHDTAPRGKY -DLVVDLNFRMDTSSLYSDIVLPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWDIFKLIAKKVSELAPLAFSKPVRDVVLQPLMHDTPDELAQPE-----ILDWAEG -ECKPVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGVSAVGVNVPIKKQYDQMLDN -PIMPMPDPRHMRCVEWGGKRYPSLEDVLDGCNTVLLCAPEANGEVCYQAFHNEEHH---- ------VGLPLVDLAEPTR----N-VATTFY-DLTRQPRRLLTSPCWTGMMNDGRAYSAWC -MNVERLVPWRTLT------GRQTLYIDHQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- --------------------------SRVDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRMLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RTRINPLFLAGGYAQ---------FTYGWNYW -GPTGILTRDTHVVVRKME-------KLEW------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0000472_14 rank: A; doe:DENOEST_1434 s25dA; putative steroid C25 dehydrogenase-like alpha-subunit; K24713 (db=kegg) --------------------------------------MGQRSTWGVVSESRRRFLVKAGL -ASAAGA--------AINLNLFGCGRSHAPLQHFKGTTAGHFDLGPRTTPKLGNW-QDLYR -QRWTW------DKVVKGSHGWANCRSACEWDLYVKDGIVVREEQSATYEASE-----PGV -PDFNPRGCQKGACYTEVMYGPSRTTVPLKRVG---------------------------- -----------------PRGSGQWEKISWEQAIKEIAQKTVDAVTEF----GTDTVFQDLG -PNFDFGPST--------AGRFKFMYQAGSLFADM-------------------------- ---------WGEI---GDLNFGATMALGAAQIGGSSDEWFLSDFIVVWMMNPSVTQIPDAH -FLYEARYNGTELVVIDPQYSATAIHADQWLPIETG-TDAALGLAVARHLFEVNAI----D -------LPFVREQTDLPLLVRLDTGRFLRETDLNSG------------------GNA--- ----------------------------------------DQLYLWHPQKNAPVFAPGC-- --------TGNTTRKLTLDFE----------------------------APIDGQW----- -------------------------------------TIKLH-DGKEVAIAPVGAL----- ----LKEHLEP-WTFEHTA-----------------------------SVTHLHVDQVKKF -AEGW-----------AKCQRPMVLSSWGSNRFVHSD-LMNRSKILCLMLKGALGKKGT-G ----YQATGIVDMEGFNNAMQMDHEGVR--------------------------------- -------------------------------GRLGALLGIMPPADLFQAVLDIVMQRKTEG -DVAL-----ETEMNYL-----KHHLCSSDVMESNFKAPGYRAAVVKEHEGMLPRSLESYY -QEARQKDWS---QGLPRKAPVKVYFSGGANILRRSNMP-----------QYYKTFIWDEM -QCIVDINPKYSFTGTQSDYILPAAGW--YEKAGIKYTMSYVPYLH-----YCDVAVPPLG -ESKGEWEIFWLLTREMERYA---------------------------------------- ---KEKNLPVLDGCGRGSNDF--KTLHQRYSNQGELGQ----------------------- --------------------------------HDDEKVMKEILHGDATEGMTIEGLKQTGI -AKFTSAGKPVAADAINNP----D-WKGEGV-MTTLTRFTVHKEPWPTYS----------- --------------------GRITSFIDHPWFIEMREQFPIHKDSPKAGG----------- ---------------------------------------------------DYPFQFVSCH -ARWSIHSTWRDTPMMLRLQR---------------GEPLVYINPIDAERVGVKDFEYV-- ----------------EIFNNYGSVRMRVKVAAMVRPGVAYYYHAWE-------------- ---------------PHQFPNHQSFKWLIPGLVNPLYMAGGYGQ---------INHAMNRY -QPG-SAVQDTRIGIR------------PW---HGQATGAHPVKRPEAAATSK-------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001772_1 rank: C; doe:DENOEST_1434 s25dA; putative steroid C25 dehydrogenase-like alpha-subunit; K24713 (db=kegg) --------------------------------------MGNLIKTGIASASRRKFLVMAGA -ASAAGA---------ALSLFGCGRAPLQH--FKGTTASGRFDLGPRTAPKLGNW-QDLYR -QRWTW------DKVAKGSHGWANCRSACEWDLYVKDGVVVREEQSATYEASE-----PGI -PDFNPRGCQKGACYTEVMYGPSRTTVPLKRVG---------------------------- -----------------SRGSGKWEKISWEQAMKEIAQKTVDAAEKW----GTDTIYQDLG -PNFDFGAST--------AGRFKFQF----------------------------------- ---MAGGVFADNWAEIGDLNVGASITTGAAHLGGSSDEWFLSDFIIVWMMNPSVTQIPDAH -FLYEARYNGTELVVIDPQYSATAIHADQWLPLESG-TDAALGLAVARHLLETGAI----D -------LPYIREQTDLPLLARLDTGRFLRESEMVNG------------------GNA--- ----------------------------------------DQLYMWHPQKNAPVPAPGC-- --------LNNTTRNLKLDFE----------------------------PPIDGQW----- -------------------------------------KVKLA-DGKEVGVVPVGAM----- ----LKEHLDS-WTFEHAA-----------------------------KVTHLHIDQIKKF -AEGW-----------AKAQRPMVLSSWGSNRYVHSD-LMNRTKLLLLMLKGAMGKKGA-G ----------YQATGWV-------------------------------------------- ----------------------------------------------DLDGFGNAMQMEKSG -MT------------------------------------GRLAVMLNAM------------ ---------P--------------------------------------------------- ------------------------------------------P------------------ ------------------------------------------------------------- -----------------------KELFNA-------------------------------- --------------------------------VVDIIKKRKTEGDVALEG----------- ----------------ENN----Y-LRTK-------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------LCTSDVVEVNLKSDGY--- -----------------------RAALNKEQKGLYPHELDEYYKEAHD------------- -----------------------------KGWAP--------------------------- -----GLPRKAPPKIFF-------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_3 rank: A; ag:AFF61325 s25dA; steroid C-25 hydroxylase alpha subunit (EC:1.17.99.10); K24713 (db=kegg) -----------------------------------------------MSISRRHFIVGSAV -AVAGVG------------LYS--LRPKKP--VVYPVGVRAPKVAAR-KVHYNDY-SDIWR -EKWKW------DKVVKGTHTRANCCAACSWDVYVRDGIAWREEQAAIYEPHR-----PDV -PDFNPRGCQKGACYTQLQVSEARVKYPLKCVG---------------------------- -----------------ERGEGKWKRVSWDTALDEIADRLIDIAVRDGTESIIFDDTTNVG -YGPE-----------TAGDVRFAAA----------------------------------- ----IQATRLDSWSGVGDMPNGLIQTWGLYNCEGTSDDWYLSDYIVIWVGNPNYTRIPDAH -FLHEARYRGAKLVVVAPDLNPSTAHADLWINVNAE-TDSALALSCAQVMIAEKLY----K -------KDYVLQQTDFPFLVRKDDQRFLRAADMVKG--------------GAD------- ----------------------------------------NALYLWDEAKHAPVIAPGCEG --------DGDGGRIMALGGI------K---------------------PALSGTF----- -------------------------------------KVTTQ-DGKTVEVQTVFDM----- ----IRAKLDAEYTPEQAA-----------------------------KITGLHPNVIRTF -AREM-----------AAAPKAMIIASYGSCKHYHHD-LNQRSFVLLMNLTGNQGQQGG-G ----------YRISAW-----WAMDGLD--------------------------------- -------------------------------QMADSTVPLKDMLRIIPKAIRGLSPRDYEG -LFTEYSDKEGHTPALLFLY--LH---------------GGYKEMWDKPHLQDPALPRPF- ---ADYVQES---IDKGW-SKVHPPLGREPRAYI---FTGGNPLRRWPSPQIAKQHLWPKF -ELVVSVNFRMSTSSLFSDYVLPVAAY--YEKYGIKYAQTYVPYIIT----S-DKATEPLG -ESKSDWETFGLLSKHVAERARVRGVTMVRGL----------------------------- ----------------KDVLFDLSKAYEVHTHHG--------------------KYDP--- ----------------------------TDPEDPIKLMDAIFANSPSIGCNTGREALDMGA -VPVIGTGRPSLIDQNYSP----YDPKDTYW-PHKDFIDKKIAWPTLT------------- --------------------GRQQFYIDHPWFLEGKEHLPTFKPSIHANSKF--PLRMYG- -----------------------------------------------------------GH -NRWSIHAVWRDVKLLLRLQR---------------GQPACWLNPKEAEKRGIKDGDMV-- ----------------RVFNDHGTCECMVKVSAITAPGEVIIYHAW--------------- ----------EPYQFKKWQGNQEPVE---APW-KALHLAGGYAQ---------LHWRVYYH -GPN-HSPRGAPVEVEKIGYEGG-------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_4 rank: C; ag:AFF61325 s25dA; steroid C-25 hydroxylase alpha subunit (EC:1.17.99.10); K24713 (db=kegg) -----------------------------------------------MQISRRGFIVGSAV -AAAGVG--------LYSLKSK--KAVIKPGITLP-DKTPAKKIKYN------DY-SDIWR -EKWKW------DKVVKGTHTRANCCAACSWDVYVRDGIAWREEQNAIYEPPR-----PGI -PDQNPRGCQKGACYTALQLSESRVKYPLKRAG---------------------------- -----------------NRGEGKWKRISWDEALTEIADKLLDIAVAEGTETICFDDLSNTG -YGPETAGDFR-----FSTGMQVSRL----------------------------------- ----------DGWSGVGDMPLGVIQTWGAFNCEGTSDDWFRSDYIVIWLGNPSYTRIPDAH -FLHEARYRGAKLVVVAPDLNATTVHADMWLNVKPE-TDAALGLACAQIMISENLY----K -------KDYVLEQTDFPFLVRKDNQRFLRVSDVVKG--------------GAD------- ----------------------------------------NAFYLWDEAKNAIAMAPGCEG --------DGDGGRSLKLGAL------K---------------------PALSGTR----- -------------------------------------SVKLA-DGSTVECITVFDM----- ----IKERLDKEHTPEQAA-----------------------------KITGLHPNVIRTF -AREM-----------AAAPSAMIIASYGACKHYHSD-LFQRSFILLMNLTGNQGKPGG-G -MRVAAWWGMDGLDAMA----DSTIPMA--------------------------------- -----------------------------------------DMMKIIPKAVRGLTPRDYES -LYTDYSNREGHTPTMVFLY--VH---------------GGYKELWDKPYLQDPNLPRNI- ---SSYMRES---IDKGW-TKVHPPENKSPKAYI---FTGGNPLRRWPSPQIAREKLWPKF -DLVCSVTFKMSTSTLWADYVLPVAAY--YEKYGIKYAQSYVPYIIS----S-DKATEPLG -ESKSDWETFGLMAKKVAERAKARNITMVRGL----------------------------- ----------------DDKPFDVSKVYDFYTGNG--------------------KYDP--- ----------------------------TDPEDPVRLMDEIFAGSPNVACNSAREALQRGA -VPVTGPGRPSLINQNYSD----YDGKDTYW-PHRDFIEKKVAWPTIT------------- --------------------GRQQFYIDHPWFIEGKEALPTHKAPPLATSKF--PLRMYG- -----------------------------------------------------------GH -NRWSIHSIWRDVKLLLRLQR---------------GQPAAWMNPAELQKRGLKDGDMV-- ----------------RVYNDHATFECNIKSSPATAPGEIIVYHAWEPFQFK--------- -----------------KWQSNQEVT---EAPVKGLHLAGGYTQ---------LHFRVYYG -SMH-HTPRGAAVEVEKAPT----------------------------------------- ----- ->NASQAN2015_111_B_bin.76_k121_226837_116 rank: A; sdf:ACG33_10685 putative steroid C25 dehydrogenase (S25dA4); K24713 (db=kegg) -----------------------------------------------MSVSRRQFLAHSAL -AGAALA-----------------LQHGDA------LADALTR-PYR------RI-EDIWR -KKWTW------DRVAHGTHG-TNCAGTCAFNVYIRNGVVWREEQQAEYERSGT----PDV -PDYGPRGCNKGLRHARYMYGKQRVLYPMKRVG---------------------------- -----------------KRGEGKWQRISWDQATREIAEKFIEVAVKH----GPDSITLGSG -TQLAVKMAS------YSALARFSNI----------------------------------- ----TGVTVPEFYSGVGDLPTGFYMTTGLTYLGDTMAAVFKSKCVLVWMANPAVTRIPDAH -FFWEAKYNGTEVVTISPEFTPTAMHSSKWLNIKPG-TDTALAMAMVHTIIEEKLY----D -------AAYIREQTDLPFLVREDNGEFLRAEDLN----------------LVDMLAV--- ---------------------------RENV-----------FYLWDQKTRRIVRAPGTGA -AEAPVGRRRRKFETIALGNI------E---------------------PALEGRW----- -------------------------------------TVETR-TGK-VTVTTVFAL----- ----LRKRATE-HSPEKMS-----------------------------TETGLNPKAMRTV -AREF----------AKAGQRAMIYAGFSACKWLHGD-ILQRSMVLLCALTGATGHEGG-G ---VQMANGPKSRGITS--FAFAGVGAA--------------------------------- ------------------------SRVVASTLWDYD-----HGKMKQLNEKIYGKKLA--- ----------DEFDSHY-----QH------------------------------SLEEDWF -------PQY---GKNGWKMGIFAGENGANWRAS--------------GNRWRTEAF-EKL -EMIVALVPDAGITMHHADIVLPIAHH--YERADIMLQSRH-PYVQV----L-DTAVKPLG -EAVDDFEALRRVSAAISTIAREKATPAIKDD----------------------------- ----------------VDGRTFRRDLKRT-----------------------LELYTM--- ---------------------------DGAIRDSRDIVQFIINATPGIPKMSFAELAAKGI -VRVDESRDSTVW----------NSDESPFHADIAESVHEKR--PYETLT----------- --------------------GRQQFYIDHEWFLKFDEALPVYHPPLKQQGYP--LQMTMG- ------------------------------------------------------------H -ARHGIHSMWRDDSFLVSLQR---------------GEPDIYVNPDDAAARKVRDGDLI-- ----------------EVFNDAGSFVCMAHLSAGIMPGTLYMYHGWD-------------- -------------PTMFRGRQNFAAVIPTAGLVKPTSVAGDYGH---------LGYRVLAY -APN-QTYRDFTCEFKLYS-------RGKV---TAAKARIA-------------------- ----- ->icacos_2019_sw_WHONDRS-S19S_0094_F_bin.26_scaffold_99_5 rank: A; sdf:ACG33_10685 putative steroid C25 dehydrogenase (S25dA4); K24713 (db=kegg) -----------------------------------------------MSVNRRQFLAHSAL -AGAALA-----------------LQHGDA------LADALTR-PYR------RI-EDVWR -KKWTW------DRVAHGTHG-TNCAGTCAFNVYIRNGVVWREEQQAEYERSGT----PDV -PDYGPRGCNKGLRHARYMYGKQRVLYPMKRVG---------------------------- -----------------KRGEGKWQRISWDQATREIAEKFIEVAVKH----GPDSITLGSG -TQLAVKMAS------YSALARFSNI----------------------------------- ----TGVTVPEFYSGVGDLPTGFYMTTGLTYLGDTMAAVFKSKCVLVWMANPAVTRIPDAH -FFWEAKYNGTEVVTISPEFTPTAMHSSKWLNIKPG-TDTALAMAMVNTIIEEKLY----D -------AAYIREQTDLPFLVREDNGEFLRAEDLN----------------LVDMLAV--- ---------------------------RENV-----------FYLWDQKTRRIVQAPGTGA -AEAPVGRRRRKFETIALGNI------E---------------------PALEGRW----- -------------------------------------NVETR-TGK-VTVTTVFAL----- ----LKKRAAE-HSPEKMS-----------------------------AETGLNPNAMRTV -AREF----------AKAGKRAMIYAGFSACKWLHGD-ILQRAMVLLCALTGATGHEGG-G ---VQMANGPKSRGITS--FAFAGVGAA--------------------------------- ------------------------SRVVASTLWDYD-----HGKMKQLNEKIYGKKLA--- ----------DEFDSHY-----QH------------------------------SLKEDWF -------PQY---GKNGWKMGIFAGENGANWRAS--------------GNRWRTEAF-EKL -EMIVALVPDAGITMHHADIVLPIAHH--YERADIMLQSRH-PYVQV----L-DQAVKPLG -EAVDDFEALRRVSAAISAIAREKGTPAIKDD----------------------------- ----------------VDGRTFRRDLKRT-----------------------LELYTM--- ---------------------------DGAIRDSRDIVQFIINATPGIPKMSFAELAAKGI -VRVDESRGSTVW----------NSDESPFHADIAESVHEKR--PYETLT----------- --------------------GRQQFYIDHEWFLKFDEALPVYHPPLKQKGYP--LQMTMG- ------------------------------------------------------------H -ARHGIHSMWRDDSFLVSLQR---------------GEPDIYVNPDDAAARKVRDGDLI-- ----------------EVFNDGGSFICMAHLSAGIMPGTLYMYHGWD-------------- -------------PTMFRGRQNFAAVIPTAGLVKPTSVAGDYGH---------LGYRVLAY -APN-QTYRDFTCEFKLHS-------RGKV---------------------------TAAK -VRIA ->NASQAN2014_190_B_bin.96_k121_3766_2 rank: A; sdf:ACG33_10685 putative steroid C25 dehydrogenase (S25dA4); K24713 (db=kegg) -----------------------------------------------MSVNRRQFLTHSAL -AAGAAL--------ALHHGAA--------------MADALSR-PYR------RI-EDVWR -KKWTW------DRVAHGTHG-TNCAGTCAFNVYIRNGVVWREEQQAEYERSGT----PDV -PDYGPRGCNKGLRHARYMYGKQRVLYPMKRVG---------------------------- -----------------KRGEGKWQRISWDQATREIAEKFIDVAVKH----GPDSITLGSG -TQLAVKMAS------YSALARFSNI----------------------------------- ----TGVTVPEFYSGVGDLPTGFYMTTGLTYLGDTMAAVFKSKCVLVWMANPAVTRIPDAH -FFWEAKYNGTEVVTISPEFTPTAMHSSKWLNIKPG-TDTALAMAMVHTIIDEKLY----D -------AAYIREQTDLPFLVREDNGEFLRAEDLN----------------LVDMLAV--- ---------------------------RENV-----------FYLWDQKTRRMVQAPGTGA -AEAPVGRRRRKFETIALGNI------E---------------------PALEGRW----- -------------------------------------TVQTR-TGK-VAVTTVFAL----- ----LKKRAAE-HSPEKMS-----------------------------DETGLNPNAMRTV -AREF----------AKAGKQAMIYAGFSACKWLHGD-ILQRAMVLLCALTGATGHEGG-G ---VQMANGPKSRGITS--FAFAGVGAA--------------------------------- ------------------------SRVVASTLWDYD-----HGKMKQLNEKIYGKKLA--- ----------DEFDSHY-----QH------------------------------SLKEDWF -------PQY---GKNGWKMGIFAGENGANWRAS--------------GNRWRTEAF-EKL -EMIVALVPDAGITMHHADIVLPIAHH--YERADIMLQSRH-PYVQV----L-DRAVKPLG -EAVDDFEALRRVSAAISAIAREKGTPAIKDD----------------------------- ----------------VDGRTFRRDLKRT-----------------------LELYTM--- ---------------------------DGAIKDSRDIVQFIINATPGIPKMSFAELAAKGI -VRVDESRGSTVW----------NSDESPFHADIAESVHEKR--PYETLT----------- --------------------GRQQFYIDHEWFLKFDEALPIYHPPLKQKGYP--LQMTMG- ------------------------------------------------------------H -ARHGIHSMWRDDSFLVSLQR---------------GEPDIYVNPDDATARNVRDGDLI-- ----------------EVFNDGGSFICMAHVSAGIMPGTVYMYHGWD-------------- -------------PTMFRGRQNFAAVIPTAGLVKPTSVAGDYGH---------LGYRVLAY -APN-QTYRDFTCNFKLHS-------RGKV---------------------------TAAK -VRIA ->greatmiami_2019_sw_WHONDRS-S19S_0099_F_bin.30_scaffold_496_3 rank: A; sdf:ACG33_10685 putative steroid C25 dehydrogenase (S25dA4); K24713 (db=kegg) -----------------------------------------------MSVNRRQFLAHTAL -ASAALA--------LQHGAAM--ADALTR--------------PYR------RI-EDVWR -KKWTW------DRVAHGTHG-TNCAGTCAFNVYIRNGVVWREEQQAEYERSGT----PDV -PDYGPRGCNKGLRHARYMYGKQRVLYPMKRVG---------------------------- -----------------KRGEGKWQRISWDQATREIAEKFIDVAVKH----GPDSITLGSG -TQLAVKMAS------YSALARFSNI----------------------------------- ----TGVTVPEFYSGVGDLPTGFYMTTGLTYLGDTMAAVYKSKCVLVWMANPAVTRIPDAH -FFWEAKYNGTEVVTISPEFTPTAMHSSKWLNIKPG-TDTALAMAMVHTIIEEKLY----D -------AAYIREQTDLPFLVREDNGEFLRAEDLN----------------LVDMLAV--- ---------------------------RENV-----------FYLWDQKTRRMVQAPGTGA -AEAPVGRRRRKFETIALGDI------E---------------------PALEGRW----- -------------------------------------TVQTR-TGK-VTVTTVFAL----- ----LKKRAAD-HSPENMS-----------------------------AETGLNPNAMRTV -AREF----------AKAGKQAMIYAGFSACKWLHGD-ILQRAMVLLCALTGATGHEGG-G ---VQMANGPKSRGITS--FAFAGVGAA--------------------------------- ------------------------SRIVASTLWDYD-----HGKMKQLNEKIYGKKLA--- ----------DEFDSHY-----QH------------------------------SLKEDWF -------PQY---GKNGWKMGIFAGENGANWRASGN--------------RWRTEAF-EKL -EMIVALVPDAGITMHHADIVLPIAHH--YERADIMLQSRH-PYVQV----L-DRAVKPLG -EAVDDFEALRRVSAAISAIAREKGTAAIKDD----------------------------- ----------------VDGRTFRRDLKRT-----------------------LELYTM--- ---------------------------DGAIKDSRDIVQFIINATPGIPKMSFAELAAKGI -VRVDESRGSTVWNSDESP----FHADIA------ESVHEKR--PYETLT----------- --------------------GRQQFYIDHEWFLKFDEALPVYHPPLKQKGYP--LQMTMG- ------------------------------------------------------------H -ARHGIHSMWRDDSFLVSLQR---------------GEPDIYVNPDDAAARNVRDGDLI-- ----------------EVFNDGGSFICMAHLSAGIMPGTLYMYHGWD-------------- -------------PTMFRGRQNFAAVIPTAGLVKPTSVAGDYGH---------LGYRVLAY -APN-QTYRDFTCNFKLHS-------RGKV---TAAKVRIA-------------------- ----- ->providencecreek_2019_sw_WHONDRS-S19S_0007_B_bin.10_k121_1581149_4 rank: A; shal:SHALO_2978 molybdopterin oxidoreductase, alpha subunit (db=kegg) ----------------------------------------------MANSSRRNFLKASG- ---------------FSAAMLAGQGTLFAKTDVIK-VENAKDSYPNA------SFTETNYR -DEFKFTYGEKAEHGYAYHCV--NCQGNCAWEVWGNNGIVTRENQSAKYPAF------GHN -PDFNPRGCNKGVQHSQVMYEKDRILYPMKRIG---------------------------- -----------------ERGKGKWKRISWDEAATEVAQKLYTTM-------------IDPK -KGPAAITVH------AGTGLLTEGRRPSVLRFGT-------------------------- ---QLGASRIYPASYLGDMFTGAAIAYGEGNMGCTYDFMFNVSTSIMWGANPSATRIPDAH -FVWEGKYNGSKIIVITPEYNATAARAHLWVPIKPG-TDSFLAMSIINEMLAKKLY----- ------LPQAVKTYTDLPFLVDAKTKRFIRRSDAEHA------------------------ ---------------HDEKTHHLYE---------------DEFYCWNLKSGKPELMPGTEG -SERKTIMLKDKGWDI-----------D---------------------PALEGEW----- -------------------------------------EMTLQ-GGKKVKVTTVFEL----- ----LKKEASK-YSAKDTQ-----------------------------KITGVHLDVVTEL -ATHI-----------AKDKCVEITTGFSLNKYFNGV----LSIWNIATICGLTGRFGPRG ------------------------------------------------------------- -------------------------------GLNTE------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------NEFQLSG------------------------------------------------ ------LEALSGFAGKYS------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------PRFA-------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------SGFLSEFM------------------------------------------- ------------------------------------------------------------- ----- ->muddycreek_2019_sw_WHONDRS-S19S_0082_B_bin.95_k121_853774_5 rank: A; pmx:PERMA_0657 dimethylsulfide dehydrogenase subunit alpha (Dimethylsulfide dehydrogenase molybdenum subunit) (DMS DH alphasubunit) (DMS DH molybdenum subunit) (db=kegg) -----------------------------------------------MKLTRRTVLQGIAG -ASAATVVGGQD---ALGEAGAPAAKTGKD--VPVIIDDPREHYPNT-----RPV-EDMYR -SEFADTFGDPDDHGTAFHCV--NCQGNCAWQVWIKDGKVTRENQSAAYPAIR-----EDI -PDSNPRGCNKGVQHSQVMYEADRIRYPMKRVG---------------------------- -----------------ERGGGKWERISWDEAIDTIAQKLYRTM-------------VERG -PQGNYVH--------VGAGLLSEARGASIKRMGA-------------------------- ---LLGAVRPYIASYVGDMFPGVSLVYGEGNIGCSYDFMYGTNVQVYWGCNPNTSRIPDAH -YVWEGKYNGSKVIVISPEFNSTAIHADRWIPIKPG-FDGHLAMSLMHELVDKQLY----D -------AELVRKFTDLPMLIREDSGAMLRLSDIDPARAAAEGALAFDAELAEKFGKKAHG -KKDHAEDVFLAVNEVGGKLTAMPGGEGSAL---------GTLR----------------- --------LQDVGWKIT--------------------------------PALSGNW----- -------------------------------------TVTLR-DGKTVRVHTVFDA----- ----LRKELEA-FTPEKTH-----------------------------KLTGVHPTLVRDL -ARDI-----------ALPEVVSVTMGFALGKHFNGM-LTQRAIASLMALTCRMGPRGGLN --TENEWSISGLGGLSGFDGAFKHRFAS--------------------------------- -------------------------------GAVSEH----QLGDGAATSKKAYTDDEIRE -ATG------QDAASYR----------------------AEIAALLEKS-----KNDRGVD -PAKGRFGKPWWDTVETFFIVADARFRRNKSGYR--------------------EAFLDKA -KFFAVADMKMGETARFADIVLPSASH--YEVWDLRVNPGYHRFANIA---QPPKGLEPVG -EAKSEWHIATMLVTRMQEIA---------------------------------------- --------------------L--AEYAR--------------------------------- --------------------------------TKNIGVMHIPDPTHTRDGIRPLDKF---- -------------VELFTD----H------------------------------------- --------------------GKLGT---DKQAVEFALGHV--------------------- ------------------------------------------------------------- -------DQFRGEDLESCYDR----------------GGFLVVNDKGGKT----------- -------------------------------SPLYP------------------------- ------------------------------------------------------------- -----DKPYSTF----------------------------------ENHF----------- ----- ->icacos_2019_sw_WHONDRS-S19S_0094_B_bin.166_k121_1114214_14 rank: A; pmx:PERMA_0657 dimethylsulfide dehydrogenase subunit alpha (Dimethylsulfide dehydrogenase molybdenum subunit) (DMS DH alphasubunit) (DMS DH molybdenum subunit) (db=kegg) -----------------------------------------------MSISRRDALRNLLF -GTVAAG--------VAAKVPTAEAKEFSDPQPVR-VDDPRKSYPDT------QTTEDFYR -AEFQAVRGNPDERGFAYHC--VNCQGNCAFEVWTENGKVTRENQSASYPQLA-----PNL -PDANPRGCNKGSQHSQVMYEADRLLYPMKRAG---------------------------- -----------------ERGSGKWKRISWDEAITEIAENL------------HRGL-VEKG -PSSNYVH--------IGAGVLTEARAASIKRLGSL------------------------- ----IGAVRPYIASYVGDMFPGVTVVYGEGNIGCTYDFVFTTNVAVFWGCNPNTSRIPDAH -YLWEGKYNGSKIIVITPEFNSTAIHADLWVPLKAG-YDGHLALSIIHRIIQRKLF----R -------PEFLKEYTDLPFLVRKDTKELVRLSDVALD--------------AKGFDGA--- ----------------SARLFGEHPH--------------ECFLAFNTKNRKFTAMPGTEG -SGVETLRLQDMDWDI-----------D---------------------PALNGSW----- -------------------------------------KLTLK-DGKQVQVTTAFEL----- ----FKKEVAA-FAPEKVQ-----------------------------KLTGVHPSIVDEL -ATDL-----------TKAKVSLVTMGFAVGKHFNGM-LSQRAIASLTAFCGKLGPEGGLN --TENEWNISGLEGLSGFQGKYQHRFAS--------------------------------- -------------------------------GFVSE-----FMLGEGLEDADALYSDEDMR -RGT------GDSKAEY-----KA---------------KVQALLEQGKNDERYKEGKPYW -T-----------TVENFLLFADSRFRRNKGNYQ--------------------KAFLEKA -KFIAYGDVRANDMAIYADILLPCKTP--YECWDLRTNPGYHRYANIA---YPPPNLKPVG -ESKSEWEIATLVVEKLEALAKQKAAAT--------------------------------- ----------------GEDRY---------------------------------VVIP--- --------------------------------DKTHTQEGVRRLDELVREFTKDGTL-RTD -KDAVEYALEHVDQFKPNDTKSLY-ERGGFL-QLNEKAGKSS--PLYADK-----PYNTFE -NQLFLHQRFDTLT------GRLTFYVDHPLWIAANAHVPTAKQPIRPARHP--------- ------------------------------------------------------FVLMTPH -ARWSIHSTYKTSPILLRLQR---------------GKPCVMINPEIARARGIQDGDTI-- ----------------KMFNELGEVRVMAKLSPACPPDALVMEHGWE-------------- ---------------PFMYDGKKGHNLIIGDMLNLLELTDGWGH-------LKFGTNWDGN -----QHAYESTMDIAKA------------------------------------------- ----- ->riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.130_k121_990031_60 rank: A; sul:SYO3AOP1_1175 molydopterin dinucleotide-binding region (db=kegg) -----------------------------------------------MTVSRRDLLKAAAL -GSVAIGSNTLAKNAFTEPIPQKEAKDI----PVI-VEDPRASYLNTK-----SI-EDMYR -REFAETFGEKKDHGYAYHCV--NCQGNCAWQVWTKDGKVTRENQSASYPQIA-----PNI -PDYNPRGCNKGVQHSQIMYEQDRLLYPMKRVG---------------------------- -----------------PRGEGKWKRISWDEAITEVSENLYNTMQE---K----------- --GPAGNYIH------IGAGVLTEGRAASVKRLGT-------------------------- ---LLGAVRPYIASYVGDMFPGVSTVYGEGNIGCTYDFIFKTNVAIFWGCNPNTSRIPDAH -FLWEGKYNGSKIVVISPEYNSTAIHADLWVPIKPG-YDGHLAMAVLNEIVFKKMY----N -------ESFVKEFTDLPLLVRKDNKELVRFAEIDTKDSNFD---------SKSSEKL--- --------------LKKILKRELKEHEVF--------------LAWNQKTNKMTVLPGSEG -SPVETLRLKDRGWNI-----------N---------------------PALSGTW----- -------------------------------------KIKLK-DGHTVEVTTVFDL----- ----FKQELKK-FDPLRMH-----------------------------AVTGVHPTIVSEL -ARDM-----------IVPKNTLVTMGFSLGKYFNGM-LIQRAISALTAISGRLGESGGLN -T-ENEWNITGLSGLSGFEGKYQHRFAS--------------------------------- -------------------------------GFVSE-----YMLGDNLNDYDHLYAEAEIK -EST------GLGKKQY-----RE---------------KIEKIVKDG------ANDEGFK -NGKPYWTTM---ETFLLFADAR--FRRNKGSYK--------------------EAFLKKA -KFIAYGDYRMSDFCNYADILLPCKSH--YEVWDIRTNPG---YHRFANIAYPPANLKNVG -EAKSEWEISTLIAEKIQDIA------------------LKKYKS--------------SG -DKKAIHVPDTTHTQTGFRAL--DEVVNEFTIGG---------------------KVR--- --------------------------------SDKDAVEYMLEHVDQFKPNSTKTMY-ERG -GFLVLNDKAGKSSPLYSN----K-PYNT------FESNKLLYQPFETLT----------- --------------------GRLTFYVDHHLWIETGAHIPTARNPIRPKK----------- ----------------------------------------------------FPFVLMTPH -ARWSIHSTYKTSKILQRLQR---------------GKPYIMINPKVAEAKGIKDGDEV-- ----------------KMFNDLGETFLMAKITPSAPEHSLVMEHGWEPFMYKNKVGH---- ----------------------NALV---GDMINLLELSDGWGH-------LKFGTNWDGN -----QHAYETTVDIVKA------------------------------------------- ----- diff --git a/assets/trees/nar_nxr/nar_nxr.refpkg/phylo_modelNQB2rG.json b/assets/trees/nar_nxr/nar_nxr.refpkg/phylo_modelNQB2rG.json deleted file mode 100644 index 76c34e49..00000000 --- a/assets/trees/nar_nxr/nar_nxr.refpkg/phylo_modelNQB2rG.json +++ /dev/null @@ -1,11 +0,0 @@ -{ - "empirical_frequencies": true, - "datatype": "AA", - "subs_model": "WAG", - "program": "RAxML version 7.7.2", - "ras_model": "gamma", - "gamma": { - "alpha": 1.530755, - "n_cats": 4 - } -} \ No newline at end of file diff --git a/assets/trees/nar_nxr/nar_nxr.tre b/assets/trees/nar_nxr/nar_nxr.tre deleted file mode 100644 index 72500eef..00000000 --- a/assets/trees/nar_nxr/nar_nxr.tre +++ /dev/null @@ -1 +0,0 @@ -(OOP57237|Brocadia_caroliniensis:0.010806074,(RIK02127|Brocadia_sp:0.000910858,(KKO18748|Brocadia_fulgida:0.000000005,OQZ00558|Brocadia_sp_UTAMX2:0.000914005)0.781:0.000917034)0.992:0.013579216,(WP_052562588|Brocadia_sinica:0.009341785,(OHB44699|Planctomycetes_bacterium_GWE2_41_14:0.028539476,((WP_070066136|Brocadia_sapporoensis:0.005501886,RZV59451|Brocadia_sp_BROELEC01:0.002673850)1.000:0.025826757,((((OHB72803|Planctomycetes_bacterium_RBG_16_41_13:0.009726587,(WP_099324707|Kuenenia_stuttgartiensis:0.000917459,NxrA_Candidatus_K_stuttgartiensis_CAJ72445:0.000000005)0.998:0.017229244)1.000:0.098072241,((((RBG1_10:0.249943905,((GCA_001803565_00046|MHDQ01000004unannotatedprotein:0.399259377,((BBJ23760|Nitrotoga_sp_AM1:0.0,BBJ23368|Nitrotoga_sp_AM1:0.0):0.003761140,((RFC31618|Nitrotoga_sp_SPKER:0.006020303,((SPS06998|Nitrotoga_fabula:0.0,SPS06751|Nitrotoga_fabula:0.0):0.042255811,(RFC37636|Nitrotoga_sp_CP45:0.000000005,(RFC33776|Nitrotoga_sp_LAW:0.000000005,RFC30723|Nitrotoga_sp_MKT:0.001768416)0.953:0.002651540)0.916:0.006621566)0.695:0.008594937)0.950:0.008908972,BBJ23476|Nitrotoga_sp_AM1:0.013693167)0.440:0.001391552)1.000:0.666812638)1.000:0.321755680,((((greatmiami_2019_sw_WHONDRS-S19S_0099_F_bin.30_scaffold_496_3:0.011379394,(NASQAN2014_190_B_bin.96_k121_3766_2:0.017081478,(NASQAN2015_111_B_bin.76_k121_226837_116:0.021392246,icacos_2019_sw_WHONDRS-S19S_0094_F_bin.26_scaffold_99_5:0.002525334)0.985:0.013886431)0.102:0.014633186)1.000:1.045689577,((flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0000472_14:0.290495020,flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001772_1:0.289900857)1.000:0.977544665,(flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_3:0.182186058,flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_4:0.220237367)1.000:0.733397499)0.485:0.198655286)0.560:0.125080923,(flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_1443778_1:0.429037937,(sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_397025_1:0.433198646,((NASQAN2011_330_B_bin.17_k121_430440_3:0.641466723,(flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001351_7:0.393884505,(gunnisonriver_2019_sw_WHONDRS-S19S_0062_A_bin.22_Ga0451722_0001801_3:0.324547720,((watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_924190_1:0.157095605,((whiteclaycreek2_2019_sw_WHONDRS-S19S_0038_B_bin.50_k121_1710496_1:0.167523285,(NASQAN2011_265_B_bin.52_k121_959771_6:0.026017376,NASQAN2011_265_B_bin.52_k121_465271_4:0.000000008)0.818:0.115349202)1.000:0.087988271,(logan1_2019_sw_WHONDRS-S19S_0097_B_bin.20_k121_1372227_2:0.159911107,(lewisrun_2019_sw_WHONDRS-S19S_0014_F_bin.22_scaffold_791_5:0.020931878,(watershed3_2019_sw_WHONDRS-S19S_0084_F_bin.6_scaffold_35_30:0.032515342,lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.6_k121_1211148_1:0.071100891)0.951:0.024998611)0.985:0.042982912)1.000:0.086501401)0.986:0.042923050)1.000:0.086203118,(((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_3271_6:0.320376687,(flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_493_9:0.147904578,(nebranchanacostia_2019_sw_WHONDRS-S19S_0081_B_bin.6_k121_1546998_5:0.099435688,lecontecreek_2019_sw_WHONDRS-S19S_0018_A_bin.2_Ga0451754_0000231_3:0.013429712)1.000:0.121234242)0.749:0.040234813)0.863:0.055442056,((king_2019_sw_WHONDRS-S19S_0016_B_bin.5_k121_1281127_1:0.156531059,NASQAN2015_010_A_bin.16_Ga0466474_000034_25:0.177178519)0.992:0.044604086,((((NarG_Escherichia_coli_NP_415742:0.203008887,NarG_Halomonas_maura_gb_AAT47523:0.153894902)0.981:0.047232779,watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0000093_1:0.311887965)0.998:0.063567006,((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_201_6:0.106781950,(NASQAN2011_286_B_bin.1_k121_764018_13:0.005660724,NASQAN2011_286_F_bin.29_scaffold_54_27:0.000000005)1.000:0.123919793)1.000:0.131403606,(NarG_Pseudomonas_stutzeri_gb_AAZ43099:0.046987015,(NarG_Pseudomonas_fluorescens_gb_AEV63780:0.078508524,(flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_1186915_16:0.074914222,flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_2341297_11:0.000000008)0.885:0.078978122)0.708:0.032866426)1.000:0.168519259)0.242:0.019184033)0.998:0.047390479,(flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0000931_1:0.199222465,((littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_6:0.090260755,(littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_7:0.175888927,watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.15_k121_1272084_2:0.078834694)0.544:0.015106087)0.765:0.040298684,flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0004490_1:0.189261863)0.493:0.037097247)1.000:0.139855980)0.732:0.020426298)0.995:0.035229012)0.458:0.027215325,((((((NASQAN2015_172_B_bin.54_k121_327740_1:0.048321373,((cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.17_Ga0451756_0000169_17:0.003316375,Yukon_2004-1_F_bin.10_scaffold_678_1:0.110287220)0.999:0.034293344,(cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.23_Ga0451756_0000618_5:0.010147982,(NASQAN2015_227_F_bin.21_scaffold_4919_3:0.024300445,NASQAN2011_028_B_bin.24_k121_53788_5:0.000000005)0.990:0.014294289)0.365:0.007073108)0.988:0.017900532)0.950:0.016382079,(watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.45_k121_975195_1:0.104162330,flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.10_scaffold_7566_1:0.054766712)0.871:0.041502925)1.000:0.076566993,((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4056_4:0.104610952,((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.19_scaffold_731_2:0.070583667,eastforkpoplarcreek_2019_sw_WHONDRS-S19S_0039_B_bin.13_k121_238651_23:0.043655384)1.000:0.048776638,((yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_2728883_1:0.089459252,cobbmillcreek_2019_sw_WHONDRS-S19S_0090_B_bin.15_k121_168873_1:0.023635532)0.326:0.001148673,lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.30_k121_510322_1:0.090302159)0.885:0.013388066)0.878:0.032405321)0.565:0.021969185,((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.12_scaffold_10959_2:0.152164297,(NASQAN2016_164_F_bin.17_scaffold_1152_1:0.081072836,NASQAN2015_227_F_bin.21_scaffold_2406_1:0.055593684)0.976:0.109893377)0.649:0.067627453,flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.3_scaffold_11088_2:0.064995222)0.815:0.039464533)0.963:0.029952893)0.148:0.015135463,flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.46_k121_495423_17:0.129369944)0.861:0.019065424,(((watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_1345490_1:0.392541235,yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_3072591_1:0.171599398)0.840:0.248083204,((Yukon_2004-1_F_bin.10_scaffold_25058_1:0.105822798,NASQAN2016_164_F_bin.17_scaffold_8891_2:0.030238438)0.312:0.015380827,NASQAN2015_227_B_bin.17_k121_559871_7:0.039959075)0.928:0.056585084)0.234:0.007394197,(watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0001905_7:0.604640728,flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4528_3:0.181397923)0.845:0.147304633)0.903:0.041551231)0.908:0.028658570,lecontecreek_2019_sw_WHONDRS-S19S_0018_F_bin.2_scaffold_1_206:0.136445862)1.000:0.145006781)0.508:0.034596552)0.999:0.098317003)0.563:0.079911427)0.999:0.168588838)0.985:0.135263217,(CRI68048|Thiocapsa_sp_KS1:1.094261762,(flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_237162_4:0.488541056,(sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_391728_1:0.401066831,((GCA_003453735_00577|DMNE01000186unannotatedprotein:0.309801231,(((AFN37208|Nitrolancea_hollandica_Lb:0.039042664,AFN37205|Nitrolancea_hollandica_Lb:0.011623567)0.981:0.018883572,(AFN37207|Nitrolancea_hollandica_Lb:0.059889634,AFN37206|Nitrolancea_hollandica_Lb:0.035086850)0.741:0.017421853)1.000:0.237080104,((WP_005004540|Nitrococcus_mobilis:0.005243894,Nitrococcus_mobi_EAR23355:0.002640284)1.000:0.244172179,((WP_011314088|Nitrobacter_winogradskyi:0.002534990,(Nitrobacter_sp_Nb_311A_ZP_01048070:0.009400785,(A_Nitrobacter_hamburgensis_YP_578638:0.031550923,B_Nitrobacter_hamburgensis_YP_578186:0.023740548)1.000:0.053836401)0.978:0.022733577)0.963:0.016265428,Nitrobacter_winogradskyi_gb_ABA05326:0.037260949)1.000:0.216806507)0.880:0.055888930)1.000:0.201356108)0.974:0.063994885,(blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1348658_11:0.000000005,blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1581374_9:0.000000005)1.000:0.282418622)0.992:0.095642727)0.132:0.041822075)0.986:0.188699247)0.017:0.049701189)0.871:0.184584331)0.173:0.116759705)1.000:0.987285179)0.550:0.236304701,(providencecreek_2019_sw_WHONDRS-S19S_0007_B_bin.10_k121_1581149_4:0.472026440,(riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.130_k121_990031_60:0.325258151,(icacos_2019_sw_WHONDRS-S19S_0094_B_bin.166_k121_1114214_14:0.332187014,muddycreek_2019_sw_WHONDRS-S19S_0082_B_bin.95_k121_853774_5:0.705095308)0.418:0.106182937)0.994:0.312896913)1.000:0.774651657)1.000:0.778950754)0.975:0.154198707)1.000:0.231811834,((((cas150m_01921|CAS-150m-3753Perchloratereductasesubunitalphaprecursor:0.000877951,cas50m_02313|CAS-50m-4275Perchloratereductasesubunitalphaprecursor:0.000943888)1.000:0.055806636,(GCA_003523945_00056|DOFS01000023unannotatedprotein:0.004579427,DJ_nxrA:0.006504779)0.999:0.028051194)0.999:0.046515340,(DJ_nxrA2:0.074233359,DJ_nxrA1:0.060036576)0.694:0.026270877)0.990:0.045759227,(((((WP_053378142|Nitrospira_moscoviensis:0.008325164,(riogrande_2019_sw_WHONDRS-S19S_0066_A_bin.62_Ga0451725_0007910_5:0.012480447,GCA_002083555_01644|MSXN01000007unannotatedprotein:0.002680030)0.924:0.008235322)0.880:0.003077004,(((GCA_002420115_02525|DIHK01000043unannotatedprotein:0.012092376,GCA_002483475_03556|DLHZ01000062unannotatedprotein:0.002691200)1.000:0.023236403,(GCA_900078535_00262|FJVM02000053unannotatedprotein:0.014982211,(GCA_001458695_00808|LN885086unannotatedprotein:0.023036213,GCA_002451055_00821|DKBD01000269unannotatedprotein:0.007573759)0.688:0.003976613)0.390:0.001522946)0.694:0.004052451,GCA_002331335_02310|DCZO01000011unannotatedprotein:0.017101140)0.922:0.006393889)0.980:0.016473529,(riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.137_k121_1578656_32:0.002308752,GCA_002737345_00863|NSIK01000010unannotatedprotein:0.006832549)1.000:0.023034521)0.393:0.016407361,WP_080886776|Nitrospira_japonica:0.032980329)1.000:0.048957408,(((Baikal-deep-G159_00763|Baikal-deep-G159-c12unannotatedprotein:0.0,Baikal-deep-G158_01775|Baikal-deep-G158-c18unannotatedprotein:0.0):0.048648714,((CBK42946|Nitrospira_defluvii:0.0,NxrA2_Nitrospira_defluvii_YP_003798871:0.0):0.003132849,GCA_900170025_02937|FWEX01000006unannotatedprotein:0.002326236)1.000:0.046043049)0.987:0.028241355,((CUS31266|Nitrospira_nitrosa:0.032070423,CUS38776|Nitrospira_nitrificans:0.014206130)1.000:0.059565512,(GCA_001567445_02228|JZQY01000048unannotatedprotein:0.031898730,((CBK42928|Nitrospira_defluvii:0.0,NxrA1_Nitrospira_defluvii_YP_003798853:0.0):0.020188049,GCA_003456605_00391|DMQK01000091unannotatedprotein:0.020042828)0.973:0.029005902)1.000:0.049275974)0.916:0.026734542)0.987:0.030138243)0.163:0.019579673)1.000:0.351067665)0.984:0.079553236,((OGW90704|PVC_group_Omnitrophica_bacterium_RIFCSPHIGHO2_02_FULL_63_14:0.144751486,OGW87506|PVC_group_Omnitrophica_bacterium_RIFCSPLOWO2_01_FULL_45_10b:0.164104591)0.967:0.106906909,(((OUC07869|Chloroflexi_Litorilinea_aerophila:0.108541565,RCK74665|Chloroflexi_Anaerolineae_bacterium:0.109258954)1.000:0.169950317,(KRT77589|Armatimonadetes_bacterium_CSP1_3:0.210493116,KRT68888|NC10_bacterium_CSP1_5:0.135568128)0.411:0.038266264)0.915:0.031759119,(GBC85351|bacterium_sp_HR11:0.152552869,(GCA_002328125_01442|DCWK01000050unannotatedprotein:0.001947491,GCA_002685755_01556|NYYB01000002unannotatedprotein:0.001760896)1.000:0.300590274)1.000:0.072067691)0.853:0.038248286)0.986:0.048595639)0.582:0.046460101,((MSP_nxrA:0.025354205,(((MBL09191|Acidiferrobacteraceae_bacterium:0.033838550,TDJ60388|Nitrospina_sp:0.042298150)0.934:0.011901270,((Nitromaritima_KMP11423|SCGC_AAA799_A02:0.031363214,((GCA_002705185_00880|PAJA01000060unannotatedprotein:0.0,MAX17737|Nitrospina_sp:0.0):0.009948403,(GCA_001542995_01387|LFLA01000024unannotatedprotein:0.011368914,(GCA_002453875_01196|DKHT01000003unannotatedprotein:0.0,GCA_002454045_00625|DKID01000024unannotatedprotein:0.0):0.025625262)0.731:0.006753767)0.957:0.010197443)0.837:0.006601827,cas150m-4_02474|CAS-150m-4914Perchloratereductasesubunitalphaprecursor:0.016703925)0.925:0.009659103)0.780:0.008734629,PIQ99248|_Nitrospinae_bacterium_CG11_big_fil_rev_8_21_14_0_20_45_15:0.031915291)0.638:0.007806333)0.907:0.014421329,(WP_042250442|Nitrospina_gracilis:0.018020385,WP_042251421|Nitrospina_gracilis:0.040064063)0.228:0.014895744)1.000:0.388356661)1.000:0.140833958)0.990:0.036064959,((((WP_007222969|Jettenia_caeni:0.0,NxrA_planctomycete_KSU_1_ZP_10101005:0.0):0.002251376,TLD40744|Candidatus_Jettenia_ecosi:0.013337202)0.983:0.006913180,TLD41279|Candidatus_Jettenia_ecosi:0.021669001)0.000:0.000000005,WP_007220240|Jettenia_caeni:0.000000005)0.998:0.026966168)0.882:0.017606145,((WP_070067449|Brocadia_sapporoensis:0.003688908,(OQZ04816|Brocadia_sp_UTAMX1:0.003783493,RZV56287|Brocadia_sp_BROELEC01:0.003479253)0.233:0.001151055)0.997:0.020857077,(KKO18624|Brocadia_fulgida:0.021890769,(OOP55454|Brocadia_caroliniensis:0.024026386,(WP_052561322|Brocadia_sinica:0.000917852,KXK29028|Brocadia_sinica:0.000923980)1.000:0.023040103)0.993:0.017011726)0.725:0.010490186)0.877:0.013675102)0.965:0.015645586)0.779:0.007537636)0.931:0.007662564)0.935:0.007110293); diff --git a/assets/trees/nar_nxr/nar_nxr_color_map.tsv b/assets/trees/nar_nxr/nar_nxr_color_map.tsv deleted file mode 100644 index 27fa3bb2..00000000 --- a/assets/trees/nar_nxr/nar_nxr_color_map.tsv +++ /dev/null @@ -1,6 +0,0 @@ -"label" "color" -"nxr/nar-N utilization" "purple" -"other-None" "blue" -"narG-N reducer" "green" -"nxr-Nitrifier" "red" -"nxr-None" "orange" diff --git a/assets/trees/nar_nxr/nar_nxr_search_terms.txt b/assets/trees/nar_nxr/nar_nxr_search_terms.txt deleted file mode 100644 index 6bfb7b07..00000000 --- a/assets/trees/nar_nxr/nar_nxr_search_terms.txt +++ /dev/null @@ -1,13 +0,0 @@ -K00370 -K00371 -K00374 -nitrate reductase -nar -NAR -narG -narH -narI -narJ -EC: 1.7.99.4 -EC: 1.7.5.1 - diff --git a/assets/trees/nar_nxr/nar_nxr_seqs_for_tree_aligned.faa b/assets/trees/nar_nxr/nar_nxr_seqs_for_tree_aligned.faa deleted file mode 100644 index 8620f8d1..00000000 --- a/assets/trees/nar_nxr/nar_nxr_seqs_for_tree_aligned.faa +++ /dev/null @@ -1,5425 +0,0 @@ ->RBG1_10 -----------------------------------------------MTLSRRRFLKISSL -SAAGA---------LVDLPELKFLQFLET------VENPLEYYPNR------DW-EKIYR -DQYRY------DSSFTFVCT-PNDTHACRLRAYVRNGIVIRVEQAYDVQNYTDLYGNKAS -VMWSPRGCNKGYNLPRRVYGPYRVKHPMVRKGWKE----------WAE----------AG -FPDPTLPENQQKYF--RRGEDSWVKVSWDEGFELVAKGLLHTMEKYSGEKGAEIL-RKQG -YPEEMIEAM------HGSGAQTIKIRGAMPLLGATRIFGFYRFAN-MLGLYDGK------ ----LGARGWSNFSWHGDLPPGHPMVTGVKCSDPELNDFRHSKLLVFLGKNMVESKMADAH -WWIETIERGGKVVNISPEYSATSSKSDYWIPIRPG-TDTALLLGVTQIIIQEKLY----D -------QDFIKKHTDLPLLIRMDNLKLLRPTDIIKG---YK----------NQILTG--- ---------------YSVKVQKIKPELREKW---------GDFVVWDLKTKK--PQTVT-- --------REDLGEKIERKGL------N---------------------PALEGNY----- -------------------------------------KIKLV-NGKEIEVKTVFQL----- ----YKELLSE-YDLETVS-----------------------------QITGSPKNLIYQL -AQDL-----------ATIKPASIHTGEGVNHFFHCD-LVTRAVWLPLALTGNIGKPGA-N ---VGHWAGNYKGEVFD--------GLG--------------------------------- -------------------------------VYLNE-----DPFNPNLDPSAKLEDIKLKK -YYK------GEEVCYW-----NY---------------EDRPLIVKG----------KCF -TGKTHMPTP---TKAEWVGNGN-LLNNAKWAHN----------------MIANVE--GKV -EMIVYNEIEWTASCEYADVVFPVHSWMELTLPDMTASCSN-PFLQV----W-KGGIKPIF -DTKQDNEVLAGVAAKLSELT---------------------------------------- ----------------HDNRY--KDYWKF-------------------------VLEG--- --------------------------------NNEVYLQRILDACSTTKGYKIDELL-KSD ------RG----WLMNFRT----Y-PRIPFW----EQIQESK--PFYTKT----------- --------------------GRMEFYREEDEFIDYGENLIVHREPVEATPYL--PNVILG- -THKAIR---PNSYGISPESIN---ADERQVRNLKMSWKQVKLSKNPLWEKGFRFYCLTPK -SRHTVHSSWSVLDWNMIWQSNFGDPYRMDNRTPGVGEHQMHMNPLDAKELGINDGDYAYV -DANPEDRPYTGWKEEDPFYKVSRLMVRVKYNPAYPRGITMIKHASFIATHKSVKAHESRP -DKRAVSED-TGYQSSFRYGSQQSIT---RGWLQPTMMTDSLVRKNYMGQEIGEGYEIDVN -APN-TCPKETLVKIIKAE-DGGMGGKGKW---EPARTGYTPAG--ENKDMKKFLEGGFIL -KV-- ->cas150m_01921|CAS-150m-3753Perchloratereductasesubunitalphaprecursor -----------------------------------------------MFLSRRQFLKVTTG -TVAAVA--------LADKALA--LTALQP--VVE-VGNPLGEYPDR------AW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRVRSFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTMHRRVYGPYRLKGPLMRRGWKA----------WMD----------AG -SPEFT-PDVMSKYKFNARYLDDMLRVSWDTAFTYIAKAMLIISERYSGEAGARRL-REQG -YPPEMIEMS------KGSGVRTFKFRAGMPILGVIGKMGITRMNGGCGALLDTYIRKVKP -NQAQGGRYWSNYTWHGDQNPAHPFWSGVQTSDIDMNDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARCVVITPEYNPTAYRADYWIPVRPA-TDAALFLGACKIIFDENMH----D -------HDFCAAYTDMPILVRTDTLQYLDPRDVIQG---YA---------LPDFSKT--- ---------------YSGKVQTLDPAKIARL---------GGFMVWDINKNS--AVPIH-- --------RELVGWHFRNSGI------E---------------------PAMTGSY----- -------------------------------------RVKLL-NGREVDVLPVFQM----- ----YQAHLQD-YDLDTCH-----------------------------QINRAPKDLIVRW -ARDS-----------GTVKPAAIHNGEGTNHYFHQT-IIARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGIWC-ATPWSGGGLG--------------------------------- -------------------------------THTAE-----NPFKITLDPNAHGKEVHVKG -YYY------GEEVAYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNAKHHYD----------------MVKNVD--PHI -ETLITQDVEMTSDVNHNDVAMGVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLTEMT---------------------------------------- ----------------GDKRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYVQRLLDASSTAYGYSVDTML-KSE ------KG----WMVMCRT----Y-PRQPFW----EETNESK--PQWTRT----------- --------------------GRYENYRIEPEAIEYGENFISHREGTEATPYL--PNAIMT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIALPWQEIKRYSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQLHVNPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAFPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAMD-TGYQSNFRYGAQQSFT---RDWLMPMHQLDSLPGKHAVAWKFKFGYQVDNH -AVN-TVPKECLMRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->cas50m_02313|CAS-50m-4275Perchloratereductasesubunitalphaprecursor -----------------------------------------------MFLSRRQFLKVTTG -TVAAVA--------LADKALA--LTALQP--VVE-VGNPLGEYPDR------AW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRVRSFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTMHRRVYGPYRLKGPLMRRGWKA----------WMD----------AG -SPEFT-PDVMSKYKFNARYLDDMLRVSWDTAFTYIAKAMLIISERYSGEAGARRL-REQG -YPPEMIEMS------KGSGVRTFKFRAGMPILGVIGKMGITRMNGGCGALLDTYIRKVKP -NQAQGGRYWSNYTWHGDQNPAHPFWSGVQTSDIDMNDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARCVVITPEYNPTAYRADYWIPVRPA-TDAALFLGACKIIFDENMH----D -------HDFCAAYTDMPILVRTDTLQYLDPRDVIQG---YA---------LPDFSKT--- ---------------YSGKVQTLDPAKIARL---------GGFMVWDINKNS--AVPIH-- --------RELVGWHFRNSGI------E---------------------PAMTGSY----- -------------------------------------RVKLL-NGREVDVLPVFQM----- ----YQAHLQD-YDLDTCH-----------------------------QINRAPKDLIVRW -ARDS-----------GTVKPAAIHNGEGTNHYFHQT-IIARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGIWC-ATPWSGGGLG--------------------------------- -------------------------------THTAE-----NPFKITLDPNAHGKEVHVKG -YYY------GEEVAYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNAKHHYD----------------MVKNVD--PHI -ECLVTQDVEMTSDVNHNDVAMGVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLTEMT---------------------------------------- ----------------GDKRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYVQRLLDASSTAYGYSVDTML-KSE ------KG----WMVMCRT----Y-PRQPFW----EETNESK--PQWTRT----------- --------------------GRYENYRIEPEAIEYGENFISHREGTEATPYL--PNAIMT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIALPWQEIKRYSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQLHVNPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAFPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAMD-TGYQSNFRYGAQQSFT---RDWLMPMHQLDSLPGKHAVAWKFKFGYQVDNH -AVN-TVPKECLMRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->GCA_003523945_00056|DOFS01000023unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------LADKALA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTMHRRVYGPYRLKGPLMRRGWKA----------WMD----------DG -SPEFT-PAVMTKYKFNARYLDDMLRVSWDTAFTYLAKAMIIIAERYSGEAGARRM-REQG -YPPEMIEMT------KGSAIRSFKFRAGMPILGLIGKMGITRMNGGCGALLDTYIRKVQP -DQAQGGRYWSNYTWHGDQNPAHPFWNGVQASDVDMNDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARLVVITPEYNPTAYRADYWMPVRPA-TDGALFLGALKIIFDENLY----D -------YDFCQSYTDMPILVRTDTLQYLDPREVIKD---YA---------FPDFANS--- ---------------YSGKVQTMKPDVIARL---------GGFMVWDLSKNQ--AVPIH-- --------RELVGWHYRKSGI------D---------------------SALTGTY----- -------------------------------------RVTLL-NGREVDVMPIFQM----- ----YQVHLQD-YDLDTVH-----------------------------QINRCPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTNHYFHQT-IIARGAAMVLIVTGNVGKFGT-G ---QHTWAGNYKAGIWN-ATPWGGGGLG--------------------------------- -------------------------------THTGE-----NPFKITTDPNAHGKEIHVKG -YYY------GEEVAYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNAKHHYD----------------MVKNVD--PHI -ETLVNQDVEMTSDVNHNDVSFAVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLSEMT---------------------------------------- ----------------GDGRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYLQRILDASTTAYGYNADVML-KSE ------KG----WMVMCRT----Y-PRHPFW----EETNESK--PQWTRT----------- --------------------GRYENYRVEPECIEYGENFISHREGTEATPYL--PNAIMS- -SNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWQEIKRYSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIALD-TGYQSNFRYGAQQSFT---RDWLMPMQQLDSLPGKHAVGWKFKFGYQVDNH -AVN-TVPKECLIRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->DJ_nxrA -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------LADKALA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTMHRRVYGPYRLKGPLMRRGWKA----------WMD----------DG -SPEFT-PAIMSKYKFNARYLDDMLRVSWDTAFTYLAKAMIIIAERYSGEAGARRL-REQG -YPPEMIEMT------KGSAIRAFKFRAGMPILGLIGKMGITRMNGGCGALLDTYIRKVQP -DQAQGGRYWSNYTWHGDQNPAHPFWNGVQASDVDMNDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARLVVITPEYNPTAYRADYWMPVRPA-TDGALFLGALKIIFDENMY----D -------YDFCQSYTDMPILVRTDTLQYLDPREVIKD---YA---------FPDFANS--- ---------------YSGKVQTMKPDVIARL---------GGFMVWDLNKNQ--AVPLH-- --------RELVGWHYRKSGI------D---------------------SALTGTY----- -------------------------------------RVTLL-SGREVDVMPIFQM----- ----YQVHLQD-YDLDTVH-----------------------------QINRCPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTNHYFHQT-IIARGAAMVLIVTGNVGKFGT-G ---QHTWAGNYKAGIWN-ATPWGGGGLG--------------------------------- -------------------------------THTGE-----NPFKITTDPNAHGKEIHVKG -YYY------GEEVAYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNAKHHYD----------------MVKNVD--PHI -ETLVNQDVEMTSDVNHNDISFAVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLSEMT---------------------------------------- ----------------GDGRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYLQRILDASTTAYGYNADVML-KSE ------KG----WMVMCRT----Y-PRHPFW----EETNESK--PQWTRT----------- --------------------GRYENYRVEPEAIEYGENFISHREGTEATPYL--PNAIMS- -SNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWAEIKRYSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVFV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIALD-TGYQSNFRYGAQQSFT---RDWLMPMQQLDSLPGKHAVGWKFKFGYQVDNH -AVN-TVPKECLIRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->DJ_nxrA2 -----------------------------------------------MLVTKRQFLKITAG -TVAAVA--------LADNALA--LTALQP--VVE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDMYGNRGT -FAHNPRMCLKGYTYHRRVYGPYRLKGPLMRRGWKA----------WMD----------DG -SPELD-PTVMTKYKFSARYLDDMLRVSWDTAFTYLAKAMIVIANRYSGEAGARRL-REQG -YPPEMIEMM------KGSGVRSMKFRAGMPVLGVIGKMGITRMNGGCGALLDSWVRKVGP -DSAQGGRYFNNLTWHGDQDPSQPFWSGAQAIDCDLSDMRFSKMNTSWGKNFVENKMPEAH -WKLESIERGGRVVVITPEYNPTAQRADYWMPVRPE-TDGALFLGACKIILDDGLQ----D -------NDFIRSSTDFPLLIRTDTLQYLDPRDVIKD---YA---------FPDFSKS--- ---------------YSGKVQGLSPSQIARL---------GGFMVWDLNQDK--AVPLH-- --------RELVGWHFKKSGI------D---------------------PALTGSF----- -------------------------------------RVKLL-SGREADVMPLFQM----- ----YQVHLQD-YDLDTVH-----------------------------QINRCPKDLIVRW -ARDN-----------GTIKPAAIHNGEGVCHYFHMT-SMGRAAAMVMTLTGNMGKFGS-G ---CHTWSGNYKVGVWA-ATPWSGEGIG--------------------------------- -------------------------------IHTGE-----NPFKITTDPNAHGKEINYRP -YYY------GEETTYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKLRWVANVN-ILNNSKHHYD----------------MVKNVD--PHI -ETIVTQDIEMTSDVNHADVSFAVNGWMEFTYPEMTATVSN-PWMQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLTEMT---------------------------------------- ----------------GDGRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYVQRLLDAGSTSYGYSADTML-KSE ------KG----WMVMTRT----Y-PRIPLW----EETNESK--PMWTRS----------- --------------------GRLETYRVEPEAIEYGENFISHREGTEATPYL--PNAIMS- -SNPYIR---PDDYGIPITAQH---HDDKTVRNIKLPWAEIKRYANPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQIHVNPSAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAFPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIALD-TGYQSNFRYGAQQSFT---RSWLMPMHQLDSLPGKMANKWKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->DJ_nxrA1 -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------LADKALA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTMHRRVYGPYRLKGPLMRRGWKQ----------WMD----------DG -SPEFT-PAIQTKYKFNARYLDDMLRVSWDTAFTYLAKAMIVIANRYSGEYGARKL-REQG -YPPEMIEMM------KGSGVRAFKFRAGMPVLGIIGKMGITRMNGGCGALLDSWVRKVGP -ENAQGGRYWNNYTWHGDQDPSQPWWNGTQNCDIDLSDMRFCKFNTSWGKNFVENKMPEAH -WKLESIERGARIAVITPEYNPTAYRADYWIPIRPE-SDGSFFLGACKMIVDEGLF----D -------ADFVRANTDMPLLVRTDTLQYLDPRDVIKD---YQ---------FPDFSNT--- ---------------YSGKVQTLKPAEIARL---------GGIMVWDLNKNQ--AVPIH-- --------RELVGWHFKKSGI------D---------------------PALTGTH----- -------------------------------------RVRLL-TGREVDVMPIFQM----- ----YQVHLQD-YDLDTVH-----------------------------QICRSPKDLIVRW -ARDM-----------GTVKPAAIHNGEGVCHYFHMT-QNGRAAALTLIYSGNMGKFGS-G ---CHTWSGNYKAGTWA-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFKITTDPNAHGKEIKTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNSKHHYD----------------MVKNVD--PHN -ECLVHQEVEMTSDVNHFDVSFAVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLTEMT---------------------------------------- ----------------GDGRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYLQRLLDAGNCSYGYNADTML-KSE ------KG----WMVMTRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRVETYRVEPEAIEYGENFIVHREGPEATPYL--PNAIMS- -SNPYIR---PDDYGVPITAQH---HDDKTVRNIKLPWAEIKRYANPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQIHINPSAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAFPYHVTMAKHAPFVSTAKSVKGHETRP -DGRAIALD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHPVAWKFKWGFAIDHH -AVN-TTPKECLIRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->GCA_001567445_02228|JZQY01000048unannotatedprotein ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------MPIFQL----- ----YQVHLQD-YDLDTVH-----------------------------QVNRSPKDLIVRW -ARDC-----------GTIKPAAIHNGEGVCHYFHMT-SMGRAAALVMMLTGNIGKFGT-G ---CHTWSGNYKVGIWQ-AAPWSGAGAS--------------------------------- -------------------------------VYLGE-----DPWNLNLTTDAHGKEIKYRK -YYY------GEEPGYW-----NH---------------GDNALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVVNVN-ILNNSKHHYD----------------MVKNVD--PNI -EMLVTQDIEMTSDVNHADVAFAVNSWMEFTYPEMTATVSN-PWIQI----W-KGGIRPLY -DTRNDADTFAGVSAKLKELT---------------------------------------- ----------------GEARM--ADTYRF-------------------------VYQN--- --------------------------------RMDIYVQRILDASTTFYGYSADVML-KSE ------KG----WMVMCRT----Y-PRHPLW----EETNESK--PHWTRS----------- --------------------GRLESYRIEPEAIEYGENFIVHREGPECTPYL--PNAIMS- -TNPYIR---PDDYGIPITAQH---HDDKTVRNIKLPWQEIKRHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYCFV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHTIAWKFKWGYAIDHH -GIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->CBK42928|Nitrospira_defluvii ----------------------------------------------MMQLSRRQFLKVSAG -TVAVAA--------VADKALA--LTALQP--VVE-VNNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-SDVKRKYKFDSRFLDDMVRVSWDTAFTYVAKGLIVIGTRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPILGMMGKHANTRFNNCVLPLLDSWIRKVNP -DQAQGGRYWNNYTWHGDQDPSQPWWNGTQNCDVDLSDMRFTKLNTSWGKNFVENKMPEAH -WKLESMERGARLVIITPEYNPTASRADYWIPVRPE-TDGALFLGASKIILDENYQ----D -------IDFIKGFTDMPLLVRTDTLQYLDPHEVLKD---YQ---------VPDFTKS--- ---------------YSGRVQGLSQDQVQRL---------GGMMVWDLAKGK--AVPLH-- --------REQVGVHLAQSGI------D---------------------PALTGTY----- -------------------------------------RIKLL-NGREVDVMPIYQL----- ----YTIHLQD-YDLDTVH-----------------------------QVNRAPKDLIVRW -ARDC-----------GTVKPAAIHNGEGVCHYFHMT-SMGRAAALVMMLTGNIGKFGT-G ---CHTWSGNYKVGIWQ-AAPWSGAGAS--------------------------------- -------------------------------VYLGE-----DPWNLNLRDDVHGKEIKYRK -YYY------GEEPGYW-----NH---------------GDNALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVVNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMLVTQDIEMTSDVNHADVAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFAGVAAKLKEMT---------------------------------------- ----------------GEQRM--ADTYKF-------------------------VYHN--- --------------------------------RVDIYVQRILDASTTFFGYSADVML-KSE ------KG----WMVMCRT----Y-PRHPLW----EETNESK--PHWTRS----------- --------------------GRLETYRIEPEAIEYGENFISHREGPECTPYM--PNAIMT- -TNPYVR---PEDYGIPVTAQH---HDDKTVRNIKLPWSEIKQHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYCYV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKQANALKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMVKWLKGEHIK -IKV- ->NxrA1_Nitrospira_defluvii_YP_003798853 ----------------------------------------------MMQLSRRQFLKVSAG -TVAVAA--------VADKALA--LTALQP--VVE-VNNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-SDVKRKYKFDSRFLDDMVRVSWDTAFTYVAKGLIVIGTRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPILGMMGKHANTRFNNCVLPLLDSWIRKVNP -DQAQGGRYWNNYTWHGDQDPSQPWWNGTQNCDVDLSDMRFTKLNTSWGKNFVENKMPEAH -WKLESMERGARLVIITPEYNPTASRADYWIPVRPE-TDGALFLGASKIILDENYQ----D -------IDFIKGFTDMPLLVRTDTLQYLDPHEVLKD---YQ---------VPDFTKS--- ---------------YSGRVQGLSQDQVQRL---------GGMMVWDLAKGK--AVPLH-- --------REQVGVHLAQSGI------D---------------------PALTGTY----- -------------------------------------RIKLL-NGREVDVMPIYQL----- ----YTIHLQD-YDLDTVH-----------------------------QVNRAPKDLIVRW -ARDC-----------GTVKPAAIHNGEGVCHYFHMT-SMGRAAALVMMLTGNIGKFGT-G ---CHTWSGNYKVGIWQ-AAPWSGAGAS--------------------------------- -------------------------------VYLGE-----DPWNLNLRDDVHGKEIKYRK -YYY------GEEPGYW-----NH---------------GDNALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVVNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMLVTQDIEMTSDVNHADVAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFAGVAAKLKEMT---------------------------------------- ----------------GEQRM--ADTYKF-------------------------VYHN--- --------------------------------RVDIYVQRILDASTTFFGYSADVML-KSE ------KG----WMVMCRT----Y-PRHPLW----EETNESK--PHWTRS----------- --------------------GRLETYRIEPEAIEYGENFISHREGPECTPYM--PNAIMT- -TNPYVR---PEDYGIPVTAQH---HDDKTVRNIKLPWSEIKQHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYCYV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKQANALKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMVKWLKGEHIK -IKV- ->GCA_003456605_00391|DMQK01000091unannotatedprotein ----------------------------------------------MMQVSRRQFLKVSAG -TVAAAA--------VADKALA--LTALQP--VVE-VDNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-SDVKRKYKFDSRFLDDMVRVSWDTAFTYVAKGLVVIGTRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPILGMMGKHANTRFNNCVLPLLDSWIRKVNP -DQAQGGRYWNNYTWHGDQDPSQPWWNGTQNCDVDLSDMRFTKLNTSWGKNFVENKMPEAH -WKLESIERGARLVVITPEYNPTASRADYWIPVRPE-TDGALFLGASKIILDENYQ----D -------IDFIKGFTDMPLLVRTDTLQYLDPYEVVKE---YQ---------LPDFTKS--- ---------------YSGRIQGLTQDHIRRL---------GGMMVWDLAKGQ--AVPLH-- --------REQVGLHFAQTGI------D---------------------PALTGTY----- -------------------------------------RVKLL-NGREIDVMPVYQM----- ----YTIHFQD-YDLDTVH-----------------------------QINRAPKDLIVRW -ARDC-----------GTVKPAAIHNGEGVCHYFHMT-SMGRAAALVMMLTGNIGKFGT-G ---CHTWSGNYKVGIWQ-AAPWSGAGAS--------------------------------- -------------------------------VYLGE-----DPWNLNLKDDVHGKEIKYRK -YYY------GEEPGYW-----NH---------------GDNALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVVNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMLVTQDIEMTSDVNHADVAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFSGVAVKLKEIT---------------------------------------- ----------------GDQRM--ADTYKF-------------------------VYQN--- --------------------------------RVDIYVQRILDASSTFFGYSADVML-KSE ------KG----WMVMCRT----Y-PRHPLW----EETNESK--PHWTRS----------- --------------------GRLESYRIEPEAIEYGENFISHREGPECTPYL--PNAIMT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWSEIKQQANPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYCYV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQANFRYGAQQSFT---RSWLMPMHQTDSLPGKQANAMKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMAKWLKGEHIK -IKV- ->Baikal-deep-G159_00763|Baikal-deep-G159-c12unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAAA--------VADKALA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTFHRRVYGPYRLKGPLMRKGWKE----------WMD----------AG -SPELT-PDVKRKYKFDARMLDDMVRASWDTAFTYVAKACILIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIIGKMMNTRFNGGVLPVLDSWIRKVDP -DKAQGGKYYSNYTWHGDQDPSHPWWNGTQNCDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPVRPE-TDGANFLGACKIIIDENMQ----D -------IDYIKGYTDMPLLVRTDTLQYLDPREVIAD---FK---------FPDFSKS--- ---------------YSGRVQSLKPEQIERL---------GGMMVWDNNKKA--AVPLH-- --------REQVGWHYQNSGI------D---------------------AALTGTY----- -------------------------------------RVKLI-NGREVDVAPIWQM----- ----YMVHFQD-YDLDTVH-----------------------------QITRSPKDLIVRY -GRDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAALMMTITGNIGKFGT-G ---CHTWSGNYKAGVWN-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNQTLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIITQDIEMTSDVNHADVAFACNSWMEFTYPEMTATVSN-PWLQI----W-KGGIRPLY -DTRNDADTFGGVAVKLTELT---------------------------------------- ----------------GDARI--RQVFHF-------------------------VYQN--- --------------------------------RVDVYVQRALDASATCYGYNADTML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFVVHREGPECTPYL--PNAIFS- -TNPYVR---PDDYGIPITAQH---HDDKHIRNLKLPWTEIKRQSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYIYV -DGNPVDRPYRGWKPSDPFYKVSRLMIRAKYNPAFPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHAIAWKFKWGYAIDHH -AVN-TTPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->Baikal-deep-G158_01775|Baikal-deep-G158-c18unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAAA--------VADKALA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTFHRRVYGPYRLKGPLMRKGWKE----------WMD----------AG -SPELT-PDVKRKYKFDARMLDDMVRASWDTAFTYVAKACILIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIIGKMMNTRFNGGVLPVLDSWIRKVDP -DKAQGGKYYSNYTWHGDQDPSHPWWNGTQNCDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPVRPE-TDGANFLGACKIIIDENMQ----D -------IDYIKGYTDMPLLVRTDTLQYLDPREVIAD---FK---------FPDFSKS--- ---------------YSGRVQSLKPEQIERL---------GGMMVWDNNKKA--AVPLH-- --------REQVGWHYQNSGI------D---------------------AALTGTY----- -------------------------------------RVKLI-NGREVDVAPIWQM----- ----YMVHFQD-YDLDTVH-----------------------------QITRSPKDLIVRY -GRDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAALMMTITGNIGKFGT-G ---CHTWSGNYKAGVWN-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNQTLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIITQDIEMTSDVNHADVAFACNSWMEFTYPEMTATVSN-PWLQI----W-KGGIRPLY -DTRNDADTFGGVAVKLTELT---------------------------------------- ----------------GDARI--RQVFHF-------------------------VYQN--- --------------------------------RVDVYVQRALDASATCYGYNADTML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFVVHREGPECTPYL--PNAIFS- -TNPYVR---PDDYGIPITAQH---HDDKHIRNLKLPWTEIKRQSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYIYV -DGNPVDRPYRGWKPSDPFYKVSRLMIRAKYNPAFPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHAIAWKFKWGYAIDHH -AVN-TTPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->CBK42946|Nitrospira_defluvii ---------------------------------------------MQVSVSRRQFLKISAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHGCRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PDVKRKYKFDSRFLDDLNRVSWDTAFTYVAKAAVLIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIVGKMMNTRFNGGCLPLLDSWIRKVDA -EKAQGGKYYSNYTWHGDQDPSHPFWNGTQNCDVDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPVRPE-TDGANFLGAAKIIFDENLQ----D -------IDYIKEFTDLPLLVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQVERL---------GGMMVWDLAKGK--AVPLH-- --------REQVGFHFKESGI------D---------------------PALTGTF----- -------------------------------------RVKLL-NSREIDVMPIYQM----- ----YQVHLQD-YDLDTTH-----------------------------QITRAPKDLIVRW -ARDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAAFIMTITGNIGKFGT-G ---CHTWSGNYKAGIWN-AVPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNLTLDPNAHGKEIKTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIVTQDIEMTSDVNHADVAFACNSWMEFTYPEMTGTVSN-PWIQI----W-KGGIRPLY -DTRNDADTFAGVAAKLAEMT---------------------------------------- ----------------GDARF--RGVFHF-------------------------VYMN--- --------------------------------RVDVYPQRMLDASATCYGYSADVML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFISHREGPECTPYL--PNAIFS- -NNPFIR---PDDYGIPITAQH---HDDKHVRNIKLPWAEIKRHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVFV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHTIAWKFKWGYAIDHH -GIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->NxrA2_Nitrospira_defluvii_YP_003798871 ---------------------------------------------MQVSVSRRQFLKISAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHGCRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PDVKRKYKFDSRFLDDLNRVSWDTAFTYVAKAAVLIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIVGKMMNTRFNGGCLPLLDSWIRKVDA -EKAQGGKYYSNYTWHGDQDPSHPFWNGTQNCDVDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPVRPE-TDGANFLGAAKIIFDENLQ----D -------IDYIKEFTDLPLLVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQVERL---------GGMMVWDLAKGK--AVPLH-- --------REQVGFHFKESGI------D---------------------PALTGTF----- -------------------------------------RVKLL-NSREIDVMPIYQM----- ----YQVHLQD-YDLDTTH-----------------------------QITRAPKDLIVRW -ARDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAAFIMTITGNIGKFGT-G ---CHTWSGNYKAGIWN-AVPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNLTLDPNAHGKEIKTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIVTQDIEMTSDVNHADVAFACNSWMEFTYPEMTGTVSN-PWIQI----W-KGGIRPLY -DTRNDADTFAGVAAKLAEMT---------------------------------------- ----------------GDARF--RGVFHF-------------------------VYMN--- --------------------------------RVDVYPQRMLDASATCYGYSADVML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFISHREGPECTPYL--PNAIFS- -NNPFIR---PDDYGIPITAQH---HDDKHVRNIKLPWAEIKRHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVFV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHTIAWKFKWGYAIDHH -GIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_900170025_02937|FWEX01000006unannotatedprotein ---------------------------------------------MQVSVSRRQFLKISAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHGCRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PDVKRKYKFDSRFLDDLNRVSWDTAFTYVAKAAVLIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIVGKMMNTRFNGGCLPLLDSWIRKVDA -DKAQGGKYYSNYTWHGDQDPSHPFWNGTQNCDVDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPLRPE-TDGANFLGAAKIIFDENLQ----D -------IDYIKEFTDLPLLVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQVERL---------GGMMVWDLAKGK--AVPLH-- --------REQVGFHFKESGI------D---------------------PALTGTF----- -------------------------------------RVKLL-NGREIDVMSIYQM----- ----YQVHLQD-YDLDTTH-----------------------------QITRAPKDLIVRW -ARDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAAFIMTITGNIGKFGT-G ---CHTWSGNYKAGIWN-AVPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNLTLDPNAHGKEIKTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIVTQDIEMTSDVNHADVAFACNSWMEFTYPEMTGTVSN-PWIQI----W-KGGIRPLY -DTRNDADTFAGVAAKLAEMT---------------------------------------- ----------------GDARF--RGVFHF-------------------------VYMN--- --------------------------------RVDVYPQRMLDASATCYGYSADVML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFISHREGPECTPYL--PNAIFS- -NNPFIR---PDDYGIPITAQH---HDDKHVRNIKLPWAEIKRHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVFV -DGNPVDRPYRGWKPSDPFYKVSRLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHTIAWKFKWGYAIDHH -GIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->CUS31266|Nitrospira_nitrosa -----------------------------------------------MVITRRQFMKASAG -TIAAIA--------VADKVLA--LTALQP--VTE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLIRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFASRFLDDMLRVSWDTAFTYAAKAMVVIATRYSGEAGARRL-REQG -YAPEMVEMM------KGAGVRCFKHRAGMPILGFIGKHSNTRFNNSVLPVLDTWVRKVGP -DQAQGGRYWNNYTWHGDQDPSQPFWNGTQNCDVDLSDMRFTKFNTSWGKNFVENKMPEAH -WKLESIERGARLAVITPEYNPTAQRADYWIPLRPQ-SDGALFLGACKIILDENMH----D -------VDYLKQFTDMPLLVRTDTLQYLDPREVIPD---YK---------FPDFSHS--- ---------------YSGRIQALKPEYIERL---------GGFMVWDLAKQK--AVPLH-- --------REQVGWHFDSSGI------Q---------------------PALTGTY----- -------------------------------------RVKLL-NGREIDAQPIYQM----- ----YQIHFQD-YDLDTTH-----------------------------QITRSPKDLLVRW -ARDS-----------GTIKPAAIHNGEGVCHYFHMT-SNGRAAALVLTLTGNIGKFGS-G ---CHTWSGNYKVGIWS-ATPWSGSGSG--------------------------------- -------------------------------VHLSE-----DPWQINLDPNAHGKEIKYKS -YYY------GEEPGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKLRWVVNVN-LLNNAKHHYD----------------MVRNVD--PNI -ECLITQDIEMTSDVNHADIAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDADTFAGVAARLAEIT---------------------------------------- ----------------GEKRM--RDVFHF-------------------------VYEN--- --------------------------------RVDVYAQRLLDASSTFYGYSADVLL-KSE ------KG----WMVMVRT----Y-PRHPLW----EETNESK--PMWTRS----------- --------------------GRIESYRVEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPHVR---PDDYGIPVTAQH---HDDKTIRNIKLPWVEIKRHTNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQVHINPQAAKDRGINDGDYVYI -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTPKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKSANGLKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->CUS38776|Nitrospira_nitrificans -----------------------------------------------MLVSRRQFMKATAG -TIAAAA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WAD----------DG -SPELT-PEAKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIVIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRCFKHRAGMPILGFIGKHSNTRFNNSVLPLLDTWIRKVGP -DQAQGGRYWNNYTWHGDQDPSQPFWNGTQNCDVDLSDMRFTKFNTSWGKNFVENKMPEAH -WKLESIERGARIAVITPEYNPTAQRADYWIPLRPQ-SDGALFLGACKIILDENMQ----D -------IDYLKQFTDMPLLVRTDTLQYLDPRDVIQD---YK---------FPDFSHS--- ---------------YSGRIQALKPEYIERL---------GGFMVWDMAKKQ--AVPLH-- --------REQVGWHFDKSGI------E---------------------PALTGTY----- -------------------------------------RVKLL-NGREIDALPIYQL----- ----YLIHLQD-YDLDTTH-----------------------------QITRSPKDLLVRW -ARDS-----------GTIKPAAIHNGEGVCHYFHMT-ANGRAAALVLTLTGNIGKFGS-G ---CHTWSGNYKVGIWN-ATPWSGVGGG--------------------------------- -------------------------------VHLSE-----DPWHINLDANAHGKEIKYRN -YYY------GEEPAYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-LLNNAKHHYD----------------MVRNVD--PNI -ECLITQDIEMTSDVNHADIAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDADTFAGVAAKLAEIT---------------------------------------- ----------------GEKRM--RDVFHF-------------------------VYEN--- --------------------------------RVDVYAQRLLDASSTFYGYSADVLL-KSE ------KG----WMVMVRT----Y-PRHPLW----EETNESK--PMWTRS----------- --------------------GRIESYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYVR---PDDYGIPIAAQH---HDDKMIRNIKLAWQEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQVHINPQAAKDRGINDGDYVYI -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKSANGLKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->WP_080886776|Nitrospira_japonica ---------------------------------------------MTMFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMMRVSWDTAFTYAAKSMIVIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDTWIRKVTS -DQAQGGRYWSNYTWHGDQNPSQPWWCGAQASDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGGRIVVITPEYNPTAYRADYWMPLRPQ-SDGAIFLGAMKIITDENMH----D -------IDFLKGYTDAPVLVRTDTLQFVDPRDVVRD---YK---------FPDFSKS--- ---------------YSGRVQTLKPEQVERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYSNSGI------D---------------------AALTGTY----- -------------------------------------RIKLL-NGREIDVMPVWQL----- ----YLVHFQD-YDLDTVH-----------------------------QICRTPKDLLVRW -ARDS-----------GTVKPAAIHNGEGTNHYFHMT-VNSRGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWV-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVTNVN-VLNNAKHHYD----------------MVRNVD--PSI -ETLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTVTVSN-PWVQV----W-KGGIRPLY -DTRNDLDTFAGVAAKLSEIT---------------------------------------- ----------------GDKRM--RDYFAM-------------------------VYMN--- --------------------------------RVDVYVQRLLDASATFYGYSADTML-KSE ------KG----WMVMVRT----Y-PRVPFW----EETNESK--PMWTRT----------- --------------------GRFETYRTEPEAIEYGENFISHREGTEATPYL--PNAIMT- -SNPYCR---PDDYGIPITAQH---HDDKTVRNIKLPWSEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHANGLKWKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.137_k121_1578656_32 rank: A; nmv:NITMOv2_4538 putative Nitrite oxidoreductase, alpha subunit; K00370 (db=kegg) -----------------------------------------------MFLSRRQFLKVSVG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKE----------WMD----------AG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGVNALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPFWCGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPA-SDGAIFLGAMKIIVDENMH----D -------VDFLKGYTDSPVLVRTDTLQFLDPRDVVAD---YK---------FPDFSKS--- ---------------YSGRVQSLKPEQVERL---------GGMMVWDLNKKA--AVPLH-- --------REQVGWHYQNSGI------D---------------------AALTGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTCH-----------------------------QICRTPKDLLVRW -ARDS-----------GSIKPAAIHNGEGTNHYFHQT-INSRGAAMVLIVTGNVGKFGT-G ---QHTWAGNYKAGTWT-STPWSGAGIA--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFAANSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--RDYFKF-------------------------VYEN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRTPFW----EETNESK--PMWTRT----------- --------------------GRYENYRTEPEAIEYGENFISHREGTEATPYL--PNAIMT- -SNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWQEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVATPKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQLDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002737345_00863|NSIK01000010unannotatedprotein -----------------------------------------------MFLSRRQFLKVSVG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKE----------WMD----------AG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIVIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRTFKHRAGMPVLGIIGKMGNTRMNGGVNALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPFWCGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPA-SDGAIFLGAMKIIVDENMH----D -------VDFLKGYTDSPVLVRTDTLQFLDPREVVAD---YQ---------FPDFSKS--- ---------------YSGRVQSLKPEGIARL---------GGMMVWDLNKKA--AVPLH-- --------REQVGWHYQNSGI------D---------------------AALTGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTCH-----------------------------QICRTPKDLLVRW -ARDS-----------GSIKPAAIHNGEGTNHYFHQT-INSRGAAMVLIVTGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGIA--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFAANSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--RDYFKF-------------------------VYEN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRTPFW----EETNESK--PMWTRT----------- --------------------GRYENYRTEPEAIEYGENFISHREGTEATPYL--PNAIMT- -SNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWAEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTPKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQLDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002420115_02525|DIHK01000043unannotatedprotein -----------------------------------------------MFLSRRQFLKVSVG -TVAAAA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDSWIRKVSP -DQAQGGRYWSNYTWHGDQNPSQPFWSGVQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPQ-SDGALFMGAMKIIIDENMH----D -------VDFLKQFTDAPILIRTDTLQYLDPRDVVPD---YK---------FPDFSKS--- ---------------YSGRIQALKPQDVERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYMNSGI------D---------------------AALNGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTTH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGVTHYFHMT-PNGRAAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGAWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTITVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSEMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGVPITAQH---HDDKTIRNIKLSWHEIVRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTPKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002483475_03556|DLHZ01000062unannotatedprotein -----------------------------------------------MFLSRRQFLKVSVG -TVAAAA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDTWIRKVSP -EQAQGGRYWSNYTWHGDQNPSQPFWSGVQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGALFLGAMKIIVDENMH----D -------VDFLKQFTDAPILVRTDTLQYLDPRDVVAD---YK---------FPDFSKS--- ---------------YSGRIQALKPQDIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYMNSGI------D---------------------AALNGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTTH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGVTHYFHMT-PNGRAAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGCWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNL -ECLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTITVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSEMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIVRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_001458695_00808|LN885086unannotatedprotein -----------------------------------------------MFLSRRQFLKVSVG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -APELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDTWIRKVGP -DQAQGGRYWSNYTWHGDQNPAHPWWSGVQGSDVDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPQ-SDGALFLGAMKIIVDENMH----D -------VDFLKSFTDAPILVRTDTLQYLDPRDVIPD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQIQRL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYVNSGI------D---------------------AALTGTY----- -------------------------------------RVKLL-NGREIDAMPIWQM----- ----YMVHFQD-YDLDTVH-----------------------------QITRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGAWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIHTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVTNVN-VVNNAKHHYD----------------MVKNVD--PNI -ECLITQDIEMTSDINHADIAFACNSWMEFTYPEMTITVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRPEAEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIKLSWDEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPFVATPKSVKGHETRP -DGRAIAID-TGYQSNFRYGCQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_900078535_00262|FJVM02000053unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------IADNVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIGTRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRSGMPVLGIIGKMGNTRMNGGINALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPFWSGVQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGSLFLGAMKIIVDENMH----D -------SDFMKQFTDAPILVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQTLKPEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYTNSGI------D---------------------AALTGSY----- -------------------------------------RVKLL-NGREIDAMPIWQM----- ----YMVHFQD-YDLDTVH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKQ -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNI -ECLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYVR---PDDYGIPITAQH---HDDKTIRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMSKHAPYVATPKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQLDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002451055_00821|DKBD01000269unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRRYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPFWSGVQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGALFLGAMKIMVDENMH----D -------IDFMKSFTDAPILVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKGEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYANSGI------D---------------------AALTGSY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTVH-----------------------------QITRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-ANARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VVNNAKHHYD----------------MVRNVD--PNI -ECLITQDIEMTSDINHADIAFACNSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAVAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002331335_02310|DCZO01000011unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVIMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRSGMPVLGIIGKMGNTRMNGGINALLDTWIRKVGP -DQAQGGRYWSNYTWHGDQNPAHPWWSGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGSLFLGAMKIIVDENMH----D -------IDFMKSFSDAPILIRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKAEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYANSGI------D---------------------AALNGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YMVHFQD-YDLDTVH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INSRGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGAWT-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVTNVN-VLNNAKHHYD----------------MVRNVD--PNL -ECLITQDVEMTSDVNHNDIAFACNTWVEFTYPEMTITVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--RDYFAM-------------------------VYSN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMTKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->WP_053378142|Nitrospira_moscoviensis -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIVATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGILGKMGNTRMNGGINALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPWWSGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGSLFLGAMKIIVDENMH----D -------IDFLKSFTDAPILVRTDTLQYLDPRDVVAD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYVNSGI------D---------------------AALTGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTVH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNITTDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKLRWVTNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGTAAKLSEMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYLN--- --------------------------------RVDVYAQRMLDASSTFYGYSADTML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->riogrande_2019_sw_WHONDRS-S19S_0066_A_bin.62_Ga0451725_0007910_5 rank: A; nmv:NITMOv2_4538 putative Nitrite oxidoreductase, alpha subunit; K00370 (db=kegg) -----------------------------------------------MFLSRRQFLKISAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKA----------WMD----------DG -SPELT-PDTKRKYKFDSRFLDDMLRVSWDTAFTYAAKAYIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGILGKMGNTRMNGGINALLDTWIRKVNP -EQAQGGRYWSNYTWHGDQNPAHPWWSGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGALFIGAMKIIVDENMH----D -------IDFLKSFTDAPILVRTDT------------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->GCA_002083555_01644|MSXN01000007unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKA----------WMD----------DG -SPELT-PDTKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMVIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGILGKMGNTRMNGGINALLDTWIRKVSP -EQAQGGRYWSNYTWHGDQNPAHPWWSGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGALFLGAMKIIVDENMH----D -------IDFLKSFTDAPILVRTDTLQYLDPRDVVKD---YA---------FPDFSKS--- ---------------YSGRMQSLKPEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYTNSGI------D---------------------AALNGTF----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTTH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNITTDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVTNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYTN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPSYPYHVTMAKHAPYVATPKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002328125_01442|DCWK01000050unannotatedprotein -----------------------------------------------MKLSRRKFLAASGS -GLLA----------WSGRGLA--LAALHP--TGE-MGNPLTNYPNR------GW-EKVYR -DQYKV------DGSFTWVCS-PNCTHECRLKAFTRNGIVLRTEQNYDKHRITDIYGVKAT -HHWNPRGCPNGFTFQRRMYGPYRLRYPMVRRGWKR----------WAD----------DG -FPELN-EANKKKYKFDSRGTDTFVRVKWDDAFTYASKGFIQISKTYSGDAGKKRL-LDQG -YDPASLTHW------DGAGTRTMKFRGGMGLLGVIGKYGMYRFAN-TMSLLDTHTRGVGP -KKARGGRAWSNYTWHGDQAPGHPFVHGLQASDCDFNDLRNSKLHIHMGKNLVENKRPDSH -FFMESMERGAKIIVVAPEYSPPATKADYWIPIRPQ-TDTALLLGVTKILIDRGWY----D -------AKFVKEFTDFPLLVRTDNLRRLRPQDVIPG---YK---------NQDISGG--- ---------------PSFKIHGLTPKYRDAA---------GDFMIWDKGKNA--PAPIT-- --------RDDVGKHIGAKNL------D---------------------PALEGKY----- -------------------------------------TVKLV-SGVEIEVMPVFEM----- ----YKSHHLKDYDLDTVH-----------------------------EITHSPKDLIERF -AKDV-----------ATIKPAALHVGEGVNHWFHAT-MTNRAQYLPMTLTGNIGKLGA-G ---CHTWAGNYKAALFQ-GSGWSGPGFK--------------------------------- -------------------------------GWIAE-----DPFNPNLDPKADGKNIKVRG -TIK------DEEPAYW-----NY---------------GDKPLVVDTP-----KYGRKVF -TGKTHMPSP---TKSLWFTNVN-IFNNAKWLYE----------------MVKNVN--PKI -EMIICSEIEMTSTAEYSDILLPANTWMEFEQPEITGSCSN-PFLQI----W-KGGVKPIY -DTKDDILIMAEMAKKLGEIL---------------------------------------- ----------------KDKRF--EKYWKF-------------------------ALDK--- --------------------------------KAEVYIQRLLDSSTPTRGYKYDDIM-AGK ------YGESGTALMLFRS----Y-PRVPFL----EQIEESV--PFYSPT----------- --------------------GRLQAYNDEPGVIEYGENLIVQREGPEGTPYL--PNVIIS- -SSPFIR---PEDYGIPENHMG---WDERQVRNIKLPWKEAKDTKNPLWEAGYRFFCLTPK -SRHLTHSSWQVTDWNFIWSTSFGDPYRMDRRQPGVGENQVQMNPETAKDLGFNEGDYVYV -DANPADRPYIGWKPSDPFYKVARLMLRVKYNPSYPYDVVMIKHGAWCATEKSVKGHETRK -DGRAVSAD-TGYQASYRYGSHQSIT---RGWLMPMHQLDSLFHKKKVFMGFMLGGEADNH -AIN-TVPKETLVKLTKAE-DGGLGGRGVW---APATTGFSVGN--ENKFMQSYLQGT-VK -VKRG ->GCA_002685755_01556|NYYB01000002unannotatedprotein -----------------------------------------------MKLSRRKFLAASGS -GLLA----------WSGRGLA--LAALHP--TGE-MGNPLTNYPNR------GW-EKVYR -DQYKV------DGSFTWVCS-PNCTHECRLKAFTRNGIVLRTEQNYDKHRITDIYGVKAT -HHWNPRGCPNGFTFQRRMYGPYRLRYPMVRRGWKR----------WAD----------DG -FPELN-EANKKKYKFDSRGTDIFVRVKWDDAFTYASKGFIQISKTYSGDAGKKRL-LDQG -YDPASLTHW------DGAGTRTMKFRGGMGLLGVIGKYGMYRFAN-TMSLLDTHTRGVGP -KKARGGRAWSNYTWHGDQAPGHPFVHGLQASDCDFNDLRNSKLHIHMGKNLVENKRPDSH -FFMESMERGAKIIVVAPEYSPPATKADYWIPIRPQ-TDTALLLGVTKILIDRGWY----D -------AKFVKEFTDFPLLVRTDNLRRLRPQDVIPG---YK---------NQDISGG--- ---------------PSFKIHGLTPKYRDAA---------GDFMIWDKGKNA--PAPIT-- --------RDDVGKHIGAKNI------D---------------------PALEGKY----- -------------------------------------TVKLV-SGVEIEVMPVFEM----- ----YKSHHLKDYDLDTVY-----------------------------EITHSPKDLIERF -AKDV-----------ATIKPAALHVGEGVNHWFHAT-MTNRAQYLPMTLTGNIGKLGA-G ---CHTWAGNYKAALFQ-GSGWSGPGFK--------------------------------- -------------------------------GWIAE-----DPFNPNLDPKADGKNIKVRG -TIK------DEEPAYW-----NY---------------GDKPLVVDTP-----KYGRKVF -TGKTHMPSP---TKSLWFTNVN-IFNNAKWLYE----------------MVKNVN--PKI -EMIICSEIEMTSTAEYSDILLPANTWMEFEQPEITGSCSN-PFLQI----W-KGGVKPIY -DTKDDILIMAEMAKKLGEIL---------------------------------------- ----------------KDKRF--EKYWKF-------------------------ALDK--- --------------------------------KAEVYIQRLLDSSTPTRGYKYDDIM-AGK ------YGESGTALMLFRS----Y-PRVPFL----EQIEESV--PFYSPT----------- --------------------GRLQAYNDEPGVIEYGENLIVQREGPEGTPYL--PNVIIS- -SSPFIR---PEDYGIPENHMG---WDERQVRNIKLPWKEAKDTKNPLWEAGYRFFCLTPK -SRHLTHSSWQVTDWNFIWSTSFGDPYRMDRRQPGVGENQVQMNPEAAKDLGFNEGDYVYV -DANPADRPYIGWKPSDPFYKVARLMLRVKYNPSYPYDVVMIKHGAWCATEKSVKGHETRK -DGRAVSAD-TGYQASYRYGSHQSIT---RGWLMPMHQLDSLFHKKKVFMGFMLGGEADNH -AIN-TVPKETLVKLTKAE-DGGLGGRGVW---APATTGFSVGN--ENKFMQSYLQGT-VK -VKRG ->WP_042250442|Nitrospina_gracilis -----------------------------------------------MRLNRRKFLQVSAG -VASAMA--------LSSKRVG---AQLKP--VVK-VGNPLESYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKIRDLYGNQAD -AAWNPRMCLRGMTFPRRVYGPYRNKYPMLRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRMTWDDTFTYLAKGHVAVGKAYSGQRGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVVGKYGIYRLAN-MVGLLDAIIRGRGP -GQVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVTVCPEYNPPSTKADYWIPCRAGASDISIFLGCAKIIMDEGLV----D -------VDYVKDYTDMPLLVRTDNLIRLHPDDYIPG---YK---------NQPLPKD--- ----------------GFTTKWMKNFNRDKM---------PDFVVWDTNTDK--PVAVT-- --------REDIGAKMRKKNI------D---------------------PALDGVY----- -------------------------------------DIKLV-SGKTITVMPLYEM----- ----YKIHLKD-YDLDSVN-----------------------------QISHAPKDLVVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------SMVAE-----DPFNPVLDISKNVDWANVKG -YLK------GEEVGYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---SKLIWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYADFVLAANSWAEFESYEITSACSN-PFHQI----WGGTGIKPVF -DTIDDNLIHREFAKRLSQVT---------------------------------------- ----------------GDKRF--ADYVK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTAGMGYNIDDII-NGK ------YGEPGACLLLYRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEWGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYVYV -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTAMMKHSCWTSTERSVKAHEERP -DGRALSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKSKMKFMFGYEADNH -AIN-ATPKETLVKFSKAE-DGGMHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQY-- ----- ->WP_042251421|Nitrospina_gracilis -----------------------------------------------MRLNRRKFLQVSAG -VASAMA--------LSSKRVG---AQLKP--VVK-VGNPLESYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTFPRRVYGPYRNKYPMLRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRVTWDETFTYLAKGHVAIGKAYSGSRGAQRL-KNEG -YQPEMIEAM------GGSGSRSMKYRGGMGLLGVVGKYGIYRLAN-MMGLLDAIIRGRGP -GQVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVTVAPEYNPPATKADYWIPTRAGLADISIFLGVAKILMDEGLV----D -------GEYVKEYTDMPLLVRTDNLIRLHPEDYIPG---YK---------NQPLPKD--- ----------------GFTTKWMKNYDRDKM---------PDFVVWDTNTDK--PVALT-- --------REDIGAKMRRKNI------D---------------------PALDGVY----- -------------------------------------DIKLV-SGKTITVMPLYEM----- ----YKIHLKD-YDLDTVN-----------------------------QICHAPKDLVVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASFVPLMLTGNVGPKGS-G ---SHTWSGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPVLDVTKNVGWENIKA -YAK------GEEPGYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLLWFVNVN-VINNAKWFYE----------------MVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAANSWAEFESYEITSACSN-PFHQI----WGGTGIKPVF -DTIDDNLIHREFAKRLSQIT---------------------------------------- ----------------GDKRF--ADYMK--------------------------VYEG--- ----------------------------EAPNRTKAQIRRLFTTSTSGMGYNIDDII-NGK ------YGEPGCCLLLYRT----Y-PRSPFW----EMYTESK--PFYTAH----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYVYV -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTSMMKHSAWQSTERSVKAHEERP -DGRALSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKSKTKMKFVHGYEADNH -AIN-ATPKETLVKFSKAE-DGGMHGKGLW---EPARTGYTPESPLKDRFAEMYLAGQY-- ----- ->MBL09191|Acidiferrobacteraceae_bacterium -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LSSKKVG---AQLKP--VVK-VGNPLESYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVKDLYGNQAD -AAWNPRMCLRGMTFPRRAYGPYRNRYPMIRVGWKQ----------WAD----------DG -FPYLD-KANREKYKMTSRGTDEFVRMSWDDTFTYLSKGHIAVGRAYSGPRGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-MVALLDSIIRGRGP -GQVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDISVFLGCAKIIMDEGLV----D -------IEYVKDYTDMPLLVRTDNLKRLHADDFIPG---YK---------AQALPKD--- ----------------GFTTKWMKNFSRDQM---------PDFAVWDANTNK--PVAVT-- --------REDIGAKMRKKNI------D---------------------PVLDGVF----- -------------------------------------DVKLT-NGKTITVMPLYEM----- ----YKIHLKD-YDLDTVN-----------------------------QISHAPKDLVVRV -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPILDPAQNTDWKNVKG -YLK------GEEVSYW-----AH---------------RDEALIVNTP-----RYGRKVF -TGRSHMPTP---TKLFWFVNVN-VINNAKWFYE----------------LVFNTD--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFARRMSEVT---------------------------------------- ----------------GDKRF--GEFMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLMLFRT----Y-PRSPFW----EMFTESK--PYYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPYMGWKPSDPRYKVGRLMLRAKYNPAYPYHTTMMKHATWIGTERTVKAHEERP -XGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKFGYEADNH -AVN-ATPXEXLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYVR -VKI- ->TDJ60388|Nitrospina_sp -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LSSKRVG---AQLKP--VVK-VGNPLDSYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVKDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRLSWDQTYTYLAKGHIAVAKAYSGARGAQRL-KNEG -YQPEMIEAM------SGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-MMALLDSIIRGRGP -GQVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVTVAPEYNPPATKADYWIPVRAGLSDISVFLGAAKIIMDEGLV----D -------VPFVKEYTDMPLLVRTDTLVRLHPDDYIPG---YK---------VQALPKD--- ----------------GFTTKWLKNFNRSKM---------PDYTVWDTNTNK--PVAIT-- --------REDIGAKMLKKKI------D---------------------PALDGVY----- -------------------------------------DIKLV-SGKTITVMPMYEM----- ----YKIHLKD-YDLDTVN-----------------------------QISHAPKDLIIRL -SRDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---AHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFHIILDPAKNVDWKNVKG -YLK------GEEISYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLMWYVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIIAQDIEFTGSCEYSDIILAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLMHREFGKRMAQIT---------------------------------------- ----------------GDKRF--ADFMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRTPFW----EMYTESK--PYYTPN----------- --------------------GRLQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEEEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPYMGWKPSDPRYKVGRLMLRAKYNPAYPYHTTMMKHATWIGTERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-ATPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYTR -VKI- ->MSP_nxrA ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------MPLYEM----- ----YKIHLKD-YDLETVN-----------------------------QISHAPKDLVVRL -ARDM-----------GTIKPVEIHYGEGINHYFHAT-MHNRASFVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPEMDPAKNTTWAQIKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPVF -DTIDDNLIHREFAKRMAEVT---------------------------------------- ----------------GDKRF--ADYVK--------------------------VYEG--- ----------------------------EAPNRTKAQIRRLFTTGTTGMGYNIDDII-NGK ------YGEPGCCLMLFRT----Y-PRSPFW----EMFTESK--PYYTPH----------- --------------------GRLQFYNDEPEAIEWGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYVYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWTGTERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKSKMKFMHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->PIQ99248|_Nitrospinae_bacterium_CG11_big_fil_rev_8_21_14_0_20_45_15 -------------------------------------------------------MQVSAG -VATAMA--------LTSKKVG---AQLKP--VVK-VGNPLEAYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTFPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRMTWDQTFTYLAKGHVAVGKAYSGARGAQRL-KNEG -YQPEMIEAM------GGSGSRVMKYRGGMGLLGVVGKYGIYRLAN-MVALLDAIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDIALFLGCAKIIMDEGLV----D -------VNFVKEYTDMPLLVRTDTLMRLHPDDFIPG---YR---------NQDLPKD--- ----------------GFTTKWMKNFNRDKM---------PDFVVWDANTDK--PVAIT-- --------REDIGSKMKKKNI------D---------------------PVLDGVF----- -------------------------------------DIKLV-SGKTIPVMPLYEM----- ----YKVHLKD-YDIDTTN-----------------------------QICHAPKDLIVRL -ARDI-----------GTIMPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPVMDIAKNTDWANVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRSHMPCP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNCWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHRQFARRLAEVT---------------------------------------- ----------------GDKRF--SDYMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRSPFW----EMYTESK--PYYTPN----------- --------------------GRIQFYNDEPEAIEWGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWASTERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKSKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->Nitromaritima_KMP11423|SCGC_AAA799_A02 -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LTGKKVG---AQLKP--VVK-VGNPLDTYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKMTSRGTDEFVRLSWDQTFTYLAKGHVAVGKAYSGARGAQRL-KNEG -YQPEMIEAM------GGSGPRTMKYRGGMGLLGVVGKYGVYRLAN-QVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKMTIQWGKNLIENKMPEAH -WYTEIMERGGTLVAIAPEYNPPATKADYWVPVRAGLSDIALFLGVNKIIMEEGLV----D -------VDYVKDYTDMPLLVRTDNLIRLHPDDFIPG---YK---------AQQLPKD--- ----------------GFTTKWMKNYNRNQM---------PDFTVWDTNTNK--PVAIN-- --------REDIGAKMRKKNI------D---------------------PALDGVY----- -------------------------------------DVKLV-NGKTITVMPLYEM----- ----HKIHYKD-YDIDTVN-----------------------------QISHAPKDLIIRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASFTPLMLTGNVGPKGS-G ---SMTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----TPFDTELDPAKNIDWNRVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHRQFSRRLAEVT---------------------------------------- ----------------GDKRF--ADHMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRTPFW----EMYTESK--PFYTPN----------- --------------------GRTQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPFMGWKPSDPRYKVGRLMLRAKYNPAYPYHTTMMKHATWTATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYVR -VKI- ->cas150m-4_02474|CAS-150m-4914Perchloratereductasesubunitalphaprecursor ---------------------------------------------------------MSAG -VATAMA--------LSSKKVG---AQLKP--VVK-VGNPLDSYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRMTWDQTFTYLAKGHVAVGKAYSGVRGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVIGKYGVYRLAN-QVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDISIFLGVAKIIMDEGLV----D -------IDYVKDYTDMPLLVRTDNLIRLHPEDFIPG---YK---------VQPLPKD--- ----------------GFTTKWMKNFNRDKM---------PDFTVWDINTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVY----- -------------------------------------DIKLV-NGKTITVMPLYEM----- ----YKVHLKD-YDIDTVN-----------------------------QISHAPKDLILRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNTVLDASKNIDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHRQFSRRLAEVT---------------------------------------- ----------------GDKRF--ADHMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGACLLLFRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEFGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYVYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWTGTERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKSKMKFLHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->GCA_002705185_00880|PAJA01000060unannotatedprotein ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------------------------MTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDIALFLGVAKIIMDEGLV----D -------VDFVKDYTDMPLLVRTDTLVRLHPDDFIPG---YK---------AQALPKD--- ----------------GFTTKWMKNFNRDMM---------PDFTVWDTNTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVF----- -------------------------------------DIKLV-SGKTITAMPLYEM----- ----YKVHLKD-YDVDTTN-----------------------------QICHAPKDLIVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNTILDASKNVDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFSRRLAEVT---------------------------------------- ----------------GDKRF--ADHMK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRSPFW----EMYTESK--PYYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPXIR---PDXYGIPEDEQD---PDLRHVRNIKXPWSAVRTTXNFLWXXGXRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIXC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->MAX17737|Nitrospina_sp ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------------------------MTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDIALFLGVAKIIMDEGLV----D -------VDFVKDYTDMPLLVRTDTLVRLHPDDFIPG---YK---------AQALPKD--- ----------------GFTTKWMKNFNRDMM---------PDFTVWDTNTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVF----- -------------------------------------DIKLV-SGKTITAMPLYEM----- ----YKVHLKD-YDVDTTN-----------------------------QICHAPKDLIVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNTILDASKNVDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFSRRLAEVT---------------------------------------- ----------------GDKRF--ADHMK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRSPFW----EMYTESK--PYYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPXIR---PDXYGIPEDEQD---PDLRHVRNIKXPWSAVRTTXNFLWXXGXRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIXC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->GCA_001542995_01387|LFLA01000024unannotatedprotein -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LTSKRVG---AQLKP--VVK-VGNPLEAYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKMTSRGTDEFVRMTWDQTFTYLAKGHIAVAKAYSGARGAQRL-KNEG -YQPEMIEAM------SGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-QVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVAVAPEYNPPATKADYWIPVRAGLSDISLFLGVAKIIMDEGLV----D -------IDYVKDYTDMPLLVRTDTLIRLHPDDFIPG---YK---------AQSLPKD--- ----------------GFTTKWMKNFNRDMM---------PDYTVWDANTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PVLDGVF----- -------------------------------------DIKLV-SGKTITVMPLYEM----- ----YKVHLKD-YDIDTTN-----------------------------QICHAPKDLIVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNIVMDPSKNIDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLCWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFSRRMAEVT---------------------------------------- ----------------GDKRF--MDHMK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGACLLLFRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->GCA_002453875_01196|DKHT01000003unannotatedprotein -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LTSRRVG---AQLKP--VVK-VGNPLEAYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKMTSRGTDEFVRMTWDQTFTYLAKGHIAVAKAYSGARGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-MVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKMTIQWGKNLIENKMPEAH -WYTEIMERGGTLVAIAPEYNPPATKADYWVPVRAGLSDIALFLGCAKIIMDEGLV----D -------IDYVKDYTDMPLLVRTDTLIRLHPDDFIPG---YK---------AQSLPKD--- ----------------GFTTKWMKNFNRDMM---------PDYTVWDTNTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVF----- -------------------------------------DIKLV-NGKTITVMPLYEM----- ----YKIHLKD-YDLDTVN-----------------------------QICHAPKDLTLRL -ARDM-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPILDITKNVDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLCWYVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIILAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFGKRMAEVT---------------------------------------- ----------------GDKRF--SDFLK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLMLYRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINEGDYVYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-ATPKEVLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYVR -VKI- ->GCA_002454045_00625|DKID01000024unannotatedprotein -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LTSRRVG---AQLKP--VVK-VGNPLEAYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKMTSRGTDEFVRMTWDQTFTYLAKGHIAVAKAYSGARGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-MVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKMTIQWGKNLIENKMPEAH -WYTEIMERGGTLVAIAPEYNPPATKADYWVPVRAGLSDIALFLGCAKIIMDEGLV----D -------IDYVKDYTDMPLLVRTDTLIRLHPDDFIPG---YK---------AQSLPKD--- ----------------GFTTKWMKNFNRDMM---------PDYTVWDTNTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVF----- -------------------------------------DIKLV-NGKTITVMPLYEM----- ----YKIHLKD-YDLDTVN-----------------------------QICHAPKDLTLRL -ARDM-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPILDITKNVDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLCWYVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIILAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFGKRMAEVT---------------------------------------- ----------------GDKRF--SDFLK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLMLYRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINEGDYVYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-ATPKEVLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYVR -VKI- ->GBC85351|bacterium_sp_HR11 -----------------------------------------------MKLTRREFMQTTAA -GAAALV--------LDDALRG--LRLLQP--VVE-VGNPLAAYPNR------DW-EAVYR -DQYRY------DRSFTWVCS-PNCTHECRLRAFVRNGIVLRSEQNYDLHRISDLYGNKAT -AHWNPRGCLNGYTFQRRVYGPYRLKYPMIRRGWKQ----------WAD----------DG -FPELT-PENMAKYKFDSRGTDTFVRVSWDEAYTYVARGMIAIARRYSGEEGRRRL-LEQG -YPEEMLEHW------EGSGVRTFKLRGGMGLLGVIGKYGLYRFAN-MLALLDAHVRKVPP -EEAKGARIWSNYTWHGDQAPGQPFVHGLQTSDVDMNELRFARLHIQCGKNLVENKRPESH -FFIELMERGAKIVAIIPEYGPQATKADYWIPIRPA-TDAALWLGITRVMIDNGWY----D -------VDFLKKWSDMPLLIRTDTLRRLRAHEVFPG---YR---------GGLDPKG--- ---------------PSFQVQDLKPDQYEKI---------GDFVVFDEKSQS--LKPLT-- --------RDDVGGRLTAKGI------D---------------------PALSWRG----- -------------------------------------KVRLV-DGTEVECMTLWEA----- ----YKIHLQD-YDLDTVC-----------------------------EITHAPKELVLRL -ARDIWETTQEVRRQNPDMGAVAIHIGEGLNHWFHAT-EMNRAVYLPLILTGNIGKPGA-G ---CHTWAGNYKAALFQ-GSPWTGPGFL--------------------------------- -------------------------------GWIAE-----DPFHPLLDPKADGTQVKVKK -YTH------DEEPAYW-----NY---------------DDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKLMWFTNVN-LLNNAKWVYE----------------MIKNVN--PKV -ELIIAQDIEMTSSCEYADVILPANSWMEMETYEITASCSN-PFLQI----W-KGGIRPIF -DTKDDVLIMAELAKKLGEIL---------------------------------------- ----------------KDRRF--ADYWKF---A----------------------LER--- --------------------------------KTEVYIQRLLDTCTTTKGYRVEDIL-AGK ------YGEPGAALMLFRT----Y-PRVPFW----EQVHDDL--PFFTPT----------- --------------------GRLQAYNDEPEVIEYGENFIVHREGPEATPYL--PNVIVS- -SNPLIR---PEDYGIPLDHMG---RDERQVRNVKLPWSEVKKTKNPLWEKGYRFYCLTPK -TRHATHSSWQVTDWHLLYNNDFGDPYRLDKRSPGVGEAQLHMNPQAAKDLGINNGDYVYV -DANPADRPYVGWKPGDPFYRVARLMLRVKYNPAYPYHVVMMKHAAWIATEKSVRAHETRP -DGRALSED-TGYQASFRYGSQQSVT---VGWLMPMHQLDSLFHKAKAKVGFIFGGEADNH -AVN-TTPKETLVKVTKAE-DGGLGGKGVW---EPARTGYTAGD--EDDFMKRYLNGELVE -IVGE ->WP_099324707|Kuenenia_stuttgartiensis -----------------------------------------------MKLTRRAFLQVAGA -TGATLT--------LAKNAMA--FRLLKP--AVV-VDNPLDTYPDR------RW-ESVYR -DQYQY------DRTFTYCCS-PNDTHACRIRAFVRNNVMMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKR----------WAD----------DG -FPELT-PENKTKYMFDNRGNDELLRASWDEAFTYASKGIIHITKKYSGPEGAQKL-IDQG -YPKEMVDRM------QGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-CLAIVDAHNRGVGP -DQALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLLIQTGKNLIENKMPEAH -WVTEVMERGGKIVVITPEYSPSAQKADYWIPIRNN-TDTALFLGITKILIDNKWY----D -------ADYVKKFTDFPLLIRTDTLKRVSPKDIIPN---YK---------LQDISDG--- ---------------PSYHIQGLKDEQREII---------GDFVVWDAKSKG--PKAIT-- --------RDDVGETLVKKGI------D---------------------PVLEGSF----- -------------------------------------KLKTI-DGKEIEVMTLLEM----- ----YKIHLRD-YDIDSVV-----------------------------SMTNSPKDLIERL -AKDI-----------ATIKPVAIHYGEGVNHYFHAT-LMNRSYYLPVMLTGNVGYFGS-G ---SHTWAGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFKPNLDPYASAKDLNIKG -RAL------DEEVAYW-----NH---------------SERPLIVNTP-----KYGRKVF -TGKTHMPSP---TKVLWFTNVN-LINNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEITGSIEYADFAFPANSWVEFQEFEITNSCSN-PFIQI----WGKTGITPVY -ESKDDVKILAGMASKLGELL---------------------------------------- ----------------RDKRF--EDNWKF-------------------------AIEG--- --------------------------------RASVYINRLLDGSTTMKGYTCEDIL-NGK ------YGEPGVAMLLFRT----Y-PRHPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNAIVS- -TNPYIR---PDDYGIPENAEY---WEDRTVRNIKKSWEETKKTKNFLWEKGYHFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHIHPQAARDLGIEDGDYVYV -DANPADRPYEGWKPNDSFYKVSRLMLRAKYNPAYPYNCTMMKHSAWISSDKTVQAHETRP -DGRALSPS--GYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFIFGFEADNH -CIN-TVPKETLVKITKAE-NGGMGGKGVW---DPVKTGYTAGN--ENDFMKKFLNGELIK -VDA- ->NxrA_Candidatus_K_stuttgartiensis_CAJ72445 -----------------------------------------------MKLTRRAFLQVAGA -TGATLT--------LAKNAMA--FRLLKP--AVV-VDNPLDTYPDR------RW-ESVYR -DQYQY------DRTFTYCCS-PNDTHACRIRAFVRNNVMMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKR----------WAD----------DG -FPELT-PENKTKYMFDNRGNDELLRASWDEAFTYASKGIIHITKKYSGPEGAQKL-IDQG -YPKEMVDRM------QGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-CLAIVDAHNRGVGP -DQALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLLIQTGKNLIENKMPEAH -WVTEVMERGGKIVVITPEYSPSAQKADYWIPIRNN-TDTALFLGITKILIDNKWY----D -------ADYVKKFTDFPLLIRTDTLKRVSPKDIIPN---YK---------LQDISDG--- ---------------PSYHIQGLKDEQREII---------GDFVVWDAKSKG--PKAIT-- --------RDDVGETLVKKGI------D---------------------PVLEGSF----- -------------------------------------KLKTI-DGKEIEVMTLLEM----- ----YKIHLRD-YDIDSVV-----------------------------SMTNSPKDLIERL -AKDI-----------ATIKPVAIHYGEGVNHYFHAT-LMNRSYYLPVMLTGNVGYFGS-G ---SHTWAGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFKPNLDPYASAKDLNIKG -RAL------DEEVAYW-----NH---------------SERPLIVNTP-----KYGRKVF -TGKTHMPSP---TKVLWFTNVN-LINNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEITGSIEYADFAFPANSWVEFQEFEITNSCSN-PFIQI----WGKTGITPVY -ESKDDVKILAGMASKLGELL---------------------------------------- ----------------RDKRF--EDNWKF-------------------------AIEG--- --------------------------------RASVYINRLLDGSTTMKGYTCEDIL-NGK ------YGEPGVAMLLFRT----Y-PRHPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNAIVS- -TNPYIR---PDDYGIPENAEY---WEDRTVRNIKKSWEETKKTKNFLWEKGYHFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHIHPQAARDLGIEDGDYVYV -DANPADRPYEGWKPNDSFYKVSRLMLRAKYNPAYPYNCTMMKHSAWISSDKTVQAHETRP -DGRALS-P-SGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFIFGFEADNH -CIN-TVPKETLVKITKAE-NGGMGGKGVW---DPVKTGYTAGN--ENDFMKKFLNGELIK -VDA- ->OHB72803|Planctomycetes_bacterium_RBG_16_41_13 -----------------------------------------------MKLTRRAFLQVAGA -TGATLT--------LAKNAMA--FRLLKP--AVV-VDNPLDTYPDR------RW-ESVYR -DQYQY------DRTFTYCCS-PNDTHACRIRAFVRNNVMMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKR----------WAD----------DG -FPELT-PENKAKYMFDNRGNDELLRASWDEAFTYASKGILHITKKYSGPEGAQKL-IDQG -YPKEMVDRM------QGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-CLAIVDAHNRGVDP -DQALGGRNWTNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKIVVITPEYSPSSQKADYWIPIRNN-TDTALFLGITKILIDNKWY----D -------ADYVKKFTDFPLLVRTDTLKRVSPKDIIPN---YK---------LQDISEG--- ---------------PSYQIHGLKDEQREII---------GDFVVWDAKSKG--PKAIT-- --------RDDVGETLVKKGI------D---------------------PALEGSF----- -------------------------------------KLKTV-DGKEIEVMTLLEM----- ----YKIHLRD-YDIDSVV-----------------------------DMTNSPKDLIERL -AKDI-----------ATIKPVAIHYGEGVNHYFHAT-LMNRSYYLPVMLTGNVGYFGS-G ---SHTWAGNYKAANFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFKPNLDPYASAKDLNIKG -RAL------DEEVAYW-----NH---------------SERPLIVNTP-----KYGRKVF -TGKTHMPTP---TKIMWFTNVN-LINNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEITGSIEYADFAFPANSWVEFQEFEITTSCSN-PFIQI----WGKTGITPVY -ESKDDVKILAGMASKLGELL---------------------------------------- ----------------RDKRF--EDNWKF-------------------------AIEG--- --------------------------------RASVYINRLLDGSTTMKGYTCEDIL-NGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEVIEYGENFIVHREGPEATPYL--PNAIVS- -TNPYIR---PDDYGIPENAEH---WDDRTVRNIKKSWEETKKTKNFLWEKGYHFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHIHPQAARDLGIEDGDYVYV -DANPADRPYEGWKPNDAFYKVSRLMLRAKYNPAYPYNCTMMKHSAWISSDKTVQAHETRP -DGRALS-P-SGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -CIN-TVPKETLVKITKAE-NGGMGGKGVW---DPVKTGYTAGN--ENDFMKKFLNGELVK -VDA- ->WP_070066136|Brocadia_sapporoensis -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------IVNKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ERVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGSKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLLDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQGSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDVFSD---YK---------LEDISHG--- ---------------ASYKIQGLHDDQREII---------GDFVVWDAKTNG--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGIF----- -------------------------------------KVKTV-DGKEIEVMSLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIQRL -AHDI-----------AAIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYNGS-G ---SHTWAGNYKAANFQ-SAKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPSAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----RYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITNSCSN-PFVQI----W-KGGIRPVN -DSKDDVVIIAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIV-SGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTIRNIKKSWAETKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQVNINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYDVAMIKHSSWIATERTVKAHETRS -DGRALAAG-TGYQSSFRYGSQQSVT---RDWSMPMHQLDSLFHKSKIGMKFVFGFEGDNH -GIN-TVPKETLVKITKAE-DGGLGGKGLW---DPAKTGYTTGN--ENDFMKKYLSGELIK -IEKA ->RZV59451|Brocadia_sp_BROELEC01 -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------IANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ERVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLLDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQGSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDVFPD---YK---------LEDISHG--- ---------------ASYKIQGLHDDQREII---------GDFVVWDAKTNG--PKTIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGIF----- -------------------------------------KVKTV-DGKEIEVMSLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIQRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYSGS-G ---SHTWAGNYKAANFQ-SAKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPSAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----RYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEITGSIEYADFAFPANSWMEFETHEITNSCSN-PFVQI----W-KGGIRPVN -DSKDDVVIIAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIV-SGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQVNINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYDVAMIKHSSWIATERTVKAHETRS -DGRALAAG-TGYQSSFRYGSQQSVT---RDWSMPMHQLDSLFHKSKIGMKFVFGFEGDNH -GIN-TVPKETLVKITKAE-DGGLGGKGLW---DPAKTGYTTGN--ENDFMKKYLSGELIK -IEKA ->OHB44699|Planctomycetes_bacterium_GWE2_41_14 -----------------------------------------------MKLTRRTFLQIAGA -TGATFT--------IANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -DQYRY------DRTFTFVCS-PNDTHGCRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGALGIIGKYGMYRFNN-MLSLVDSHHRGVGA -DKALGGRNWSNYTWHGDQAPGHSFSHGLQASDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSSQKADYWIPIKCN-TDTALFLGVTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQPKDIFPD---YK---------LEDISHG--- ---------------ASYKIQGLHDDQREIV---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLVAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEVEVMPLFEM----- ----YKIHLRD-YDIDTVV-----------------------------EITNSPKELIQRL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LMNRSTYLPLMLTGNVGYNGS-G ---SHTWAGNYKAGNFQ-SAKWCGPGFY--------------------------------- -------------------------------GYVAE-----DAFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LINNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEVTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMVLAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYINRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGVPENAEH---WDERTIRNIKKSWSDTKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYGVTMIKHSSWIATERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKITKAE-DGGIGGKGVW---DPVKTGYTTGN--ENDFMKKYLNGELIK -VEKA ->WP_052562588|Brocadia_sinica -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------LANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGILHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKLHGLHDDQREII---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGTF----- -------------------------------------KVKTV-DGKEVEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIIRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYMGS-G ---SHTWAGNYKAGNFQ-SAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPDAPAMDLKIKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSNDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRAKYNSSYPYGVTMIKHSSWIATERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTTGN--ENDFMTKYLNGELIK -VEKA ->OOP57237|Brocadia_caroliniensis -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------VANKAMA--FRLLKP--AVE-VGNPLDAYPDR------TW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGSKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGLGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKIHGLHDDQREIL---------GDFVVWDAKTNG--PQPIT-- --------RDDVGDKLTAKGI------D---------------------PVLDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDVDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYMGS-G ---SHTWAGNYKAGNFQ-SAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFYQI----W-KGGIRPVN -DSKDDVMVIAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYINRLLDGSTTAKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGVPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYDVTMIKHSSWIATEKSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKVTKAE-DGGIGGKGLW---DPAKTGYTTGN--ENDFMKKYLNGELIK -VEKS ->RIK02127|Brocadia_sp -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------VANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDENLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDITHG--- ---------------PSYKLHGLHDDQREII---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLTAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDVDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYKGS-G ---SHTWAGNYKAGNFQ-AAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPSLDPTAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKVMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMVLAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYEVTMIKHSSWISTEKTVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKVCKAE-DGGIGGKGLW---DPAKTGYTTGN--ENDFMKKYLGGELIK -VEKA ->KKO18748|Brocadia_fulgida -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------VANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDENLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDITHG--- ---------------PSYKLHGLHDDQREII---------GDFVVWDAKTKG--PKPIT-- --------RDDVGDKLTAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDVDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYKGS-G ---SHTWAGNYKAGNFQ-AAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPTAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKVMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMVLAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYEVTMIKHSSWISTEKTVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKVCKAE-DGGIGGKGLW---DPAKTGYTTGN--ENDFMKKYLGGELIK -VEKA ->OQZ00558|Brocadia_sp_UTAMX2 -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------VANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDENLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDITHG--- ---------------PSYKLHGLHDDQREII---------GDFVVWDAKTKG--PKPIT-- --------RDDVGDKLTAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDVDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYKGS-G ---SHTWAGNYKAGNFQ-AAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPTAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKVMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMVLAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYEVTMIKHSSWISTEKTVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKVCKAE-DGGVGGKGLW---DPAKTGYTTGN--ENDFMKKYLGGELIK -VEKA ->TLD40744|Candidatus_Jettenia_ecosi ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------MLRCKYNPAYPYGVTMMKHSAWISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RNWSMPMHQLDSLFHKSKTSMKFIFGYEADNH -GIN-TTPKETLVKITKAE-DGGLGGKGLW---DPAKTGYTAGN--ENDFMKKYLSGELIK -VEKA ->TLD41279|Candidatus_Jettenia_ecosi ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------------------------MKHSACISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMKKYLSGELVK -MEKA ->WP_007220240|Jettenia_caeni -----------------------------------------------MKLTRRTFLQVTGA -TGATFT--------LANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -EQYRY------DRTFTYCCS-PNDTHACRVRAFVRNEVLMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGARKL-LDQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-SLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLVIQTGKNLIENKMPEAH -WLTQVFERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITRILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKIHGLHDDQREII---------GDFVVWDAKTKS--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LMNRSTYLPLMLTGNIGYPGS-G ---SHTWAGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPDAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSNDIEMTGSIEYADFAFPANSWAEFETHEITTSCSN-PFIQI----W-KGGIKPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDMRF--HDVWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTTKGYSFVDII-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQGYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPEDAEH---WDERTVRNIKKSWAETKKTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHMNPEAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMKKYLSGELIK -VEKA ->WP_007222969|Jettenia_caeni -----------------------------------------------MKLTRRTFLQVTGA -TGATFT--------LANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -EQYRY------DRTFTYCCS-PNDTHACRVRAFVRNEVLMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGARKL-LDQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-SLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLVIQTGKNLIENKMPEAH -WLTQVFERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITRILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKIHGLHDDQREII---------GDFVVWDAKTKS--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYPGS-G ---SHTWSGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPDAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSNDIEMTGSIEYADFAFPANSWAEFETHEITTSCSN-PFIQI----W-KGGIKPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDMRF--HDVWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTTKGYSFVDII-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQGYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPEDAEH---WDERTVRNIKKSWAETKKTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHMNPEAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RNWSMPMHQLDNLFHKSKTSMKFVFGYEADNH -GIN-TTPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMKKYLNGELIK -VEKA ->NxrA_planctomycete_KSU_1_ZP_10101005 -----------------------------------------------MKLTRRTFLQVTGA -TGATFT--------LANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -EQYRY------DRTFTYCCS-PNDTHACRVRAFVRNEVLMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGARKL-LDQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-SLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLVIQTGKNLIENKMPEAH -WLTQVFERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITRILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKIHGLHDDQREII---------GDFVVWDAKTKS--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYPGS-G ---SHTWSGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPDAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSNDIEMTGSIEYADFAFPANSWAEFETHEITTSCSN-PFIQI----W-KGGIKPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDMRF--HDVWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTTKGYSFVDII-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQGYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPEDAEH---WDERTVRNIKKSWAETKKTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHMNPEAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RNWSMPMHQLDNLFHKSKTSMKFVFGYEADNH -GIN-TTPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMKKYLNGELIK -VEKA ->WP_052561322|Brocadia_sinica -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------LTSKAMA--FRLLKP--AVE-VGNPLDVYPDR------AW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITRKYSGEEGAKKL-IGQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-TLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRADTLKRLQAKDIFPD---YK---------PEDISHG--- ---------------PSYKIHGLHDDQREMI---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGTF----- -------------------------------------EVKTV-GGKVIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPRELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNVGYKGS-G ---SHTWSGNYKAGNFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVSE-----DVFNPNLDPYAPATDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDLRF--RDYWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTLKGYTFEDIV-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNVIAS- -TNPYIR---PDDYGIPEGAEH---WDERTVRNIKKSWGEVKLTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHESRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TTPKETLVKITKAE-DGGMGGKGLW---EPAKTGYTPGN--ENDFMRRYLNGELIK -IEKE ->KXK29028|Brocadia_sinica -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------LTSKAMA--FRLLKP--AVE-VGNPLDVYPDR------AW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWIYAAKGIIHITRKYSGEEGAKKL-IGQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-TLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------PEDISHG--- ---------------PSYKIHGLHDDQREMI---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGTF----- -------------------------------------EVKTV-GGKVIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPRELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNVGYKGS-G ---SHTWSGNYKAGNFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVSE-----DVFNPNLDPYAPATDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDLRF--RDYWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTLKGYTFEDIV-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNVIAS- -TNPYIR---PDDYGIPEGAEH---WDERTVRNIKKSWGEVKLTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHESRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TTPKETLVKITKAE-DGGMGGKGLW---EPAKTGYTPGN--ENDFMRRYLNGELIK -IEKE ->OOP55454|Brocadia_caroliniensis -----------------------------------------------MKLTRRTFLQVAGA -TGATFS--------LADKTMA--FRLLKP--AVE-VGNPLDAYPDR------TW-ESVYR -DQYRY------DRSFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGFTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-TLALVDSHNRGLGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGLTRILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISQG--- ---------------PSFKMHGLHDDQRETI---------GDFVVWDAKTNG--PSPIT-- --------RDDVGDKLTAKGI------D---------------------PVLDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPRELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYKGS-G ---SHTWSGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPYAPATDLKVRG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKVMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEVTGSIEYADFAFPANSWAEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DSRDDVMILAGMAAKLGDLL---------------------------------------- ----------------RDMRF--RDYWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTLKGYTFDAIV-NGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATPYL--PNVIAS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAEVKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHINPQAAMDMGINDGDYVYV -DANPADRPYEGWKPSDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHESRP -DGRALSAD-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFIFGYEADNH -GIN-TTPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMRRYLSGELIK -IEKA ->KKO18624|Brocadia_fulgida -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------LADKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVLMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRRGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDEAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-TLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSAQKADYWIPVRCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDVFLN---YQ---------LEDISQG--- ---------------ASFKIHGLHDDQREII---------GDFVVWDTKTNS--PKPIT-- --------RDDVGDKLVGKGI------D---------------------PALDGTF----- -------------------------------------MVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNVGYKGS-G ---SHTWSGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEVTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DTKDDVMILAGMATKLGELL---------------------------------------- ----------------RDMRF--RDYWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIV-NGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRMQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDNYGIPESAEH---WDERTVRNIKKSWSDTKQTRNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRAKYNPSYPYGVTMMKHSAWISTERSVKAHESRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFIFGYEADNH -GIN-TTPKETLVKITKAE-DGGMGGKGVW---DPAKTGYTAGN--ENDFMKRYLNGELIK -IEKA ->WP_070067449|Brocadia_sapporoensis ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------------RGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGITKILMDEKLY----D -------ADYVKKFTDFPMLVRTDTLKRLQAKDIFPN---YQ---------LEDISQG--- ---------------VSYKIHGLHDDQREII---------GDFVVWDTKTNG--PKAIT-- --------RDDVGDKLVAKDI------D---------------------PALDGIF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYKGS-G ---SHTWSGNYKAANFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLRNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DTKDDVAILAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIM-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNVIVS- -TNPHIR---PDDYGIPENAEH---WDERTVRNIKKSWSDTKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQVNINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRAKYNSSYPYGVTMMKHSAWISTEKSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TVPKETLVKITKAE-DGGMGGKGLW---DPAKTGYTTGN--ENDFMKKYLNGELIK -IEKA ->RZV56287|Brocadia_sp_BROELEC01 -----------------------------------------------MKLTRRTFLQVTGA -AGATFT--------IANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRAFKGRGGMGLLGVIGKYGMYRFNN-MLSLLDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGITRILMDEKLY----D -------ADYVKKFTDFPMLVRTDTLKRLQAKDIFPN---YQ---------LEDISQG--- ---------------VSYKIHGLHDDQREII---------GDFVVWDTKTKG--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PALDGIF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYKGS-G ---SHTWSGNYKAANFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DTKDDVAILAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIM-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATPYL--PNVIVS- -TNPHIR---PDDYGIPESAEH---WDERTIRNIKKSWSDTKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQVNINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRAKYNSSYPYGVTMMKHSAWISTEKSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TVPKETLVKITKAE-DGGMGGKGLW---DPAKTGYTTGN--ENDFMKKYLNGELIK -IEKA ->OQZ04816|Brocadia_sp_UTAMX1 -----------------------------------------------MKLTRRTFLQVTGA -AGATFT--------IANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRAFKGRGGMGLLGVIGKYGMYRFNN-MLSLLDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLVENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGITKILMDEKLY----D -------ADYVKKFTDFPMLVRTDTLKRLQAKDIFPN---YQ---------LEDISQG--- ---------------VSYKIHGLHDDQREII---------GDFVVWDTKTKG--PKAIT-- --------RDDVGDKLVVKGI------D---------------------PALDGIF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYKGS-G ---SHTWSGNYKAANFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DTKDDVAILAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIM-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATPYL--PNVIVS- -TNPHIR---PDDYGIPENAEH---WDERTVRNIKKSWSDTKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRVKYNSSYPYGVTMMKHSAWISTEKSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TVPKETLVKITKAE-DGGMGGKGLW---DPAKTGYTTGN--ENDFMKKYLNGELIK -IEKA ->KRT68888|NC10_bacterium_CSP1_5 -----------------------------------------------MEITRRTFLKAAAT -GATAF---------LADDAWA--LRLLQP--AVE-VGNPLSEYPDR------GW-ERIYR -DQYGY------DRTFTFVCS-PNDTHACRLRAYVRNGVVMRIEQNYDVSRYADLYGNKAT -PHWNPRGCLKGYTLHRRVYGPYRVKYPLVRKGWKR----------WAD----------DG -FPDLT-PANKTKYRFDSRGTDELMRISWDDAYSYIAKGMIQIARRYSGEEGVRRL-REQG -YPEEMIRET------HGAGTRTFKCRGGMGLLGVIGKYGMYRFAN-TLALLDVHVRGVGP -DQALGGRTWSNYTWHGDQAPGHPYSHGLQGSDVDLNDFRFSKLHIQCGKNLIENKMPESH -FFNELMERGAKIVVITPEYSPPAAKADYWIPIRPN-TDTALFLGLTKILMEERHY----D -------AAFVKRFTDFPLLVRTDTLKRLRAHEVFPG---YR----------GRLPEN--- --------------GPSFTIQGLTKEQYEKL---------GDFVVFDAKSQS--LKPLT-- --------REDVGDRLAQQGT------D---------------------PTLDWQG----- -------------------------------------KVKLA-DGTEVEAMTLWAM----- ----YTIHLKD-YDLDTVH-----------------------------EITHSPKELIQRL -ARDI-----------ATIKPVAIHIGEGINHWFHAT-LSNRAFYLPLMLTGNIGVPGA-G ---SHTWAGNYKAALFQ-GSSWSGPGFK--------------------------------- -------------------------------GWVAE-----DPFNPNLDPNAPGQAVKVKG -YTK------DEEPAYW-----NH---------------GDLPLIVNTP-----KYGRKVF -TGLTHMPTP---TKVMFFNNVN-LINNAKHVYE----------------MLKNVN--PRV -EMIISVDIEMTASIEYADFALPANSWMEFQTPEITASCSN-PFLQI----W-KGGIKPLY -DSKDDVTILAELAQKLGAIV---------------------------------------- ----------------NDHRF--AAYWRF-------------------------ALEG--- --------------------------------RPEVYIQKLLDTSSTTAGYRVDEIM-AGK ------YGEPGACLMLFRT----Y-PRVPFW----EQVHDSD--PFYTDT----------- --------------------GRLHAYCDIPEAIEYGENFIVQREGPEATPYL--PNVIVS- -TNPYIR---PEDYGISPDAMH---WDERTVRNIKMAWADAKRTTNPLWEKGYRFFFLTPK -TRHRVHSQWSVCDWNQIWDSNFGDPYRMDKRMPGVGDHQLHMNPQAAKDLGINDGDYVYL -DANPADRPYIGWKPSDPFYRVSRCMVRVRYNPAYPYQVVMMKHAPYIATERTVKAHETRP -DGLALSE--TGYQANLRYGSQQSLT---RNWHMPMHQTDTLFHKAKATMSFLFGGEADNH -ALN-TVPKETLVKVTKAE-DGGMRGKGIW---EPARTGFTPGN--ESDFMKRYLAGEIVQ -IKKR ->OGW90704|PVC_group_Omnitrophica_bacterium_RIFCSPHIGHO2_02_FULL_63_14 ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------MIWDSNFGDPYRMDKRTPWVGENQLHINPQAGKALGINDGDYVYV -DANPADRPYIGAKPEDPFYKVARLMLRAKYNSAYPYHIVMMKHAPNIATERSVKAHETRP -DKRALS-E-LGYQSNFRYGSQQSIT---RNWHMPMHQTDSLFHKAKVFMGFLFGGEADNH -AVN-TVPKETLVRVTKAE-DGGLGGKGVW---APATTGYTPGA--ESEAMRKYIDGGFVS -T--- ->OGW87506|PVC_group_Omnitrophica_bacterium_RIFCSPLOWO2_01_FULL_45_10b -----------------------------------------------MNESRRDFLKISAV -TAVTLA--------LSNKPFL--LWALEP--VAN-VENPLAYYPNR------DW-EKIYR -DQYRY------DRTFSWVCS-PNDTHACRALAYVRNGIIIRSGSEYNYETYGDLYGNKAT -QNWNPRQCAKGFTFHRLMYGPYRLKYPLVRRGWRE----------WAD----------AG -FPDLT-PENKTKYKFDSRGTDQLEKATWDEAYTYIANGIMSIAKRYSGVEGKRKL-LAEG -YPEEMLAPM------KGAGTRTMKFRGGMGLLGVFGKYGMYRLAN-TMALLDVNIRGVSE -EGAMGGRAWSNYTWHGDQAPGHPWVHGLQNADCDFNDLRFSKLIIQDGKNLVENKLTDSH -WFIECMERGAKLVTISPEYSPPASKSDYWIPIRPQ-TDAALFLGITRLMIDQGWY----D -------KEFVAQFTDFPLLVRTDNLKRLRAADIFPD---YK---------LGLSKNG--- ---------------PSFKYQGLKQEQYEKL---------GDFVVWDETKGA--PVAIT-- --------RDDVGKNLSKKGI------N---------------------PALEGSY----- -------------------------------------KVKTV-DGKEIEVTTLFSL----- ----YKIHLRD-YDLDSVV-----------------------------EITKAPKDLIEQL -AKDI-----------AAIKPVAIHQGEGINHWFHAT-EMNRAAYLPLMLTGNIGQKGA-G ---AFGWAGNYKAALFQ-GSAWTGPGFK--------------------------------- -------------------------------GWVAE-----DPFHPNLDPQTPGKAINAHA -YFR------DEEPAYW-----NH---------------GDRALIVDTP-----AEGKKVF -TGSTHMPTP---TKAMLFTNVN-LINNAKHTYD----------------MLKNVN--PNV -EMILSIDIQMTASIEYADIALPANTWMESEGLEVTASCSN-PFLQI----W-KGGIPPIF -DSKDDLVILSEIAAKLGDLT---------------------------------------- ----------------GDARF--RDYWKF-------------------------ALEG--- --------------------------------KREVYIQRLLDSSTTTTGYKLDDIM-KGK ------YGPPGGALMLFRT----Y-PRIPFW----EQVHEDQ--PFYTDH----------- --------------------GRLQAYTDVPEAIEYGENFIVHREGPEATPYL--PNVIVS- -SNPYIR---PKDYGIPLDAEH---WDERTIRNVKLPWSEVKNTKNFLWEKGFQFFCLTPK -SRHRVHSLWSNVDWHQIWDSNFGDPYRMDKRTPGVGEQQIHLNPQAAKDLGINDGDYVYV -DANPADRPYRGAKPGDPFYKVARLMLRAKYNSAYPYHVAMMKHGTYIATEKSVKAHETRA -DKRALSEG-GAYQANFRYGSQQSVT---RNWHMPMHQTDTLFHKAKVFMSFIFGGEADNH -AVN-TVPKETLVRISKAE-DGGLGGKGLW---EPVKTGYTPAH--ENDVMKQYLHGGFIK -T--- ->KRT77589|Armatimonadetes_bacterium_CSP1_3 ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------MDFNELRHARLHIQVGKNLIENKMPESH -FFNELMERGAKIAVITPEYSPPAAKADYWMPIRPQ-TDAALFLGITRLMMDRRWY----D -------EAFVKQFTDFPLLIRKDTLKRLRAAEVFPG---YK----------PGLDPD--- --------------GPSFKRHNLKLDQYEKL---------GDFVVFDRKTRK--LQAIT-- --------RDQVGERLAQAGL------D---------------------PDLRWRG----- -------------------------------------KVKLI-DGREVECLTLWEA----- ----HRDHLRD-YDLDTVA-----------------------------EITQTPRAMIERL -ARDI-----------ATIKPVSIHIGEGINHWFHAT-LANRAFYLPLMLTGNIGKPGA-G ---CHTWAGNYKAGIFQ-GSPWTGPGIT--------------------------------- -------------------------------GWLFE-----DPFHAALDPATSGTEIKVKK -YLK------DEEPAYW-----DH---------------GDVPLIVNTP-----KAGRRVF -TGTTHMPTP---TKVMWYNNVN-IINNAKWAYG----------------VIKHVN--PNV -ELIINQDIEMTASAEYADIILPANSWVEFETPELTASCSN-PFLQI----W-KGGIKPLF -DTKDDGVIIAEVAAQLTAQT---------------------------------------- ----------------GDRRF--RDYFKY-------------------------LLER--- --------------------------------RPEVYIQRILDSSTSTVGYRVADVV-NGK ------YGEPGAALMLFRT----Y-PRIPFY----EQVHDSE--PFYTDT----------- --------------------GRLNSYCDIPEAIEYGENFIVHREGPEATPYL--PNVIVT- -TNPLVR---PEDYGIPLDALH---WDQRTVRNVKLAWRDVKKTKNPLWEQGYRFYLLTPK -TRHRVHSSWSTVDWNMIWDSNFGDPYRLDKRAPGVGEHQLHIHPQAARDLGINDGDYVYV -DAYAADRPYIGWKPSDPFYRVARCMVRVRFNPAYPYSVLMMKHAPFMATEKSVRAHETRP -DKLARSAD-TGYQANLRYGSQQSVT---RDWLMPMHQTDTLFHKSKGTMAFIFGGEADNH -AVN-TVPKETLVKITKAE-DGGIGGKGLW---EPARTGFSPGR--EGDFMKRYLAGTLVK -VTKR ->OUC07869|Chloroflexi_Litorilinea_aerophila ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------EITASCSN-PFLQI----W-KGGIPPLY -NTRDDARILAEVSAALADEI---------------------------------------- ----------------GEPRL--RDYWRF-------------------------ILEG--- --------------------------------RPEIYIQRLLDSSLTTSGYRVEDII-AGK ------YGEPGAALMLFRT----Y-PRIPFW----EQIHDSV--PFYTDT----------- --------------------GRLNSYCDIPEAIEYGENIISHREGPEATPYL--PNVIVT- -RSRFVR---PEDYGIPADHMG---WEERTVRNIALPWNQVKETKNPLWAQGFHFYCLTPK -TRHRVHSSWSTVDWTIILDSNFGDPYRADKRLPGPGDHQLHMNPQAAKDLGIEDGDYVYV -DANPADRPYIGWKPDDPFYKVARLMLRVKYNPAYPYHIVMLKHGPFMATEKSVKAHETRP -DGLAKSEG-TGYMANLRYGSQQSVT---RDWSMPMHQTDTLFHKQKTGMQFIFGGEADNH -ALN-TVPKETLVRIVKAE-DGGLDGKGPW---EPTKTGYTPAH--ENEFMLRYLAGETIE -VTT- ->RCK74665|Chloroflexi_Anaerolineae_bacterium ----------------------------------------------MSHLSRREFLKLSSV -AALGTV--------INDLD----WKLLDP---IQ-VDNPLAAYPSR------DW-EAVYR -NQYRY------DSSFTFVCS-PNDTHACRLRAFVRNGIILRAEQNYDVERYSDLFGNTAT -AHWHPRGCKKGQTFHRRLYGPHRLKGPLMRKGWKE----------WAD----------AG -FPELD-EENKTKYKFNARGQDELLPVSWETAYDYIARGMIAIARRYSGEEGARLL-RKQG -YPEEMIQAM------SGAGTRTFKCRGGMGLLGVIGKYGMYRFAN-MLALLDVHVRNVPP -EEAKGGRTWSNYTWHGDQAPGIPFVTGLQASDEDLNDLRNSRLHIQCGKNLVENKMAESH -FFIEAMERGAKIVTITPEYSPPATKSDYWIPIRPA-TDTALFLGLARWIIENQKY----D -------EQFVKRFTDFPTLVRADTLKRLRADEVFSN---YQ---------PGLDPQG--- ---------------ASFTLQGLKPEQYEKL---------GDYVVINEKTGR--PQAIT-- --------RDQVGEVMDKAGI------Q---------------------PLLDWKG----- -------------------------------------KLRLV-DGSEVEVLTVWSM----- ----YLEHLKD-YDLETVL-----------------------------EITHVPKDLFLRL -AEDI-----------TTLSPVALHIGEGINHWFHAT-LANRAQFLPLMLTGNIGKPGA-G ---LYTWAGNYKAALFQ-GSAQSGPGFK--------------------------------- -------------------------------GWVGE-----DPFAPNLDENASGKEIKVHA -YTK------DEEPAYW-----NH---------------SERPLIVDTP-----KYGRKVF -TGQTHMPTP---TKVQFFTNVN-LLNNAKHHYE----------------MIKNVN--PNV -ELIISVDIEMTSTVEYADFALAANTWAEFETYEITASCSN-PFLQI----W-KGGIPPLY -DSRDDARILGELAARLGELL---------------------------------------- ----------------EDNRF--RDYWKF-------------------------ILEG--- --------------------------------RPEVYIQRLLDSSITTSGYRFTDII-EGK ------YGEPGAALMLFRT----Y-PRIPFW----EQIHDSI--PFYTDT----------- --------------------GRMNTYCDIPEAIEYGENLISHRESPEATPYL--PNVIVT- -SSRFVR---PEDYGIPPDATG---WEERTVRNLKMPWSEVKNTRNFLWEAGYHFYCLTPK -TRHRVHSSWSTVDWTLILDSNFSDPYRVDRRQPGVGEHQLHINPQAAKDLGLEDGDYVYV -DANPADRPYIGWKAEDPFYRVARLMLRVKYNPAYPYHIVMLKHGPFMATEKSVLAHETRP -DGLARSAD-TGYQANLRYGSQQSIT---RDWSMPMHQTDSLFHKQKTAMQFIFGGEADNH -ALN-TVPKETLVRIVKAE-DGGIEGKGIW---EPAKSGYTPAH--ENEFMSLYLQGKTIE -IKR- ->GCA_001803565_00046|MHDQ01000004unannotatedprotein --------------------------------------------MSFDRVSRRQFLETLAA -TATAAL--------VSKPAIGLALEKLQP--IPE-IKNPLEHYPPR------EW-EKIYR -DIYNP------DSSYIFACT-PNDTHNCYLRAYIKNGIVTRIGPSQRYRDATDIYETKAS -ARWDPRICNKGVAMVGRFYGDRRVKYPTVRKGFKE----------WVE----------KG -FPRD--ENGQPPLKYFKRGEDQWEKVSWDEAYTIVAQSMIDTVKTYSGTKGAELL-QKQG -YDAKMIEKM------MGAGTQAMKFRGGMPLLGVIKLFGLYRMAN-SMALLDSYIRGVGP -DKAIGGIGFDNYSWHTDLPPGHPMVTGQQTIDFDLVNAEYANIILCWGMNWICTKMPDGH -WLSEARLKGAKVVTITTDYNSTSSKADEIVIIRPG-TDPAFALGLAQVIINERLY----D -------EEFVEGFTDLPFLVRMDTRELLRAHEIISG---YN---------NAELKYT--- -RVIKKEEKPPPPFATNLGMPAVSSDMRQEW---------GDFVVWDSNAKK--ATPVS-- --------RDDTGERFTNKGV------K---------------------PALEGEF----- -------------------------------------EISLT-NGEKIKVRPIFDI----- ----IKQHLEDTWNVDSTS-----------------------------KITWAPKEAIINL -AREI----------AANKEKVLFTVGMGPNQLFNAD-QKDRAIFLVAALTRNVGFFGG-N ---VGSYAGNYRAALFN--------GMP--------------------------------- -------------------------------QYIAE-----DPFNIILDPTKPA---KVKP -YFK------MQSAHFY-----AH---------------GDTPLKVHDI----------YF -NGETHMPTP---TKFFWFAASNSILGNSKGMYD----------------VVMNLLRNRKI -EAVVVNEWWWSASCEYADVVLPADSWGEYNVHDMTASVTN-PFVMV----MPLTGVSRIW -DTKSDSETYAGVSEKLGELT---------------------------------------- ----------------GDSRF--KDYWRF-------------------------IADG--- --------------------------------KAKPYLQRIIDHSNTMKGYQIDNLISKAK ------DGIP--ALLMSRT----Y-PKFIGY----DQSVESA--PWYNKT----------- --------------------GRLEFYREEPEFLDYGENLPVHREPVDATFYE--PNVIVAK -GHPLIKPKTPTDYGWPMDDLS---GETRQVRNVVYTPDELLNTKHPLRKEGFTHIYLTPK -FRHAVHTFGVDLDLLSIWFGPFGDMYRRDKRKPWVNEGYVEINPDDARELGIEDGDYIWV -DPDPKDRPFKGWQDKPADYKVARCLLRARYHPNLPKGITRTWFNMYQATHGSVRGHESRK -DGLARNPD-TNYQSMYRYGGHQSST---RSWLRPTLLTDTLVRKNLMGQMIGKGFEPDVH -CAN-GAPRESFVKFTRAE-DGGESGKGKW---RPAVLGFRTGY--ENVAMKKYIKGGFIS -KGGK ->SPS06998|Nitrotoga_fabula ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRLGFKA----------WCD----------AG -YPRTG-ANGFPDPKFLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGVKTMKFRSGMAALGVLRIYTLKRFAQ-GLALLDAYVRNVGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMAYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGAHIVDISIDYHATANKADDVIILRPG-TDPALGLGVCHYLIKHNYY----D -------EDYLRANTDMPLLVRTDNWKNLKASDIIPN---YE---------LAELTHH--L -KVMKPGEKPTQPVAFQ-ATAFVAEDVRKFW---------GDNVVWDLNTNK--AVPLT-- --------RDECGARYAAKGV------K---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTPENTS-----------------------------IMTGVPVEAIVDL -SNLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLAALTDNVGHVGGCS ---YGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QFLME-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPMRRVQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADFFKF-----------------VGTNPAGNPSDR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENITVYRTPIDSSHYE--PNVIVGH -CRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRIYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ENKQMRTYLQGAFTR -R--- ->SPS06751|Nitrotoga_fabula ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRLGFKA----------WCD----------AG -YPRTG-ANGFPDPKFLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGVKTMKFRSGMAALGVLRIYTLKRFAQ-GLALLDAYVRNVGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMAYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGAHIVDISIDYHATANKADDVIILRPG-TDPALGLGVCHYLIKHNYY----D -------EDYLRANTDMPLLVRTDNWKNLKASDIIPN---YE---------LAELTHH--L -KVMKPGEKPTQPVAFQ-ATAFVAEDVRKFW---------GDNVVWDLNTNK--AVPLT-- --------RDECGARYAAKGV------K---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTPENTS-----------------------------IMTGVPVEAIVDL -SNLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLAALTDNVGHVGGCS ---YGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QFLME-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPMRRVQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADFFKF-----------------VGTNPAGNPSDR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENITVYRTPIDSSHYE--PNVIVGH -CRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRIYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ENKQMRTYLQGAFTR -R--- ->RFC37636|Nitrotoga_sp_CP45 ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAD----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSMKRFAQ-GLALLDAYVRNIGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATSNKADDVIILRPG-TDPALGLGVCHLLIKNNHY----D -------ENYLRANTDLPLLIRTDNWKNLKASDIIAD---YK---------LADLTHH--L -KVMKPGEHPTMPPAFQ-ATAFVAEDVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTAENTS-----------------------------IMTGVPVEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATNHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GSPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLKGGFIS -R--- ->RFC33776|Nitrotoga_sp_LAW ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAD----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSMKRFAQ-GLALLDAYVRNVGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATSNKADDVIILRPG-TDPALGLGVCHLLIKNNHY----D -------ENYLRANTDLPLLIRTDNWKNLKASDIIAD---YK---------LADLTHH--L -KVMKPGEHPTMPPAFQ-ATAFVAEDVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTAENTS-----------------------------IMTGVPVEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NF---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATNHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLKGGFIS -R--- ->RFC30723|Nitrotoga_sp_MKT ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAD----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSMKRFAQ-GLALLDAYVRNVGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATSNKADDVIILRPG-TDPALGLGVCHLLIKNNHY----D -------ENYLRANTDLPLLIRTDNWKNLKASDIIAD---YK---------LADLTHH--L -KVMKPGEHPTMPPAFQ-STAFVAEDVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTPENTS-----------------------------IMTGVPVEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NF---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATNHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLKGGFIS -R--- ->RFC31618|Nitrotoga_sp_SPKER --------------------------------------------------------KLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAE----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSLKRFAQ-GLALLDAYVRNIGA -DEASGAKVLDSYSWHTDLAPGCPMVTGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATSNKADDVIILRPG-TDPALGLGVCHLLIKNNHY----D -------ENYLRANTDMPLLIRTDNWKNLKASDIIPD---YK---------LAELTHH--L -KVMKPGEGPTMPPAFQ-STAFVSEEVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGEY----- -------------------------------------EVTLV-DGKKIKVTPVFQL----- ----QKEYLEE-YTAENTS-----------------------------IMTGVPSEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KMAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTALT---------------------------------------- ----------------GDQRF--ADFFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--TIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGH -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GSPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLQGGFIS -R--- ->BBJ23760|Nitrotoga_sp_AM1 ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAE----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSLKRFSQ-GLALLDAYVRNIGP -DEASGAKVLDSYSWHTDLAPGCPMVTGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATANKADDVIIIRPG-TDPALGLGVCHLLIKNNQY----D -------ENYLRANTDMPLLIRTDNWKNLKASDIFPD---YK---------LAELTHH--L -KVMKPGENPTQPVAFQ-STAFVSEEVRKFW---------GDNVVWDRKTNK--AVPLT-- --------RDECGARYAAKGV------D---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVTTVFQL----- ----HKEYLEE-YTAENTS-----------------------------IMTGAPMEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTALT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGVP--TIFMART----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GSPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLQGGFIS -R--- ->BBJ23368|Nitrotoga_sp_AM1 ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAE----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSLKRFSQ-GLALLDAYVRNIGP -DEASGAKVLDSYSWHTDLAPGCPMVTGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATANKADDVIIIRPG-TDPALGLGVCHLLIKNNQY----D -------ENYLRANTDMPLLIRTDNWKNLKASDIFPD---YK---------LAELTHH--L -KVMKPGENPTQPVAFQ-STAFVSEEVRKFW---------GDNVVWDRKTNK--AVPLT-- --------RDECGARYAAKGV------D---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVTTVFQL----- ----HKEYLEE-YTAENTS-----------------------------IMTGAPMEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTALT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGVP--TIFMART----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GSPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLQGGFIS -R--- ->BBJ23476|Nitrotoga_sp_AM1 ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRAGFKA----------WVE----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYAGDKGAALL-TRQG -YDPEMIASM------HGCGCKVMKFRAGMAALGVLRIYSLKRFAQ-GLALLDAYVRNIGS -DEASGAKVMDSYSWHTDLAPGCPMVSGHQQLDYEFMAYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATANKADDVIIIRPG-TDPALGLGVCHLLIKNNQY----D -------ENYLRANTDMPLLIRTDNWKNLKASDIFPD---YK---------LAELTHH--L -KVMKPGEEPTQPVAFQ-ATAFVSEEVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGEY----- -------------------------------------EVTLV-DGKKIKVAPVFQL----- ----QKEYLEE-FTAENTS-----------------------------IMTGAPMEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTALT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGVP--TIFMART----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HVAAKGYRPTY--ESLQMRTYLQGGFIS -R--- ->blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1348658_11 rank: C; deu:DBW_2564 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------KEIGIVDNDWV-- ----------------EAYNDHGVTVTRAIVSARIPSGICILYHAPE-------------- ---RTISVPKSPMRGNKRAGGHNSPT---RVHLKPSLMVGGYGQ---------FTYSFNYW -GPT-GVNRDTFILVRKLP------GKPEF------------------------------- ----- ->CRI68048|Thiocapsa_sp_KS1 ------------------------------------------------------------- -------------------MSK--TKDDNG--NGG-SRWFRELDEPR------KW-EDFYR -RRWQY------DKSVRTSHS-VNCSGSCSWEVFVKNGMITWELQKTDWPQI-----NDET -PNYEPRGCQRGISASWYPYSPVRPKYPYVRAVLLDFWRAERAAGKDPI----------AA -WGAIVENPERSKAYRNARGKAGWRRTTWDEATEIIAAAKIYTIKEH-------------- ----------GADHLASFSPIPAMSMVSFLSGHRL-------------------------- -SNLLGGTMLSFYEWYHDLPHVMPMIWGDQTDVHESADWYQSAYWIVMGSNLPMTRTADAH -FASEHKYNGGKLVNLSPDYSDVTKFADLWVPVRPG-TDTAFILSCIHVILQEFHV----N -RRSEYFHSYVAQYTNLPFLVILD-----QEGDHFASGRFLR---------ASDVAAY--- ---------------------AD--EELADW----------KLPCFD-KEGE--LRLPGGT -LGFRWEEKNTGRWNLKNEDAVTAQPFD---------------------PLLTLMDGEFEE -VIVEYADFTHTFNVEFGTTALRGEKARKSLRGVPSRVLTKK-DGTK---VRVATA----- ----YDLLLAS-FGVNRGLSGSGYPKDYDDASEAYTPAWQE-------QETGVDRNLAIRV -AREW------ADTAEKTKGKCLFITGSGILHWYHGGSLTYRSEAVMGILTGCQGRNGG-G ---FAHYVGTEKIRNMA---AIGTIGNAADWGNVGRQQNSTSYFYFHTDQWR-YDGMSLDP -LWAPRAKEMPARANHAADMNAVAVRNGWLPFFPQF-----DERNPTDVMQDARKAGCKSL -EDVK-----TWVAQQF-----KE---------------RKLKFALPNVDAPK-NHPKVLW -IYRGNLIGT---SMRGHELNLKHMLGTHNNVLGGETRA----KDMVNEIDWTENAPLGKL -DLIYNVNLRMDSSANYSDIVLPTAHWYEKFDLTCTD--LH-SFLHP----F-TPAHDPAY -ESKHDWEAFRLIAEKISELAKVHLPDPIEDLVMTALSTDTPDEMAQPM---GELRDWWKG -ESEPIPGKTFPNVSVVTRDY--TKIHDMYTTLGPAVTKPNSYGAKGIKGDLAEVYEQMKE -SYLVGEKQGRPNMETAAKVCEVILRISPESDGELSY-----------QIFKNLEKR---- ------CGVPLAHIVEPER----E-TAYHYP-DLISQPRRALTSPHWSAIETKGRTYSPWT -LNIEALKPFHTLT------GRQEIYYDHRMFRDLGEDFPVYKPPVDMV--S--IGDVAQ- -------------------------KDIKMKGAKLFRF-------------------ITPH -QKWGIHSMFGDSWQMQNMFR---------------GGPTVWINDDDARDIGVKDNDWV-- ----------------EIFNENGIQVARAVVSHTVPRDMSIVYHQTERH-------VNVP- ---FSSLAR-ERGASDLRGGNNNATT---RIMMNPATMVGGYANWTYWLNYQGTS------ -----PSERDCVVLIRKKP-METRGRKVIY---QESQL--------NVGA----------- ----- ->NASQAN2011_330_B_bin.17_k121_430440_3 rank: A; amyy:YIM_22320 narG; Nitrate reductase alpha subunit; K00370 (db=kegg) -----------------------------------------------------MFHNASLG -HTATMGRTDDVPNGTEEALIK--FGRFFAGGEVSKDLLSVTKAGGR------EG-DVFYR -DRWSH------DKVVRSTHG-VNCTGSCSWKVYVKDGIITWETQQTDYPSVG-----PDS -PEYEPRGCPRGAAFSWYTYSPTRIRFPYIRSVLLE---------MYREAKGRL-GDSVLA -WADVVDNSENRQRYHRARGKGGLVRVSWSEVSEIIAAAHVHTIKKY----GPDRI-FGFS -PIPAMSMAS------HAAGARFISL----------------------------------- ----MGGSMLSFYDWYADLPVASPQVFGDQTDVPESADWFNASYLIMWGSNVPVTRTPDAH -FMTEARYKGQKVIAISPDYADNTKFADEWVAPHPG-TDGALGMAMGHVILKEFFV----D -KQVPRFQDYVKKFTDLPYLVSLRK----KDGSWVPDKFLVASD-------LGDVSEG--- -----SRFKTVVLDSSTGETFVPNGSLGHRY-------NDSSTGKWNLDLEGVDPLLSV-- --------YGKKGAVSAPVLM----------------------------PRFDQGQ----- -------------------------------------EVSES-GGVLARGVPVIEIAGKTV -TTVYDLMLAQ-YGVAREG--------LDGDWPEGYDDRSPYTPSWQEEITSVPAVQAIRI -AREF------AQNAIDSEGRSMILLGAGTNHWFHSD-TMYRTFLALVTLTGCQGVNGG-G ---WAHYVGQEKCRPVT---GWAQLAFGADWSRPARQMIGTAFWYVSTDQWRYDALGSDLL -------ATPLGEGRFKDMTAIDVIAQSARMGWMPS-----YPSLN-RNSLDLVDEAREKG -VDPA-----QHVINEL-----KS---------------GDLQFAIENPDAPE-NWPRVLT -VWRANILGS---SSKGNEYFLKHLLGTDNSVRA----NENEPDARPKDVKWHEDAPEGKL -DLLVSVDFRMTSTGLFGDILLPAATW--YEKHDLSSTDMH-PFVHA----F-TPAINPPW -ETKTDYEIFQMLGRQVSEQAKGHLGER-EDLVVVPLLHDTPDAMATPG---GVVLDWKKG -EVEPIPGVTMPKLVVVKRDY--SQIGEKMAALGPLIDTLGTNTKGVPVSVLPEIELL--- -------RHSNGVASTGVGAGRPSLARDVDACEAILALSGTTNGRVAVAGFRALEKR---- ------TGQKLTDLALDNE----G-KRITFA-DTQARPVPVITSPEWSGSEHGGRRYTAFA -INVERLKPWHTLT------GRQHFFIDHDWMSELGEQLPVFRPPLNMHRIF--GS----- -------------------------QGDGVAKEVTVRY-------------------LTPH -SKWSIHSEYQDNLFMLSLSR---------------GGQEIWMSVEDAEIIGVKDNEWI-- ----------------EAYNRNGVVVARACISHRMPSGTVFMYHAKD-------------- ---RVVDVP-LAETSGKRGGIHNSLT---RLVIKPTHLIGGYAQ---------LTFAFNYL -GPT-GNQRDEVTVIRRRS--------------------------QDVEY----------- ----- ->GCA_003453735_00577|DMNE01000186unannotatedprotein ------------------------------------------------------------- --------------------MG--------------WIKDIFDPKAR------LW-EEFYR -SRWQY------DKKVRSTHG-VNCTGGCSWEVYVKDGIITWEMQETDYPLLE-----PGL -PHYEPRGCQRGITFSWYIYSPLRIKYPYIRGVLLD---------LWRKAKSIH-TDTVAA -WESVVENEESRRSYQKARGKGGLRRTTWEEALEIIAASTIYTAKKY----GPDRV-IGFT -PIPAMSMLS------YASGTRFLQL----------------------------------- ----FGGVALSFYDWYADLPPASPEVWGEKTDVAESADWYNSKYIVAMGANLSMTRTPDVH -FVAEARNNGTKLVVLSPDFSQVSKYADWWLPVTAG-HDGAFWMAVDHVILKEFFV----D -RQVQYFSDYLKRYSDAPFLVEIE-----GGEGSLRAGRFLR---------ANTLSRY--R -DAENGEWKLLVFDGKAKEPRMPNGSVGFRW--------QERKGQWNLEM----------- --------KDGADDTIIQPLLSLFEDRD---------------------AAVSINF----- ---------------------TEFASGRTFKRAVPVKYLQTE-KGR----VLVATV----- ----FDLLMAQ-MGVGRGL--------EGDFAEDYNDAERPYTPAWQEQFTGVSRDTLVCF -AREW------AVTAEKTKGKCTIIVGSGVNHWYHSN-LNYRAGITALILCGCVGVNGG-G ---MNHYTGQEKVAPEA---SWKSIAFALDWIKPPRLQNTPSFHYVHSDQWRYAE------ --------PENGIKVLEYMHPMDVLVNAVRMGWLPF-----YPQFN-RNPIDLVREAEESG -AKS------EQEIIEWLVLQLKD---------------KKIRFAVEDPDAPE-NWPRVWY -IWRGNAILA---SMKGHEYVLKHYLGTSTNAVA-----DEIVSASIKEVHSKGSAPEGKL -DLVIDINFRMDTSALFSDIILPAATW--YEKDDLNTTDLH-SFIHP----L-SAAVPPCW -EAKNDWDIFKEIALKISQLAPAHFSEPFREIVATPLMHDTRQEISQPQ-----VKDWHKD -KCQAIPGKTMPKFSVVERDY--TNLFKQFISYGHKEKEEGMGERGIQWKIGDMYDEF--- --------MKGVPVEQWGGERYPSLSEARDAANVILHFAPETNGEIAYRGFKALEEI---- ------TGMPLSDLAERQR----S-VRTIFP-DLLDQPKRILTSPCWSGITNGGRAYAPYC -INVERLMPWRTLTGRQHXAGRQHFYLDHEGYISFGENLPTFKSRVLLQN----------- ----------SGDIG----------KSTAIEKSLVLNF-------------------LTPH -GKWHMHTTYYDNLLMLTLSR---------------GVEPFWLNSKDAEDIGVKDNDWV-- ----------------EVYNDNGVVVTRAVVSARTPAGVGIFYHAPERT------------ ----ISFPK-SPLRNMKRGGGTNSLT---RIRLKPVLMVGGYAQ---------FSYAFNYW -GPI-GPDRDTYAYVHKLD------GKPVF------------------------------- ----- ->sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_391728_1 rank: A; deu:DBW_2564 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ---------------MRGALLD-------------------------------LW-QEARR -QH-------------------------------------------------------PDD -PV--------------------------------------------------------AA -WASITDDPARRKRYQEARGKGGFRRVSWSEAQELIAAANLHTVKKY----GPDRL-VGFS -PIPAMSMIS------YAAGARFLQL----------------------------------- ----MGGLCLSFYDWYCDLPPASPEIWGEQTDVAESADWFHSKFIATVGSNVLMTRTPDAH -FLVEARHKGAKVVVFSPDFSQTSKVADEWIPINQG-SDTAFWMAVNHVILREFHA----E -RSVPYFQTYLRENTDAGFLVVMKA----DAQGNYRPGSLLR---------ASQLAET--Q -GEENAEWKSFVLD-TQGNLRVPVGQVGHRW--------QKSKGQWNIKQED--ARTGE-- --------AFEAALTLRDSAT----------------------------GAVKAVF----- ------------------DDFSEGRTDRVRVREVPVREVQTV-EGP----VYVTTV----- ----YDLHLAQ-HGVNRGF--------GGDWPTGYADDTHPFTPAWQEQYTGIKAETVINF -ARQW------ATTAEKSQGKCTVIIGAGVNHWYHNN-LIYRACINALIYCGCVGRNGG-G ---LNHYVGQEKLVPQA---SWGPIAFGTDWSAPPRLQNAPSFHYMHSDQWRYDRKFDEMC -------PVADKSHLMASGHTADKQALAVRSGWLPC-----YPQFTEHN-FKLVQEAEDRG -ADPV-----QHVVGRL-----KD---------------RSLKFAMEDVDNPA-CFPRVWY -IWRGNAIQA---SAKGHEYFLKHYLGTHHNSIA-----VEHAREDVKEVTWHDKLELGKM -DLIVDVNFRMDTSALYSDIVLPTASW--YEKDDLSSTDMH-SFIHP----L-QAAVPPCW -EAKSDWKIFRGIAEETSRMAQRYLPEPVKDFVCTPLMHDTPAEIAQPT-----VKDWAKG -ECEAIPGKTMPNMKVVERDY--TKIFQKYITLGRNFRNNGLGIHGTTYPVDDLYDAY--- --------LQDHPVEEVDGERYPSLRADRSVCEAILHFAAETNGELAYRAYEAESHK---- ------TGIDHTHLAAPTR----G-VRYNFA-DLCTQPRRSLTTPFWTGITNGSRTYSAYC -QNVEERIPWRTLT------GRQHLYFDHEAYVAYGEHLPTFKPRADLRTTR--DLDMTG- ----------------------------VESGALVLNY-------------------LTPH -GKWHIHSTFGDTLRMETLSR---------------GIEPFWMNEQDAGLLGIHDNDWI-- ----------------EVLNDHGTVVTRACVSARIPRGICFIYHATERT------------ ----IGNPK-SKHRGMRRAGGHNSLT---RARLKPLFMIGGYAQ---------FTYAFNYW -GPQ-GVNRDTFVVVKKLD-------KPEW------------------------------- ----- ->blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1581374_9 rank: A; deu:DBW_2564 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ---------------------------------MN-WIEEISNPHAR------QW-EEFYR -NRWQH------DRVVRSTHG-VNCTGSCSWMIYVKDGIVTWELQALDYPVLN-----NGL -PPYEPRGCQRGISFSWYQYSPIRVKHPYMRGVLMD---------LWRKAKETH-QDPVEA -WTAVVEDEAARKSFHQARGKGGFRRASWDEVTEIIAASTMYTIKKY----GPDRI-IGFS -PIPAMSMLS------YAGGSRLMQL----------------------------------- ----LGAVSMSFYDWYSDLPPASPETWGEQTDVAESADWFNSKYIVSVGSNMSMTRTPDVH -FAAEARHNGTKLVVFAPDFNQVAKYADWWVPVNAG-QDGAFWMAVNHVIMNEFHY----Q -NPTPYFLDYMKRYTDSPFLVELN-----EVDGKFVPGRMVR---------AGQVERT--K -DVENGEWKFLVWDELSNAPRMPQGSLGFRW--------QQQKGQWNLEPKD--G------ --------LDGSEIRPQLTFL---GATD---------------------EQLSVSF----- ---------------------AEFGEGKSFQRNIPVRTIETA-NGK----VAVATI----- ----YDLLMAQ-YGVGRGL--------EGDYPASYDDENLSYTPAWQERYTGIDRQTVIQF -AREW------ATTAEKTEGKCMIIIGAGVNHWYHNN-LIYRACIGALMLTGCVGRNGG-G ---LNHYVGQEKLAPAA---PWASIAFALDWQKPPRQMNSPSFHYINSDQWRYERTYTEPQ ---PVSRPDSESHRDMTQEHTLDANIRAVRMGWLPS-----YPQFN-VSSLEIIRKAEQAG -AKS------DAEIRQWVVNQLKS---------------GELKFAVQDPDAPE-NWPRLWF -IWRGNALNA---SAKGQEYFFKHYLGTHHQIIS-----EEVDKSHFNEVTYRDEAPEGKF -DLVVDINFRMDTSALYSDIVLPTASW--YEKDDLNSTDMH-SFIHP----L-QMAVPPSW -ESKSDWDIFKILAEKFSELAPTHFPEPVRDLVAMPLQHDTPAEMAQAH-----IRDWAKG -ECEPIPGVTMPNFIVTERDY--VNLGKRFVSLGPKVEKEGFAIHGIHMEVGDLYREL--- --------LKSKPTVTWNGQTYPSLTVARDAANIILNLAPETNGEVAYRAFKAEEER---- ------IGLKLTDLAEPTR----A-VRTDFK-DVVRQPRRLLNSPIWTGIMTDGRPYAAYT -LNVERLVPWRTLT------GRQHFYLDHEGYLAYGEHLPTYKPRPD-------------- ----------PLAFGDLEKSHS-------EGKTIQLNY-------------------LTPH -AKWHIHSNYFDNDRMLTLSR---------------GLEPLWISEKDAKEIGIVDNDWV-- ----------------EAYNDHGVTVTRAIVSARIPSGICILYH----------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->gunnisonriver_2019_sw_WHONDRS-S19S_0062_A_bin.22_Ga0451722_0001801_3 rank: A; htq:FRZ44_42870 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------ILDKLMF--FKAGTE--RFA-DGYGAVTEESR------AW-EDGYR -QRWQY------DKVVRSTHG-VNCTGSCGWQVYVKSGFVTWETQVLDYPLTR-----PDL -PNHEPRGCARGASASWYLYSSNRIKYPLMRRQLMD---------LWREARRRH-KDPVEA -WRSIVETPELARRYKQARGRGGFVRAEWDEANELIVASNTYTIKEY----GPDRV-VGFS -PIPAMSMVS------YSAGSRYLSL----------------------------------- ----LGGVCLSFYDWYCDLPPASPQTWGEQTDVPESADWYNSNFLIVWGSNVPQTRTPDAH -YFAEVRYKGTKTVVVTPDFSEAAKFADLWLDPKQG-TDAAMAMAMGHVILKEFHA----D -NPEPYFRDYCQQYSDLPFLVRL-----VKQGEHYVPERFVR---------ASDFADG-QG -QDNNPEWKTLGFDELTDELVVPNGSIGFRW---------GEDGRWNLEQKD--A------ --------RSGVAAKLRLSLL------EAPSEAPGPKSERSTQVANVAFPYFGGRH----- -----------------HEFFESSPQDEIQVRNVPARTLALK-DGE----YLVATV----- ----FDLMLAH-YGIDRGL---------GGVAASSYDDDVPYTPAWQERITGVSRDKVIAV -ARGF------ADNAAKTRGRSMVIIGTGVNQWFNND-MTYRAVINMLILCGTVGRSGG-G ---WAHYVGQEKLRPQP---GWQTLAFALDWSRPPRLMNGTSFWYAHTDQWRYEKVQASEL -------LSPTREQGDWDVSLIDYNVRSERMGWLPS-----APQLE-KNPLRLGREIHEQK -LDAP-----TAVAHQL-----ET---------------RTLRLSCEDPDNPR-NFPRNLF -VWRSNLLGS---SSKGHEYFLKHLVGAKHGVLG--ADLKELGERLPTEVDFHDEAPEGKL -DLLVTIDFRMSSNCMYSDIVLPTATW--YEKNDLSTTDMH-PFIHP----L-TGAVDPLW -ECKSDWEIFRGFAEKFSEVCEGHLGTE-YDVVLQPLQHDAPGELGQAL----GVVDWKKG -ECRAIPGKTMPNVQLVERDY--PATYKRFVSLGPLVNSLGMSTKGLKWDATEEVELL--- ------KEKNGEVAEAGVGHGRPRIQTDLHACETILALSPETNGRVAVKAWKALEVR---- ------TGRQHAHLAEGRA----A-ERITFD-DVVAQPRKVITSPTWSGAESEKVTYSAGY -INVEEQVPWRTLT------GRQQTYQDHPWMRAFGEHFPSYKPPIDTK--T--VGTLLR- -------------------------SQENGNPQLVLNF-------------------LTPH -QKWGIHSSFTDTQMMLTLSR---------------GGPNIWVSEQDARRLGISDNDWI-- ----------------EAYNSNGALVARAVVSQRIKAGCAFMYHSQD-------------- ---KTVNAP-GTETTGTR-GIHNSIS---RIVVKPTHMIGGYAH---------QSYGFNYY -GTV-GANRDDFVVIRKVR-----------------NLDFMDGTPVRILAPAVSVGGAE-- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001351_7 rank: A; ddz:DSYM_27970 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLKF--FERVQS--TFS-GGHGIVTNEDR------KW-EDAYR -NRWRH------DKIVRSTHG-VNCTGGCSWKIFVKNGLVAFEMQQTDYPRTR-----DDL -PNHEPRGCQRGASFSWYLYSPHRIKHPLVRGRLLD----------LYRAERKSGKDPVEA -WEAIQADPAKRIQYTAVRGLGGFVRTNWDEVTEIAAAANVYTIKKW----GPDRI-YGFS -PIPAMSMLS------YAAGSRYLSL----------------------------------- ----IGGACGSFYDWYCDLPAASPQTWGEQTDVPEAADWYNSTYLIICGANLPMTRTPDAH -FATEVRYKGAKVVSMAPDYAEFVKFADLWMPVKQG-TDSAAFLAMGHVALKEFHV----K -RQDPYFQEYIRKYTDLPMLVMLR-----KTDDGYASDRTLR---------ASDFTGN-LG -ESNNPEWKTIVYDEKTKSYVAPNGSVGFRW---------GEEGKWNLLPKNAANQEEILA -ELTCIDSRDDV----ASVGF----------------------------PHFNAGE----- --------------------------PGLLYRNVPVRKLKLA-SGEDVLVSSV-------- ----YDLQVAQ-YGIDRGL-------GGGNVTDSYEDDKVAYTPAWAEKVTGVKRADLIRT -GREF------AENASKTKGKSMVIMGAAINHWYHND-LSYRAIMNLLHMCGCVGQSGG-G ---WAHYVGQEKLRPQA---GWAPIAFATDWHRPPRHMNSTTFWYFQTDQWRYEKVSADGL -------LADNAKSKYKGYQLADYNVVSQRLGWLPS-----APHFN-KNPIDIVTEAEKAG -ATD------EASIAKHMVEQLKS---------------GKLYFASEDVDAPE-NFVRNLF -VWRSNLLGC---SAKGHEYFLKHLIGAQNGVLQ-----EGVEGRACKEIKWHENGPTAKL -DLMVDINFRLNSTGAYSDIILPTATW--YEKHDLNTTDMH-PFVHP----L-SEAVSPGW -ESKSDWQIFQNIAKAFSKLAEKHLGTK-KDVVALPMQHDSPFELAQAM----GVKDWKKG -ECEPIPGKTLPLLKVVSRDY--PNTLKKFQAIGPLLNKLGNNVKGIDWNTDQELNEL--- ------KSLNGEILEDGISKGMPSIAADIAACDAVLRMAPETNGEVAHKSWSALSKK---- ------TGIDHHHLYAGRH----E-DKITFR-DIQAQPRKIITAPTWSGIESETVSYTAGY -TNIHEHIPFRTLT------GRAQFYQDHEWMLDFGEGFCAFRPGLDMKAIEATPKSVLA- ------------------------------KPHLVLNW-------------------ITPH -SKWGIHSSYQDNLRMLNLFR---------------GGPYFWIAEDDAKSIGLEDNDWV-- ----------------EAVNGNGATVARVVVSQRVPRGMALMYHAQE-------------- ---KIVNVP-GSPTTGKRGGILNSVT---RVVVKPTNMVGGYAQ---------LSYGFNYY -GTV-GTQRDEFVVVHKIE-----DKDVDW-----LERPLTPER--EGKLNPPGVGPR--- ----- ->NASQAN2011_286_B_bin.1_k121_764018_13 rank: A; sdf:ACG33_10925 nitrate reductase alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ---------------MSNLLNR--LNFLKPAAVPFSDGHGATRDDDR------GW-EDAYR -QRWQY------DKIVRSTHG-VNCTGSCSWKVYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRVKYPLMRSALLK---------LWRE--ARKTLAPVDA -WGSIVQDQTKAKSYKSKRGMGGFVRVDWDEANELIAASNLYTTKTF----GPDRV-IGFS -PIPAMSMVS------YAAGARYLSL----------------------------------- ----LGGACLSFYDWYCDLPPASPQVWGEQTDVPESADWYNSRYIIAWGSNVPQTRTPDAH -FFTEARYNGTKTVSITPDYSEVAKLTDHWLHPKQG-TDAALAFAFGHVILREFHL----D -NPSEYFTDYCRQYSDMPMLVRLDP----RDDGSYATSRYLR---------ASDLDGA-LG -EANNPEWKTLAFDENSGGLVVPHGSVGFRW---------GEKGRWNIEERD--------- --------SQGRDTRLVLSLK------D-----------AHDGFVNVCFPYFGGVE----- -----------------HEGWTSSPREDILKRHIPTRKIMQA-DGSEVLVASV-------- ----YDLLLAQ-YGLDRGF--------GGEHVAGSFDDDVPGTPAWQERITGVPRAEVIEI -AREF------ARTADKTRGRSMIIVGAAMNHWYHND-MNYRGLINMLVMCGCIGQTGG-G ---WAHYVGQEKLRPQS---GWAPLAFGTDWVKPPRQMNGTSFFYFNSDQWRYEKLDVSEI -------ISPLADPKKYSGSLVDFNLRAVRMGWLPS-----APQLN-MNPLAFVRDAEAKG -LDPV-----KHAVDQF-----KS---------------GGLDFAYADPDAPE-NFPRNMF -IWRSNLFGS---SGKGHEYMLKHLLGTRHGLQG--KDLGQRGAVKPQDVKWRDEATEGKL -DLVVTLDFRMCTTALYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWDIFKGIARTVSALAPGVLGVE-KDLVLTPVLHDTPNELAMPF----GVTDWKKG -ECEAIPGKTMPSMTVVERDY--PNLYKKFTSLGPLLDKQGNGGKGMSWDTQDEVDFL--- ------TQLNHPVLAEGISKGRPQIESAIDACEVILHLAPETNGHVAVKAWESLGTF---- ------TGRDHTHLAVGKE----H-EAIRFR-DVQAQPRKIISSPIWSGLEDEHVSYNAGY -TNVHELIPWRTLT------GRQQFYMDHEWMLAFGEGFMGYRPPVNTKTIA--P--MLG- -------------------------AKPNGNKEIVLNW-------------------ITPH -QKWGIHSTYSDNLIMQTLSR---------------GGPIVWLSEDDAKRAGIEDNDWI-- ----------------ELFNVNGAIAARAVVSQRVMSGMAMMYHAQE-------------- ---RIINTP-GAEITGTRGGIHNSVT---RVVVKPTHMIGGYAQ---------FSYGFNYY -GTT-GTNRDEFVIVRKMD-------KVEWHDGEPVPNNVEVAR----------------- ----- ->NASQAN2011_286_F_bin.29_scaffold_54_27 rank: A; sdf:ACG33_10925 nitrate reductase alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ---------------MSNLLNR--LNFLKPAAVPFSDGHGATRDDDR------GW-EDAYR -QRWQY------DKIVRSTHG-VNCTGSCSWKVYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRVKYPLMRSALLK---------LWRE--ARKTLAPVDA -WGSIVQDQTKAKSYKSKRGMGGFVRVDWDEANELIAASNLYTTKTF----GPDRV-IGFS -PIPAMSMVS------YAAGARYLSL----------------------------------- ----LGGACLSFYDWYCDLPPASPQVWGEQTDVPESADWYNSRYIIAWGSNVPQTRTPDAH -FFTEARYNGTKTVSITPDYSEVAKLTDHWLHPKQG-TDAALAFAFGHVILREFHL----D -NPSEYFTDYCRQYSDMPMLVRLDP----RDDGSYATSRYLR---------ASDLDGA-LG -EANNPEWKTLAFDENSGGLVVPHGSVGFRW---------GEKGRWNIEERD--------- --------SQGRDTRLVLSLK------D--------AHDGFVNVCF---PYFGGVE----- -----------------HEGWTSSPREDILKRHIPTRKIMQA-DGSEVLVASV-------- ----YDLLLAQ-YGLDRGF--------GGEHVAGSFDDDVPGTPAWQERITGVPRAEVIEI -AREF------ARTADKTRGRSMIIVGAAMNHWYHND-MNYRGLINMLVMCGCIGQTGG-G ---WAHYVGQEKLRPQS---GWAPLAFGTDWVKPPRQMNGTSFFYFNSDQWRYEKLDVSEI -------ISPLADPKKYSGSLVDFNLRAVRMGWLPS-----APQLN-MNPLAFVRDAEAKG -LDPV-----KHAVDQF-----KS---------------GGLDFAYADPDAPE-NFPRNMF -IWRSNLFGS---SGKGHEYMLKHLLGTRHGLQG--KDLGQRGAVKPQDVKWRDEATEGKL -DLVVTLDFRMCTTALYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWDIFKGIARTVSALAPGVLGVE-KDLVLTPVLHDTPNELAMPF----GVTDWKKG -ECEAIPGKTMPSMTVVERDY--PNLYKKFTSLGPLLDKQGNGGKGMSWDTQDEVDFL--- ------TQLNHPVLAEGISKGRPQIESAIDACEVILHLAPETNGHVAVKAWESLGTF---- ------TGRDHTHLAVGKE----H-EAIRFR-DVQAQPRKIISSPIWSGLEDEHVSYNAGY -TNVHELIPWRTLT------GRQQFYMDHEWMLAFGEGFMGYRPPVNTKTIA--P--MLG- -------------------------AKPNGNKEIVLNW-------------------ITPH -QKWGIHSTYSDNLIMQTLSR---------------GGPIVWLSEDDAKRAGIEDNDWI-- ----------------ELFNVNGAIAARAVVSQRVMSGMAMMYHAQE-------------- ---RIINTP-GAEITGTRGGIHNSVT---RVVVKPTHMIGGYAQ---------FSYGFNYY -GTT-GTNRDEFVIVRKMD-------KVEWHDGEPVPNNVEVAR----------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_201_6 rank: A; thes:FHQ07_07000 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSY--------FLDRLNF--FKPAPE--PFA-DGHGAARREDR------SW-EDSYR -RRWQY------DKIVRSTHG-VNCTGSCSWKVYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRVKYPLIRAALLK---------LWREARKS--KSPVEA -WASIVSDPVKAKSYKQKRGMGGFVRSTWDEVNEIIAASNLYTVKEF----GPDRV-VGFS -PIPAMSMVS------YAAGARYLSL----------------------------------- ----LGGGCLSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSRYIIAWGSNVPQTRTPDAH -FFTEARYNGTKTVAITPDYSEVAKLTDHWLHPKQG-TDAALAFAFGHVILREFHV----D -QPSQYFTDYCRQYSDMPMLVRLER----RADGRLVPERYLR---------AADLGGL--G -ETNNPEWKTLAIDDNSGDITVPNGSVGFRW---------GEKGKWNIEEKD--------- --------SAGRETRLRLSLK------D--------HADGVESVSF---PYFGGIE----- -----------------NEYWTESKFSDVLERNVPVKRLNLA-DGKEWVVASV-------- ----YDLLLAQ-YGVDRGL--------GGGNVASSYDDNVPGTPAWQEKITGVPRAEVIQI -AREF------ARTADKTHGRSMVIVGAAMNHWFHND-MNYRGLINMLVMCGCVGQTGG-G ---WAHYVGQEKLRPQS---GWAPIAFGTDWSKPPRQMNGTSFFYFNSSQYRYEKLGVEEI -------LSPLADKSKYSGSLADYNLRAVRMGWLPS-----LPQLN-TNPMKLVREAEAAG -VAPV-----DYAVGKL-----KD---------------GSLDFAFADPDAPE-NYPRNLF -IWRSNLLGS---SGKGHEYMLKHLLGTRHGLQG--KDLGERGAAKPEEIKWRDEAPEGKL -DLLVTLDFRMCTTALYSDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWEIFKGIARTVSQLAPGVLGIE-KDLVLVPTLHDTPNEIAMPY----GVTDWKKG -ECDLIPGKTAPSMVVVERDY--PNLYKKFTSIGPLLDTQGNGGKGMNWDTTHEIEFL--- ------GKLNHEVLEAGVSHGRPQLETAIDCAEAIMHLAPETNGHVAVKAWASLETF---- ------TGREHQHLAVGKE----H-EAIRFR-DIQAQPRKIISSPIWSGLEDENVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHEWMRDFGEGFMQYRPPVDTKTIK--P--IIG- -------------------------KKPNGNREIVLNW-------------------ITPH -QKWGIHSTYSDNLIMQTLSR---------------GGPIVWLSEDDAKSAGIEDNDWI-- ----------------ELFNVNGAIAARAVVSQRMMNGIAMMYHAQE-------------- ---RILNTP-GSEITGTRGGIHNSVT---RVVVKPTHMIGGYAQ---------LAYGFNYY -GTV-GTNRDELVVVRKMN-------KVDW---LDGEPVPATKEAAR-------------- ----- ->NarG_Escherichia_coli_NP_415742 -----------------------------------------------SK------------ ---------------FLDRFRY--FKQKGE--TFA-DGHGQLLNTNR------DW-EDGYR -QRWQH------DKIVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRLKYPMMRKRLMK---------MWREAKALH-SDPVEA -WASIIEDADKAKSFKQARGRGGFVRSSWQEVNELIAASNVYTIKNY----GPDRV-AGFS -PIPAMSMVS------YASGARYLSL----------------------------------- ----IGGTCLSFYDWYCDLPPASPQTWGEQTDVPESADWYNSSYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAVTPDYAEIAKLCDLWLAPKQG-TDAAMALAMGHVMLREFHL----D -NPSQYFTDYVRRYTDMPMLVMLE-----ERDGYYAAGRMLR---------AADLVDA-LG -QENNPEWKTVAFN-TNGEMVAPNGSIGFRW---------GEKGKWNLEQRD--GKT---- --------GEETELQLSLLGS------Q----------DEIAEVGF---PYFGGDG----- -----------------TEHFNKVELENVLLHKLPVKRLQLA-DGSTALVTTVYDL----- -------TLAN-YGLERGL--------NDVNCATSYDDVKAYTPAWAEQITGVSRSQIIRI -AREF------ADNADKTHGRSMIIVGAGLNHWYHLD-MNYRGLINMLIFCGCVGQSGG-G ---WAHYVGQEKLRPQT---GWQPLAFALDWQRPARHMNSTSYFYNHSSQWRYETVTAEEL -------LSPMADKSRYTGHLIDFNVRAERMGWLPS-----APQLG-TNPLTIAGEAEKAG -MNPV-----DYTVKSL-----KE---------------GSIRFAAEQPENGK-NHPRNLF -IWRSNLLGS---SGKGHEFMLKYLLGT-EHGIQGKDLG-QQGGVKPEEVDWQDNGLEGKL -DLVVTLDFRLSSTCLYSDIILPTATW--YEKDDMNTSDMH-PFIHP----L-SAAVDPAW -EAKSDWEIYKAIAKKFSEVCVGHLGKE-TDIVTLPIQHDSAAELAQPL----DVKDWKKG -ECDLIPGKTAPHIMVVERDY--PATYERFTSIGPLMEKIGNGGKGIAWNTQSEMDLL--- -------RKLNYTKAEGPAKGQPMLNTAIDAAEMILTLAPETNGQVAVKAWAALSEF---- ------TGRDHTHLALNKE----D-EKIRFR-DIQAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHELIPWRTLS------GRQQLYQDHQWMRDFGESLLVYRPPIDTRS----VKEVIG- -------------------------QKSNGNQEKALNF-------------------LTPH -QKWGIHSTYSDNLLMLTLGR---------------GGPVVWLSEADAKDLGIADNDWI-- ----------------EVFNSNGALTARAVVSQRVPAGMTMMYHAQE-------------- ---RIVNLP-GSEITQQRGGIHNSVT---RITPKPTHMIGGYAH---------LAYGFNYY -GTV-GSNRDEFVVVRKMK-------NIDW---LDGE---------GNDQVQESVK----- ----- ->NarG_Halomonas_maura_gb_AAT47523 ------------------------------------------------------------- ----MSH--------FIDRLNF--FRKARE--PFA-NDHGEVRDESR------GW-EDGYR -QRWQH------DKVVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRLKHPLVRKPLLK---------LWREALEEK-GDPVDA -WASIVEDPAKTKQYKRARGMGGFVRADWNELNELIAASNVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNSGYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVSVTPDYAEVSKLTDEWLSAKQG-TDAALAMAMGHVILKEFHL----D -RPSAYFTDYVRRYTDMPCLVELEA----REDGSYVPGKQLR---------ASDFEAS-LG -QDNNPEWKTVAWDETRDQLVVPRGSIGFRW---------GEEGKWNLEPRD--------- --------AEGAEIKTRLSLA------E--------AHDDVARVAF---PYFGGIA----- -------------HEHFDHVKSGGASDELLFHSLPAKRLTLA-DGREILAVTVFDL----- -------MCAN-YGIDRGF-RSQEGKEGEDDGATAYDQVKPYTPAWQEKITGVPAEQCLRI -AREF------ADNADKTHGRSMIIVGAGMNHWYHMD-MNYRGLINMLVMCGCIGQSGG-G ---WSHYVGQEKLRPQT---GWLPLAFGLDWQRPPRHMNSTSFFYNHSSQWRYXKLEIKEI -------LSPLAKPADYSGSLIDFNVRSERMGWLPS-----APQLA-TNPLSLAGKAAEAG -QSTA-----DYVVDQL-----KA---------------GGLRFAAEDPDDPQ-NFPRNMF -IWRSNLLGS---SGKGHEYLLKYLLGT-RHGIQGKDLG-EDGGQKPEEVVWHEAAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-TAATDPAW -ESRSDWDIYKGIARAFSKACVGHLGEE-TDLVTLPLQHDSPAELAQPE-----VKDWKRG -ECEPIPGKTMPALVEVKRDY--PATYERFTSVGPLLDSLGNGGKGIGWKTEKEVELL--- -------GKLNYVKTEGPAKGRPRIESAIDAAEVILTLAPETNGQVSVKAWEALSKI---- ------TGRDHRHLAEPKE----E-EKIRFR-DVVAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHELIPWRTVS------GRQQFYQDHAWMRAFGESLLVYRPPIDTKAAV--SL----- ----------ADDKG-------------NGNPEIALNW-------------------ITPH -QKWGIHSTYSDNLLMQTLSR---------------GGPIVWLSKDDARSIGVEDNDWI-- ----------------ELYNANGAIAARAVVSQRVKNGMAMMYHAQE-------------- ---RILNMP-GSEVTGTRGGIHNSVT---RVCPKPTHMIGGYAQ---------LAYSFNYY -GTV-GSNRDEFVIVRKMK-------KIDW---LDGE---------GNDYEQEAVK----- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0001905_7 rank: C; this:HZT40_10960 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLTF--FKQRKT--PFA-QGHGAVTHEKR------DW-EDGYR -QRWQH------DKIVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASFSWYIYSANRLKYPLIRKPLME---------LWRSAKARH-TDPVVA -WESIVENPLSTNDYKTKRGLGGFIRSSWEEVNELIAAANVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGTCMSFYDWYCDLPPASPMIWGEQTDVPESADWYNSSYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAITPDYAEVAKHADQWLNPKQG-TDAALALAFGHVILKEFHL----D -KPSTYFTDYVRRYTDWPNLVLLEK----RDDGSYQAGRFAR---------ASDFVEG-LG -ESNNPDWKTVAIDEATGEIIAPNGSIGYRW---------GENSKWNIQQKHG-------- --------TDQQEVTLALSLI---------------------------------------- ------------------------------------------------------------- ----------------------------------------------------KQHDQIVEL -CLPY--------------------FGGVPSDYFKGN------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------VLKDVL----- ----------------------------RYQLPARQVTLAD-------------------- ------------------------------------------------------------- ----------------GTTGL---------------------------------------- --------------------------------LVTVYDLNMAN------------------ -----------------------Y------------------------------------- --------------------GISRGLGADDSAQDFNDA---------TAPYT--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------------PAWQEAI------------------------- ------------------------------------------------------------- ----- ->king_2019_sw_WHONDRS-S19S_0016_B_bin.5_k121_1281127_1 rank: A; gpb:HDN1F_13240 narG; Nitrate reductase, alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLQF--FNKVKS--TFA-DGHGAVVNEDR------GW-ENAYR -SRWQY------DNIVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCQRGASYSWYLYSANRLKYPMMRKPLLE---------LWRE--ARKSLSPVDA -WESIVENPVKSKAYKTKRGLGGFIRVDWEEANELVAAANIYTAKKY----GPDRI-NGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGTCLSFYDWYCDLPPSSPQTWGEQTDVPESADWYNSTFLMLWGSNVPQTRTPDAH -FYTEVRYKGAKSVVITPDYSEAAKFADLWLAPKQG-TDAALAMAFGHVVLKELHL----D -NPSEYFTEYCRKTTDMPHLVMLKT-----RGNAFVADRFLR---------ASDLSDN-LQ -QSNNPEWKTLVINENTNEMVVPNGSIGFRW---------GEDGKWNIQATDS-------- --------ADGSDIKARLSLI------E-----------NADQVVSVEFPYFGNLN----- -----------------HPHFTHTEHAEILERNVPARRIQLA-DGSDAYVVTVFDL----- -------LVAN-YGIDRGL--------GGENVAKSFDDDQPYTPAWQERITGVKREHVITV -ARQF------AENAHKTHGKSMVILGAGLNHWYHMD-MNYRGIINLLMMCGCIGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWHRPPRHMNGTSFFYNHTSQWRHEKLDVREI -------LSPLADKTAWSGSLLDYNVRAERMGWLPS-----APQLN-VNPLELTKAAAAAG -QSPV-----DYAVENL-----KS---------------GKLAFACEDPDNPV-NFPRNLF -VWRSNLLGS---SGKGHEYFLKYLLGTTHGVQG--KDLGEMGAPKPEEVVWHEQGAEGKL -DLLVTLDFRMSTTCMYSDVVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -ESRSDWDIYKGIARKFSELSVGHLGVE-KDLVLVPTLHDTPSELGQAV----GVKDWKKG -ECEPIPNKTLPNMVVVERDY--PNTYKKFTALGPLLDKLGNGGKGISWNTQSEVEQL--- ------RDLNYRVTEEGVSKGLPRIESDIDACEVVLMLAPETNGQVAMKAWAALSKI---- ------TGRDHTHLALPRE----D-DKIRYR-DVQAQPRKIISSPTWSGLESEHVSYNAGY -TNVHEMIPWRTLT------GRQQFYQDHLWMLGFGESLCVYKPPIDTKTIA--P--LLN- -------------------------QRSNGNGEVVLNF-------------------ITPH -QKWGIHSTYTDNLLMLTLSR---------------GGPCVWMSETDAKKVGIEDNDWI-- ----------------EAFNLNGALVARAVVSQRVPEGMVMMYHAQE-------------- ---KIVNVP-ASEITKTRGGIHNSVT---RTCPKPTHMIGAYAQ---------QSYGFNYY -GTV-GSNRDEFVIVRKLS-------KVDW---LDTPVAQA-------------------- ----- ->NarG_Pseudomonas_fluorescens_gb_AEV63780 ------------------------------------------------------------- ----MSH--------LLDQLRF--FNRKQG--EFS-DGHGETRKESR------DW-ENVYR -SRWQY------DKIVRSTHG-VNCTGSCSWKIYVKNGLITWETQQTDYPRTR-----NDL -PNHEPRGCPRGASYSWYIYSANRLKYPKIRKPLLK---------LWRE--ARQTLPPVEA -WASIVEDKAKADSYKSKRGMGGFIRSNWEEVNEIIAAANVYTVKEH----GPDRV-VGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPASPMVWGEQTDVPESADWYNSNYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAITPDYSEVAKLTDLWLNPKQG-TDAALAQAFNHVIFKEFHL----D -KPSAYFTEYAKRYTDLPVLVMLKPMLGAAPGAGYQPDRFLR---------ASDLTDN-LG -QDNNPEWKTIALD-AAGELVSPQGSIGYRW---------GEKGKWNILPREG-------- --------GEGREIDLKLSLI-------------------GGDVAEVAFPYFAGEA----- -----------------QEYFQHVAGDAVQFRRVPVHSVVLA-DGSVAKVATVFDL----- -------SAAN-LAIDRGL-------GGANVAKDYNDASVPGTPAWQEQITGVSREKAIQI -AREF------ADNADKTRGRSMIIVGAAMNHWYHMD-MNYRGLINMLMLCGCVGQTGG-G ---WAHYVGQEKLRPQC---GWLPLAFGLDWNRPPRQMNGTSFFYGHSSQWRHEKMSMHDV -------LSPLADKSQFPEHALDYNIRAERAGWLPS-----APQLN-TNPLHICRDAAAAG -MEPK-----DYVVKSL-----QD---------------GSLRFACEQPDSPV-NFPRNMF -IWRSNLLGS---SGKGHEYMLKYLLGTKNGVMN--EDIGHSTECKPTEAEWVDEGAIGKL -DLVTTLDFRMSSTCVYSDIVLPTATW--YEKDDMNTSDMH-PFIHP----L-SAAIDPAW -ESRSDWEIYKGIAKAFSAMSVGHLGVE-KDLVTVPLMHDSVGELAQPF----GGTDWKSA -GVAPVPGKNAPNLQVVERDY--PNIYKQFTSLGPMLEKLGNGGKGINWNTDTEVKFL--- ------GELNHKEVEAGISQGRPKIDSAIDAAEVILSLAPETNGHVAVKAWAALSEF---- ------TGIDHSHLAISKE----H-EAIRFR-DIQAQPRKIISSPTWSGLEDDHVSYNAGY -TNVHESIPWRTIT------GRQQFYQDHPWMQAFGEQLMSYRPPVNTRTIA----GVKG- -------------------------KRSNGETEIVLNW-------------------ITPH -QKWGIHSTYSDNLLMLTLSR---------------GGPIVWLSEIDAKRAGIEDNDWI-- ----------------ECFNVNGALTARAVVSQRVKEGMVMMYHAQE-------------- ---RIVNVP-GSETTKTRGGHHNSVT---RVVLKPTHMIGGYAQ---------QAYGFNYY -GTV-GCNRDEFVVVRKMV-------KVDW---LDGSSGDDLPRPLPTDIEEN-------- ----- ->NarG_Pseudomonas_stutzeri_gb_AAZ43099 ------------------------------------------------------------- ----MSH--------LLDQLRF--FNRKQG--EFA-DGHGETRIESR------DW-ENVYR -SRWQY------DKIVRSTHG-VNCTGSCSWKIYVKNGLITWETQQTDYPRTR-----NDL -PNHEPRGCPRGASYSWYIYSANRLKYPKVRKPLLK---------LWREARRN--MTPVDA -WASIVEDKAKAESYKSKRGMGGFIRSSWDEVNEIIAAANVYTVKQY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPASPQIWGEQTDVPESADWYNSNYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAITPDYAEVAKLTDLWLNPKQG-TDAALAQAFAHVIFKEFHL----E -KPSEYFRDYAKRYTDLPVLVRLN-----EKDGSYIADRFLR---------ASDLADN-LG -QENNPEWKTIAVDGSTGELVSPLGSIGYRW---------GEKGKWNIEARE--G------ --------KDGRDVDLSLTQI------E---------GGETAEVAF---PYFGGIL----- -----------------HEHFQHAEGESIQLRRVPVRTITLA-DGSTTKVATVFDL----- -------MAAN-LGIDRGL-------GGGNVASSYDDASVPGTPAWQEVITGVSREKAIQI -AREF------ADNADKTHGRSMIIVGAAMNHWYHMD-MNYRGLINMLMLCGCVGQTGG-G ---WAHYVGQEKLRPQC---GWLPLAFGLDWSRPPRQMNGTSFFYNHSSQWRHEKMSIHEV -------LSPLADKSQFPEHMLDYNIRAERAGWLPS-----APQLN-RNPLQICRDAEAAG -MSPV-----DYVTQSL-----KD---------------GSLKFACEQPDNPD-NFPRNMF -VWRSNLLGS---SGKGHEYMLKYLLGTKNGVMN-EDLGKRADGFKPTEAEWQDEGAIGKL -DLVTTLDFRMSSTCVYSDIVLPTATW--YEKDDMNTSDMH-PFIHP----L-SAAIDPAW -EAKSDWEIYKGIAKAFSKMAEGQLGVE-KDLVTVPLLHDSPGELAQPF----GGTDWKTA -GVDPQPGKNCPNMAVVERDY--PATYKKFTSLGPLLDKLGNGGKGINWNTQDEVDFL--- ------GELNYKVRDEGVSQGRPQIESAIDAAEVILSLAPETNGHVAVKAWAALSEF---- ------TGRDHSHLALPKE----H-EAIRFR-DIQAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHEYIPWRTIT------GRQQFFQDHPWMQAFGEQLMSYRPPINTR------------ -TIDYVK-------GKKSNGNP----------EIVLNW-------------------ITPH -QKWGIHSTYSDNLIMLTLSR---------------GGPIVWMSEVDAKKAGIEDNDWI-- ----------------ECFNANGALTARAVVSQRVMEGMVMMYHAQE-------------- ---RIVNVP-GAESTKTRGGHHNSVT---RVVLKPTHMIGGYAQ---------QAYGFNYY -GTV-GCNRDEFVVVRKMA-------KVDW---LDGPNGNDLPQPLPQDI----------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_1186915_16 rank: A; ocm:CBP12_03810 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------ETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYIYSANRVKYPKVRKALLK---------LWRE--ARKNLKPVEA -WASIVEDPVKAQSYKSKRGLGGFVRSSWDEVQELIAAANVYTTKTY----GPDRV-VGFS -PIPAMSMIS------YASGARYLSL----------------------------------- ----MGGACLSFYDWYCDLPPSSPMVWGEQTDVPESADWYNSNYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAITPDYSEVAKLTDLWLNPKQG-TDAALAQAFNHVIFKEFHL----E -KPSEYFTDYVRRTTDFPMLVLLD-----EHGEGYKTGRFLR---------ASDLTGQ-LG -QDNNPEWKTIALDELSGELVSPLGAIGYRW---------GEKGKWNIEAREG-------- --------SKGADTKLKLSLI------D------------EGQVAEVAFPYFGGDL----- -----------------HDHFQHVEGDNLQYRRIPVREVQLA-DGRSAKVATVFDI----- --------TAGGLAIDRGL-------GGKNVASSYDDASIPGTPAWQEQITGVTREKAIQI -AREF------ADNADKTKGRSMIIVGAAMNHWYHMD-MNYRGLINMLMMCGCVGQTGG-G ---WAHYVGQEKLRPQT---GWTPVAFGLDWHRPPRHMNGTSFFYNHSSQWRYEKMNMHDI -------LSPTANKAEFPEHALDYNIRAERAGWLPS-----APQLN-RNPLQICRDAKAAG -LSPK-----DYAVKAL-----QE---------------GSLRFSCEQPDNPV-NFPRNMF -VWRSNLLGS---SGKGHEYMLKHLLGAEKHGVI---GDETAAGFTPKDVDFSQEGARGKL -DLVTTLDFRMSSTCVYSDIVLPTATW--YEKDDMNTSDMH-PFIHP----L-SAAIDPAW -EARSDWEIFKGIAKKFSELSVGHLGVE-QDLVTIPMQHDSVGELAQPF----GGLDWKTT -GEPLVPGKNAPNMVVVERDY--PNTYKKFTSLGPLLNTQGNGGKGISWNTDDEVEFL--- ------GDLNHRVLDEGVSEGRPQMLSAIDAAECVLSLAPETNGHVAVKAWAALSEF---- ------TGRDHSHLAVGKE----H-ESIRFR-DIQAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHELIPWRTIT------GRQQFYQDHPWMQAFGEQLMSYRPPVSTRSIE----KVQG- -------------------------KMSNGNPEIALNW-------------------ITPH -QKWGIHSTYTDNLLMLTLSR---------------GGPIVWMSEVDAQKVGIEDNDWV-- ----------------ECFNANGALTARAVVSQRVKEGMIMMYHAQE-------------- ---RIVNVP-GAESTKTRGGHHNSVT---RVVLKPTHMIGGYAQ---------QAYGFNYY -GTV-GCNRDEFVVVRKMN-------KVDW--LEGSDTDDLPQPLPQNI------------ ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_2341297_11 rank: C; pbm:CL52_03700 narZ; nitrate reductase; K00370 (db=kegg) ------------------------------------------------------------- ----MSR--------LLDQLRF--FKRKQD--EFA-DGHGETRIENR------EW-ENGYR -ARWQY------DKIVRSTHG-VNCTGSCSWKIYVKNGLITWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYIYSANRLKYPKVRKPLLK---------LWRE------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0000931_1 rank: A; reu:Reut_B5002 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLRF--LSRTKE--TFS-DGHGAVVDEDR------SW-ENAYR -GRWQH------DKIVRSTHG-VNCTGSCSWKVYVKNGLITWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYVYSAQRVKYPLVRGRLME---------MWRE--ARQTMSPTDA -WESISQDPVKAKRYKSVRGQGGFVRASWDDVSEIIAAANAFTIKEF----GPDRV-LGFS -PIPAMSMVS------YAAGARYLSL----------------------------------- ----IGGACLSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSTYLMVWGSNVPQTRTPDAH -FYTEVRYKGTKTVAVSSDFGEMVKFGDIWLAPKQG-TDAALAMAMGHVILKEWHT----S -AQSDYFTRYVKQYTDLPMLVILK----LGKSGQLVPDYFLR---------ASHLSLA--E -QANNPEWKTLLIDCASGELIAPNGSIGFRW-----GESGDKVGRWNLELKDGGSARAIDP -CLS----LIDSHDDIVEVGF----------------------------DYYGGKD----- -------------------------ADDVLLRRVPAKRVKLA-DGSEALVTTVFDL----- -------TMAN-YGVDRGL--------GGGNVAMSYDDDVPYTPAWQERHTGVKRNLVIQV -AREF------AQNAHDTQGKSMVIVGAALNHWYHND-MIYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTPLAFAGDWVRPPRHMNGTSFFYNHTSQWRHEKLALDEI ------LAPTADAGPYSKLALLDLNAKAERLGWLPS-----APQLE-TNPLDIVDAADSKN -MDPV-----KYAVEEI-----KA---------------GRLNFSCDEPENPK-NFPRNLF -VWRSNILGS---SGKGHEYFLKYLLGTQNALFG------DERDGIKPGEVKAGEAVEGKL -DLLTVLDFRMSTTCLYGDIVLPSATW--YEKDDLNTSDMH-PFIHP----L-SEAVQPLW -QSKSDWEIYKTIAKKFSEIAGPYLGTR-KDLVLTPLLHDTPGELGQPF----EPKDWKHG -ECEPIPGKTMPQMTVVERNY--GDVYKKFTSIGPLLEKSGNGGKGIGWNTEHEVKEL--- ------AALNKLVTEPGVSQGRPKLETAIDAAEMILTLAPETNGHVAVKAWDALGKI---- ------TGRDHKHLAEGRD----H-DKIRFR-DVQAQPRKIISSPTWSGLESEEVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHRWMLDFGEGLCIYKPAINTRTIE--P--MLG- -------------------------KHANGNAELVLNW-------------------ITPH -QKWGIHSTYTDNLRMLTLSR---------------GGPHVWVSEIE-------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0004490_1 rank: C; cuh:BJN34_33750 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------K--------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------HAN------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------------GNEELVLN-------------- ------------------------------------------------------------- ---------------------------------------------------W--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------------------------------ITPH -QKWGIHSTYTDNLRMLTLSR---------------GGPHVWVSEIEAKQAGIRDNDWV-- ----------------EVFNVNGTLTARVVVSQRVPVGMCLMYHAQE-------------- ---KIVNVP-GAETSGMRGGIHNSVT---RTVTKPTHMIGGYAQ---------LAYGFNYY -GTV-GSNRDEYVIVRKMK-------KVDW---LEGALKEEGEQA---------------- ----- ->littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_6 rank: A; aql:BXU06_02425 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- -------------------------MAACR------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------DWYCDLPPASPQIWGEQTDVAESADWYNSNYLMVWGSNIPMTRTPDAH -FYTEVRYKGTKTVAVSSDFGEMAKFGDIWLAPKQG-TDAALAMAMGHVIFKEFHL----D -RPSDYFTGYIRQYTDMPMLVMLKQ----DAAGRYLPDYFLR---------ASHLAGN-AD -QAHNPEWKTLVLDETSGNLAVPNGSAGFRW---------DQSGKWNLEEKA--G------ --------INSQPVKAQLSLI------A--------QSDEVVEVGF---PYFGAEH----- --------------------------DELITRRVPVRHIVLA-DGSTARVATVFDL----- -------MAAN-YGIDRGL--------GGGNVACSYLDDVPYTPAWQHKHTGVKPEMVIQV -AREF------AQNADQTHGRSMVIVGAALNHWYHMD-MTYRGIINMLMLCGCIGQSGG-G ---WCHYVGQEKLRPQT---GWAPLAFAGDWNRPARQMNGTSFFYAHTSQWRHEKLGVNEI -------LSPTADGKMANMALIDYNAKAERMGWLPS-----APQLT-TNPLDVTRHAAAAG -QDPI-----TYAVEQL-----KS---------------GQLDMACNDPDNPK-NFPRNLF -VWRSNILGS---SGKGHEYFLKYLLGTQNAVMN-----SEEGCVKPSEITVRPAA-EGKL -DLLVVLDFRMSTTCLYGDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-SEAVQPLW -QAKSDWEIYKGFAKAISEVGGEYLGVQ-QDLVLTPLMHDTPEELGQPF----DPRDWKKG -ECEPIPGKTMPKMTVVERDY--RKIHDKFTSIGPLLEKVGNGGKGIGWQTGHEVDVL--- -------RGLNKTVASGVAAGQPRLDTAIDAAEMILTLAPETNGHVAVKAWAALSKI---- ------TGRDHTHLALPRE----H-DSIRFR-DVQAQPRKIISSPTWSGLESEEVSYNAGY -TNVHEYIPWRTLT------GRQQFYQDHLWMRAFGEGLCLYKPHVDLK--T--TAAILG- -------------------------KKPNGHHEIVLNW-------------------ITPH -QKWGIHSTYSDNLRMLTLSR---------------GGPHVWVSEIDAKKAGIVDNDWI-- ----------------EVFNVNGTLTARAVVSQRVPEGMSLMYHAQE-------------- ---KIINVP-GAETSGKRGGIHNSVT---RTVVKPTHMIGGYVQ---------LAWGFNYY -GTV-GSNRDEFVIVRKMK-------NVDW---LDQPLSEHA------------------- ----- ->littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_7 rank: C; aql:BXU06_02425 nitrate reductase subunit alpha; K00370 (db=kegg) -MEYARLVTHLAESENSRACFFLAPLLSNYPTLPPLPPPRSPSDQWAVCLRLLTIGGIGTG -LSGPANPLEARMSHFLDRLNF--LGKVKS--TFS-DGHGAVVKEDR------KW-EDGYR -QRWQH------DKIVRSTHG-VNCTGSCSWKVYVKNGLITWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYVYSAQRVKYPMVRGVLMQ---------HWRE--LRKKLGPIEA -WQRISQTPEIATQYKTQRGQGGFVRASWDEVNEIIAASNAFTIKNY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------I---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------G ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----GVPRLVL------------------------------------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.15_k121_1272084_2 rank: A; chrm:FYK34_01610 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLKF--MSKVKA--TFS-NGHGAVVKEDR------QW-EDAYR -QRWQH------DKIVRSTHG-VNCTGSCSWKVYVKNGLITWETQQTDYPRTR-----ADL -PNHEPRGCPRGASYSWYVYSAQRVKYPMVRGKLMQ---------MWREARKS--MGAIDA -WESISQNPEKAKEYKSRRGQGGFVRASWDEVNEMVAAANAYTIKNY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVPLSFYDWYCDLPPASPQIWGEQTDVAESADWYNSTYLMVWGSNVPMTRTPDAH -FYTEVRYKGTKTVAVSSDFGEMAKFGDIWLAPKQG-TDAALAMAMGHVIFKEFHL----D -KQSSYFTDYIRRLTDMPMLVRLK-----EEGGRYLPEYFLR---------ASHLEGG-LG -EDNNPDWKTLLIDENTGDIVAPNGSIGFRW-----GQPEGKTGKWNLEHRDGAT------ --------AREIQGQLTLLGQ------Q----------DEVVGVGF---PYFGAEH----- --------------------------DELLTRNVPAKRITLA-DGSTALVATVFDL----- --------MAANYGIDRGL--------GGGNVASSYMDDVPYTPAWQQKHTGVKPEMVIQV -AREF------AQNADQTQGKSMVIVGAALNHWYHMD-MTYRGIINMLMLCGCIGQSGG-G ---WAHYVGQEKLRPQS---GWAPLAFGADWNRPARQMNGTSFFYAHTSQWRHEKLGVNEI -------LCPTADGSMANMSLIDYNAKAERMGWLPS-----APQLS-TNPLDITRQAEAAG -QDPV-----AYTVQGL-----KD---------------GTLDMSCNDPDNPK-NFPRNLF -VWRSNILGS---SGKGHEYFLKYLLGTQNALMS-----DEANCITPTEITVRPAA-EGKL -DLLVVLDFRMSTTCLYGDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-SEAVQPLW -QSKTDWEIYKGFAKAISEVGGDYLGVQ-KDLVLTPLMHDTPQELGQAF----DPRDWKKG -ECEPIPGKTMPAMTVVERDY--KAIYQKFTSIGPLMEKAGNGGKGMAWKTGHEIEKL--- -------RAMNKVVQDGVAKGQPRLDTAIDAAEMILTLAPETNGHVAVKAWESLSKI---- ------TGRDHTHLAIPRE----H-DHITFR-DIQAQPRKIISSPIWSGLESEEVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHQWMRAFGEGLCLYKPPVDLKT----------- -TAAVHR------------------HKPNGNTEILLNF-------------------LTPH -QKWGIHSTYSDNLRMLTLSR---------------GGPHVWISEKDAQEAGIVDNDWI-- ----------------EVFNVNGTLTARAVVSQRIPKGMTLMYHAQE-------------- ---KIVNVP-GAEMSGKRGGIHNSVT---RAVTKPTHMIGGYAQ---------YSYGFNYY -GTV-GANRDEFVVVRKMK-------NVDW---MDQPK----------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_3271_6 rank: C; fpho:SHINM1_007130 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------T -ASHQAMMNSRS-----------------------------------------------NG -NPEIA------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------------LN------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------F------------------------------------- ------------------------------------------------------------- ---------------------------------------------------------ITPH -QKWGIHSTYTDNLIMLTLSR---------------GGPCVWVSEVDATKIGLVDNDWV-- ----------------EAFNANGALCARVIVSQRVPEGMMMMYHAQE-------------- ---KIVNVP-GSEIMNTRGGIHNSVT---RAVVKPTHMIGGYAQ---------LSYGFNYY -GTV-GSNRDEFVILRKMN-------KVDWMDDEASPAGENS------------------- ----- ->nebranchanacostia_2019_sw_WHONDRS-S19S_0081_B_bin.6_k121_1546998_5 rank: A; fpho:SHINM1_007130 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FIDRLKF--LSADKE--HFS-DGHGQTTTENR------AW-EDAYR -KRWQH------DKIVRSTHG-TNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDM -PNHEPRGCARGASYSWYLYSANRVKHPMVRSSLLK---------AWRK--HRQTLSPVAA -WEAVVSDPKTVRRYQSERGKGGFLRTSWDEVNDMVAAANIYTAKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQTWGEQTDVPESADWYNSTYIMMWGSNVPQTRTPDAH -FMAEVRYKGAKVVSVFPDYSEGAKFGDMWLHPKQG-TDAALAMAMGHVILKEFHV----A -GKSEYFDNYCRQYTDMPNLVCL-----VEKDGAYVPDRYVR---------AADLVGA-LG -EANNPDWKTLVIDEASDALTVPVGSIGFRWGQEKDGAPTADKGKWNLKEET--------- --------SDGRQIKPRLSLV------K--------HHDAVVEAAF---PYFGNIA----- -----------------HEHFNSTSHSDVLKRRVPVRKIQTA-QGE----MLVATV----- ----YDLYVAN-YGVDQGL--------GGDNVASSYDDDIPYTPAWQEKITGVPRDQVTQV -AREF------AQNAHDTHGKSMVIIGAAMNHWYHMD-MNYRSIMNMLIMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWNRPPRHMNSTSFFYAHTDQWRYETLRVADL -------LSPLADKGKFSGSLIDFNARSERMGWLPS-----APQLE-RNPLELSREAIAKG -LDPK-----EYVVNQL-----KS---------------GELKFSCEDPDNPK-NFPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTTNGVQG--KDLGHTGEVKPQDVVWHDEAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWEIYKGFAKRFSELS---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------DGYLGVEKDIVAVPIL--HDTAGE- ------------------------------------------------------------- -----IAQPYDTKDWKK-------------------GECEA-IPGKTMPNFVVVERNYSEI -H--------------EKFTSLGPLLDK--------------------------------- -------------------------------------------------------LGNGGK -GIN-------------------------W---NT-------------------------- ----- ->lecontecreek_2019_sw_WHONDRS-S19S_0018_A_bin.2_Ga0451754_0000231_3 rank: A; fpho:SHINM1_007130 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FIDRLKF--LSADKE--HFS-DGHGQTTTENR------SW-EDAYR -KRWQH------DKIVRSTHG-TNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDM -PNHEPRGCARGASYSWYLYSANRVKHPMVRSSLLK---------AWRK--QRQTLSPVAA -WEAVVSDPKTVRRYQSERGKGGFLRTSWDEVNDMVAAANIYTAKKH----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPASPQTWGEQTDVPESADWYNSSYIMMWGSNVPQTRTPDAH -FMAEVRYKGAKVVSVFPDYSEGAKFGDMWLHPKQG-TDAALAMAMGHVILKEFHV----A -GKSEYFDNYCRQYTDMPNLVCM-----VEKDGAYVPDRYVR---------AADLIGA-LG -EANNPDWKTLVIDEESDALTVPVGSIGFRWGQDKDGAPTADKGKWNLKEET--------- --------TDGRKIKPRLSLV------Q--------KHDAVVEAAF---PYFGNIE----- -----------------HEHFNNTSHSDVLKRRVPVRKIQTA-QGE----MLVATV----- ----YDLYVAN-YGVDQGL--------GGDNVAGSFDDDVPYTPAWQEKITGVPRDQVTQV -AREF------AQNAHDTHGKSMVIIGAAMNHWYHMD-MNYRSIMNMLIMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWSRPPRHMNGTSFFYAHTDQWRYETLRVADL -------LSPLADKNKFSGSLIDFNARSERMGWLPS-----APQLE-RNPLDLTREAIAKG -VDPK-----EYVVNQL-----KS---------------GELKFSCDDPDNPK-NFPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTTNGVQG--KDLGQTGDVKPQEVVWRDEAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWEIYKGFAKRYSELSDGYLGVE-KDLVAVPILHDTAGEMAQPY----DAKDWKKG -ECEAIPGKTMPNFVVVERNY--SEIYEKFTSLGPLLDKLGNGGKGINWNTDHEIKLL--- ------GELNYKVRNEGVAHGRPNIDTDIDATEVVLTLAPETNGEVAVKAWAALSEF---- ------TGIDHRHLALTRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESEHVSYNAGY -TNVHELIPWRTLT------GRQQLYQDHEWMRAFGEGFCSYKPPVDLRSHQ--Q--VMN- -------------------------AKPNGNKEIALNF-------------------ITPH -QKWGIHSTYTDNLIMLTLSR---------------GGPIVWLSEVDAQKVGIEDNDWI-- ----------------EAFNSNGALCARAVVSQRVPEGMVMMYHAQE-------------- ---KIVNVP-GSEITQTRGGIHNSVT---RAVLKPTHMIGGYAQ---------LSYGFNYY -GTV-GSNRDEFVVVRKMN-------KVDW---MDGPAQPAMEA----------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_493_9 rank: A; fpho:SHINM1_007130 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FIDRLKF----FVTPTEGFA-DKHGATVDEDR------TW-EDGYR -KRWQH------DKIVRSTHG-TNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDM -PNHEPRGCQRGASYSWYLYSANRVKYPMVRSPLLK---------LWRE--KRKMLAPVDA -WKAITDDHNAVRSYQSQRGLGGFLRTTWDEVNEMIAAANVHTIKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCTSFYDWYCDLPPSSPQMWGEQTDVPESADWYNSTYIMMWGSNVPQTRTPDAH -FMTEVRYRGTKVVSVFPDYAEGSKFGDLWLHPKQG-TDAALALAMGHVIVNEFHV----K -NKSDYFDQYCRQYTDMPNLVKL-----VKQGDYYVPDRLVR---------CSDFTDN-LG -QDNNPDWKTVVIDENTNMLTVPVGSIGFRW----GQKEGEDLGKWNLQEKN--------- --------AAGADIRPRLSLI-----------------GGHDGVVLVASPYFGNQQ----- -----------------HDHFQHTDHANILPHNIAVRKLQSR-DGE----ILVASV----- ----YDLFVAN-YGVDQGL--------GGPNVASSYDDDIPYTPAWQEKITGVKRHLVIQV -AREF------ADNADKTHGKSMVIVGASLNHWYHMD-MNYRSVINMLVMCGCIGQSGG-G ---WAHYVGQEKLRPQI---GWAALAFATDWHRPPRQMNGTSFFYAHTDQWRYETLSVKKI -------LSPLADPKKFSGSLIDFNVRSERMGWLPS-----APQLQ-TNPLQVCRDAQKAG -MSAK-----EYAVAQL-----KS---------------GKLRFSCEDTDHPD-NYPRNMF -IWRSNLLGS---SGKGHEYFLKHLLGTTHGVQG--KDLGQSGGQKPEEVVWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----F-SAAVDPAW -MARSDWEIYKGIAKKFSELTEGHLGVE-QDLVTVPIMHDTPDELGQAF----EPKDWKRG -ECEAVPGKTMPNFVLVERDY--PNTYKKFTALGPLMDKLGNGGKGINWNTQHEVKHL--- ------GELNYLVSEEGVTKGRPKIETDIDATEVILMLAPETNGEVAVKAWDALSKF---- ------TGIDHTHLAKTRE----D-EKIRYR-DIQAQPRKIISAPTWSGIESEHVSYNAGY -TNVHELIPWRTIT------GRQQLYQDHHWMRAFGEALCVYKPPIDTASHQ----AMMN- -------------------------SRSNGNPEIALNF-------------------ITPH -QKWGIHS----------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->logan1_2019_sw_WHONDRS-S19S_0097_B_bin.20_k121_1372227_2 rank: A; aep:AMC99_00129 Respiratory nitrate reductase alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------F-GNLEH -DHFQG----------------------------------------TDHPSVLK----RRV -PVREVQL-KDGKAFVATVFDLFCANYGL-------------------------------- -----------------DRGLGG-----------------EHVARDY-------------- ------------------------------------------------------------- ----------------GAMEPYTPAWA---------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------E--------------------------------- ------------------------------------------------------------- ------------------------------------------------KITGVPADQIITI -AREF------ASNAEVTKGKSMVILGAGLNHWYHMD-MNYRGIINLLVMCGCVGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWNRPPRHMNSTSFFYAHTDQWRYETLGVEEI -------LSPTAPEGDWDASLIDYNARAERMGWLPS-----APQLK-TNPLEVGKAIKASG -KDAK-----DYVAEAL-----QS---------------GALEMSCFDPDDPA-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTAHGVQG--KDLGETGAQKPKEVKWHEEAPKGKL -DLLVTLDFRMSTTCVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-SAAVDPVW -ESRSDWDIYKGIAKKFSEIAPEVLGVE-HDVVLTPIQHDSPNEIAQAY----DVADWGHG -QVEAIPGKTMANVALVERNY--AELYQKFTALGPLMEKLGNGGKGIGWNTDHEVEGL--- ------RKLNGTVAADGPAKGMAQIETAIDAAEVILMLAPETNGEVAVKAWADLGKK---- ------TGLDHTHLALPKE----D-EKIRFR-DIQAQPRKIISSPTWSGIESEHVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHKWMRAFGEGLCVYRPPIDTKAVK--PML---- -------------------------DEAKDAPHVILNF-------------------ITPH -QKWGIHSTYTDNLLMLTLSR---------------GGPIVWMSEVDAAKAGLVDNDWV-- ----------------ETFNSNGALVARVVVSQRMKEGTLFMYHAQE-------------- ---KITNVP-GSPLTGQRGGIHNSVT---RAVLKPTHMIGGYVQ---------LAYGFNYY -GTV-GSNRDEYVIVRKLS-------KVDW---LEGALS-------EGETAA--------- ----- ->lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.6_k121_1211148_1 rank: A; emv:HQR01_12825 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLTF--FRHKKE--QFS-DGHGVTTAEAR------DW-EDSYR -KRWQH------DKIVRSTHG-VNCTGSCSWKIYVKGGIITWETQQTDYPRTR-----PEL -PNHEPRGCPRGASYSWYIYSAQRLKYPLIRKRLIK---------LWRA--ARKDLPPVAA -WASIQADPVKRKSYTAIRGHGGFVRSTWDEVNEIIAAANAYTAKKW----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNSGFLMLWGSNVPQTRTPDAH -FMTEARYRGAKVAVVSPDYAEATKFADLWLNPKQG-TDAALAMAMGHVILREFHL----D -RQVPYFEDYCRRYSDMPMLVRL-----IEQDGRLVPERLLR---------ASDFKGD-LG -EKNHPEWKSVAIDEARDEVVAPTGSAGFRW---------GDKGKWNLEEKD--------- --------GKGAEVKLRMTAI---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------LDKDH---------------------------------------- ------------------------------------------------------------- -----------------------------------DEVVEVA------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_F_bin.6_scaffold_35_30 rank: A; aep:AMC99_00129 Respiratory nitrate reductase alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLTF--FRQKKE--PFS-EGHGVTTAEAR------DW-EDGYR -QRWQH------DKVVRSTHG-VNCTGSCSWKIYVKGGIITWETQQTDYPRTR-----PEL -PNHEPRGCPRGASYSWYIYSAQRLKYPLIRKRLVK---------LWRA--ARKDLPPVAA -WASIQADPVKRKSYTAIRGHGGFVRSTWDEVNEIIAAANAYTAKNY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNSGFLMLWGSNVPQTRTPDAH -FMTEARYRGAKVAVVSPDYAEATKFADLWLNPKQG-TDAALALAMGHVILREFHL----D -RQVPYFEDYCRKYSDMPMLVRL-----VEQDGRLVPERLLR---------ASDFAGG-LG -ETNNPEWKCVAIDETSDEVVAPSGSVGFRW---------GEQGKWNLKEED--------- --------GRGEAVKLRMTAILDKDHDE---------------VVEVAFPYFGNRE----- -----------------HDHFQGTDHPDVLMKRVPVREMQLA-EGRAYVATV--------- ----FDLLCAN-YGLDRGL--------GGQHVARDYADGAPYTPAWAEKITGIPADAIVTT -AREF------AANAEATNGKSMVILGAGVNHWYHMD-MTYRGIINLLVMCGCVGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWNRPPRQMNSTSFFYAHTDQWRYETLGVGEI -------LSPTAPKGDWDASLIDYNVRAERMGWLPS-----APQLK-TNPLEVGRAARASG -LEPK-----DYIAQAL-----KG---------------GDLELSCMDPDDPA-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTAHGVQG--KDLGEMGGQKPREVKWHEEAPQGKL -DLLVTLDFRMSTTCVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-SAAVDPVW -ESKSDWEIYKGIAKTFSEVAPEVLGVE-QDLVLTPIQHDTANEIAQPF----DVADWGHG -EIEAIPGRTMATVALVERDY--PNLYNRFTALGPLMDKLGNGGKGIGWNTAAEVENL--- ------RRLNGVQDAGSPAAGMAKIETAIDAAEVLLMLAPETNGEVAVKAWDALSQF---- ------TGINHRHLALPKE----E-EKIRFR-DIQAQPRKIISSPTWSGLESEHVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHKWMRAFGEALCVYRPPIDTKAVK--PML---- -------------------------DQAEGRPHVVLNF-------------------ITPH -QKWGIHSTYTDNQLMLTLSR---------------GGPIVWMSEVDAAKAGLVDNDWV-- ----------------ETFNTNGALVARVVVSQRMKEGTLFMYHAQE-------------- ---KIVNVP-GSPLTGQRGGIHNSVT---RAILKPTHMIGGYVQ---------QAYGFNYY -GTV-GSNRDEYVIVRKLE-------KVDW------LEGALPEG--ENAA----------- ----- ->lewisrun_2019_sw_WHONDRS-S19S_0014_F_bin.22_scaffold_791_5 rank: A; aep:AMC99_00129 Respiratory nitrate reductase alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLTF--FRQKSE--TFS-DGHGLTTGEDR------HW-EDGYR -KRWQH------DKIVRSTHG-VNCTGSCSWKIYVKGGIITWETQQTDYPRTR-----PEL -PNHEPRGCPRGASYSWYIYSAQRLKYPLIRKRLVK---------LWREARRT--LPPVAA -WASIQADPVKRKSYTAIRGHGGFVRSTWDEVNEIIAAANAYTAKTY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNAGFLMMWGSNVPQTRTPDAH -FMTEARYRGTKVAVVSPDYAEATKFADLWLNPKQG-TDAALALAMGHVILREFHL----D -RQVPYFEDYCRRYSDMPMLVRL-----VEQDGRLVPERLLR---------ASDVKGG-LG -EGNNPEWKCVAIDEASDELVVPSGSAGFRW---------GEKGKWNLEEKD--------- --------GQGREVKLRMTAILDKDHDE---------------VVEVAFPYFGNRE----- -----------------HDHFEGTDHPDVLMKRVPVRQLDLT-EGR----AYVATV----- ----FDLLCAN-YGLDRGL--------GGEHVARDYAAMSPYTPAWGEKITGVPADAIITA -AREF------AANAEATNGKSMVILGAGLNHWYHMD-MNYRGIINLLVMCGCIGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWNRPPRQMNSTSFFYAHTDQWRYETLGVSEI -------LSPTAPKGDWDASLIDYNVRAERMGWLPS-----APQLK-TNPLEVGRAAKASG -MEPK-----DYVAQAL-----KG---------------GDLELSCLDPDDPA-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTAHGVQG--KDLGEMGGQKPQEVKWHDEAPQGKL -DLLVTLDFRMSTTCVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-SAAVDPVW -ESRSDWEIYKGIAKTFSEVAPEVLGVE-QDLVLTPIQHDTANEIAQPF----DVADWGKG -EVEPIPGKTMATVAVVERDY--PNLYKRFTALGPLMDKLGNGGKGIGWNTVTEVDNL--- ------RKLNGTVGDDGPTKGMARIDTAIDAAEVLLMLAPETNGEVAVKAWDALSQF---- ------TGRDHKHLALPKE----E-EKIRFR-DIQAQPRKIISSPTWSGLESEHVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHKWMRAFGEALCVYRPPIDTKAVK--PML---- -------------------------DQAEGRPHVVLNF-------------------ITPH -QKWGIHSTYTDNLLMLTLSR---------------GGPIVWMSEVDAAKAGLVDNDWV-- ----------------ETFNSNGALVARVVVSQRMKEGTLFMYHAQE-------------- ---KIVNVP-GSPLTGQRGGIHNSVT---RAILKPTHMIGGYVQ---------QAYGFNYY -GTV-GSNRDEYVIVRKLE-------KVDW---LEGALS-------EGENAA--------- ----- ->NASQAN2015_010_A_bin.16_Ga0466474_000034_25 rank: A; oca:OCAR_5043 nitrate reductase, alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLLF--FKKKVD--TFS-GTHGVVTNEDR------SW-ESSYR -SRWQH------DKIVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRLKFPMIRGRLVR---------LWRE--ARLSLDPVDA -WASIVEDPLKSAEYKSKRGLGGLVRANWDEVNEIIAAANIYTAKTF----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVSMSFYDWYCDLPPASPQTWGEQTDVPESADWYNAGFLMLWGSNVPQTRTPDAH -FMTEARYKGAKVVVVSPDYSEASKFADLWLHPKQG-TDAALAMAIGHVILKEFHV----E -GQSPYFNGYVRENTDLPFLVMLK-----EQDGYYVQDRFLR---------ASDFSGS-LG -QDNNPDWKTVAYDELNGQIVPPCGSIGFRW---------GESGQWNIEQKT--------- --------SDNQAVKLRLSLI------D-----------IKDEVASVGFPYFGGSE----- -----------------HPHFTHSAHDAIQKRNVPVKKIILA-DGTEVLATTVFDL----- -------LVAN-YGIDRGL--------GGGNVAASYDEDVPYTPAWQEKITGVSRSNVIAV -AREF------AINAEKTKGRSMVILGAGINHWYHMD-MNYRGIMNMLMLCGCVGQSGG-G ---WAHYVGQEKLRPQT---GWLPLAFGLDWKRPPRQMNSTSFFYNHTSQWRYETLKVSEI -------LSPTAKPEDWQGSLIDFNVKSERMGWLPS-----APQLQ-TNPLQVVRDAKAAG -IAPA-----DYVVAGL-----KN---------------GSLKMSCEDPDNPL-NFPRNMF -VWRSNLLGS---SGKGHEYFLKYLLGTQHGIQG---KDLGDDGDKPSEVVWHEKAAEGKL -DLLVTLDFRMSTTCLYSDIILPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -ESRSDWDIYKGIAKKFSELTIGHLGLE-QDIVTVPVLHDTPGELAQPF----EVKDWKKG -ECEPVPGKTMPSLVVVERDY--PNTYKMFTSLGPLLSKIGNGGKGIAWNTETEVKQL--- ------GELNYLVTEEGISKGLPRIASDIDATEVILMLAPETNGHVAVKAWEALSKI---- ------TGRDHTHLAKPRE----D-DKIRFR-DVQAQPRKIISSPTWSGLESEQVCYNACY -TNVHERIPWRTLT------GRQQFYQDHSWMRAFGETLCVYKPPVDTRSIT--P--ILG- -------------------------QKPNGNDELVLNF-------------------LTPH -QKWGIHSTYTDNLLMLTLSR---------------GGPIVWMGEIDAAKVGIKDNDWI-- ----------------EAFNVNGALVARAVVSQRVPEGMCMMYHAQE-------------- ---KIVNMP-GAETTGGRGGIHNSVT---RATLKPTHMIGGYAQ---------LSYGFNYY -GTV-GSNRDEFVIIRKMS-------KVDW---LEEPKPEQA------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0000093_1 rank: A; tun:J9260_09180 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- --------------NMLAMCG---CVGQSG------------------------------- -----------------------------------------------------------GG -WAHYV---------------------------------------------GQEKL----- ------------------------------------------------------------- --------------------------------------------------------RPQTG -WL------------------PLAFALDWSRPPRQM-NSTSFFY----------------- ------------------------------------------------------------- ------------------------------------------------------------- --------SHSNQWRYEKLEL---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------KEILSPL -ANPA------------------RHSGSLIDYNVRSE------------------------ ------------------------------------------------------------- -----------------------------RMGWLPS-----APQLN-TNPLRIAKAAQAAG -MSPA-----EYTVAAL-----KA---------------GKIAFAAEDPDNPQ-NFPRNLF -VWRSNLLGS---SGKGHEYMLKYLLGTQHGVQS--KDLGVMGGAKPEEVKWHDTAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-TAAVDPAW -EARSDWEIYKGIAKAFSKVCEGHLGVE-TDLVTLPLLHDAPAELGQAM----GVKDWKKG -ECELIPGKTAPALVAVERHY--PDTYARFTAIGPLLEKLGNGGKGISWNTETEVAFL--- -------GQLNHQQTTGINEGRPCLNSAIDAAEMILSLAPETNGQVAVKAWQALSKI---- ------TGIDHSHLAIHKE----D-EKIRFR-DVVAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHELIPWRTLT------GRQQFYLDHDWMRDFGESMLVYRPPINTKTIK--P--LLN- -------------------------QRSNGNPELALNW-------------------ITPH -QKWGIHSTYTDNLIMLTLSR---------------GGPIVWMSETDAKTLGIQDNDWI-- ----------------DLFNANGAIAARAVVSQRVMPGMVMMYHAQE-------------- ---KIVNVP-GSVITGHRGGIHNSVT---RVCPKPTHMIGGYAQ---------QAYGFNYY -GTV-GSNRDEFVIVRKMT-------QVEW---LDNE---------GNDYAQEAVQ----- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_1345490_1 rank: C; ops:A8A54_10745 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLN---FLARKNADTFS-DGHGVTTTENR------DW-EDAYR -KRWQH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYMYSANRVKHPLIRSRLLK---------LWRK------------ ------------------------------------------------------------- --------------------ERTIK------------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------------TPIGAWAAIQEN--------- --------PEKRADYMKMRGL---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------G ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_924190_1 rank: A; ops:A8A54_10745 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------FLARKNAGTFS-DGHGVTTTESR------DW-EDAYR -KRWQH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYMYSANRVKHPLVRSRLLK---------LWRK--ERTIKTPIGA -WAAIQENPEKRADYMKMRGLGGFVRATWEEVNEIIAAANAYTVKTY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGVCLSFYDWYCDLPPASPMTWGEQTDVPESADWYNAGFLILWGSNVPQTRTPDAH -FYTEVRYKGAKSVVVSPDYSEAAKFSDLWLHPKQG-TDAALAMAMGHVILREFHL----D -RQADYFEDYCRRYTDMPMLVKLTG----KDGHFIPD-RFVR---------ASDFTGA-LD -ETNNPEWKTVAVDAKTKQFVSPGGSIGYRW---------GEQGKWNLEAKDGKGADVDLA -MSFI---LDGEHDTIANVGF----------------------------PYFGNRE----- -----------------HDYFEGTDHDSVLVRKVPARKVKLA-DGEALVATV--------- ----FDLFVAN-YGLDRGL--------NDPNSAKSYQENLPYTPAWAEKITGVPRDQIIAV -AREF------ASNAEKTNGRSMVILGAGLNHWYHMD-MNYRGIINMLVMCGCVGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWNRPPRHMNGTSFFYAHTDQWRYETLKVDEI -------LSPTAPEGPWDASLIDYNIRAERMGWLPS-----APQLK-TNPLEVSKQAAAAG -KEAK-----DFVAEQL-----KA---------------GALSMSCEDPDDKA-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTKHGVLG--KDLGEEGRQISKEAVWHDEAPEGKL -DLLVTLDFRMSTTCVYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SSAADPAW -DARSDWEIFKGIARKFSEVAPEVLGVE-KDVVLVPTLHDTAGELAQPI----DVKDWKKG -EIEPIPGRTMPTVAVVERDY--PNLYKKFTSVGTLLDTVGNGGKGIAWNTEHEVDLL--- ------ARLNGVVQEEGVTRGRPRIESDIDATEVILSLAPETNGEVAVKAWEALSKF---- ------TGRDHTHLAIPKE----D-EKIRFR-DVVAQPRKIISSPTWSGLESEKVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHLWMRAFGEGFCVYRPPIDTKT----------- -VNPAIR------------------SKADGKPHLVLNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGPVVWISEPDAKRAGIVDNDWV-- ----------------EVYNTNGAIVARAVVSQRMKDGTVFMYHAQE-------------- ---KIVNTP-GSPITGQRGGIHNSVT---RVITKPTHMIGGYAH---------QSYGFNYY -GTV-GANRDEFVVVRKLE-------TVDW---LEGPHTESVAY--NKEAAE--------- ----- ->lecontecreek_2019_sw_WHONDRS-S19S_0018_F_bin.2_scaffold_1_206 rank: A; bprc:D521_0425 Respiratory nitrate reductase, alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLKF--LSADKE--EFS-DGHGVTVGEDR------TW-EDAYR -SRWQH------DKIVRSTHG-TNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYMYSANRVKYPMIRGRLLK---------QWREAKSVA-KSPVDA -WANLVENTAKRKEWMELRGKGGFVRSSWDEVNEIIAAANVYTIKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADIWMHPKQG-TDAAIAMAMGHVILKEFYF----N -KRTEYFDDYVRRYTDMPNLVMLEEKVLDDGRKVLVPGRYAR---------SSDFDGK-LG -QTNGADWKTVAFD-TAGKPVVPNGSIGFRW----GPEGRKDQGKWNLESKE--A------ --------NYGNDVKLKLSLMEDQSIHD------------VVPVGF---PYFGGID----- -----------------TPYFDANKQSDVLVQNIPAKKIILT-ENGVEKEVFVATV----- ----FDLLAGN-YGIDRGL---------GGECAKSYDDNVPYTPAWQESITGVKREQVIAV -ARQF------AENAEKTKGKSMVIIGAAMNHWYHCD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTPLAFALDWIRPPRQQNSTSFFYAHTDQWRYEKLGMEEV -------LSPLANKEEYTGSMIDFNVRAERMGWLPS-----APQLK-TNPLEVVKEALAAG -KDPK-----KYVVDGL-----KS---------------GTLQMSCEDPDHPS-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGADEARPSEVEWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -EARSDWDIYKGFAKKFSEVCVGHLGVE-KEIVMTPLMHDTPAELAQAF----DVQEWKKG -ECDLIPGKTAPQIAVVERDY--PNTYNRFTALGPLMDKVGNGGKGIAWDTKVEVEQL--- -------RELNGRVEHGEMKGMAKISTDIDAAEVVLMLAPETNGHVAVKAWDALSKI---- ------TGLEHAHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNACY -TNVHEYIPWRTLT------GRQQFYQDHKWMRAFGEGFVSYRPPVDLKTII--------- -----------EVKGIKPNGNK----------EIVLNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGPVVWLSEDDAVKAGIVDNDWV-- ----------------ELYNANGAIAARAVVSQRVNPGMVMMYHAQE-------------- ---KIINTP-GSEITGMRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVTVRKMR-------NIDW---LDTENANSVQA----------------- ----- ->whiteclaycreek2_2019_sw_WHONDRS-S19S_0038_B_bin.50_k121_1710496_1 rank: A; pde:Pden_4236 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLNF--LKSTRK-DTFA-DGHGQTTIENR------DW-EDTYR -SRWRH------DKIVRSTHG-VNCTGSCSWKIYVKNGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYLYSANRVKTPLVRGRLMR---------RWRDLRRT--LGPIEA -WTAIQSDPAARADYVKARGRGGFVRASWDEVTEIVAAANAYTAKTW----GPDRV-FGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNAGFLILWGSNVPQTRTPDAH -FYTEARYRGTKSAVVSPDYSEAAKFGDIWLNAKQG-TDAALAIAMGHVILREFHL----D -RQVDYFEDYTRRYSDFPMLVKLEP-----KGDRFVPGRMLR---------AADIDGA-LG -ETNNPDWKTVAIDDASGRLVAPNGSIGHRW---------GEQGTWNLEEKA--------- ---------GAESVRLRTTLI------------LDGQNDGTAGVDF---PYFGGSA----- -----------------TNGWQACDTPDVLTRAIPVRKVALK-DGE----AMVATV----- ----FDLLCAN-YGLDRGL--------GGDWVARDYGSDMPGTPAWAERITGVPADRIIQV -AREF------AANAEKTGGKSMIIIGAAMNHWYHMD-MNYRGVINMLVMCGCVGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWGRPPRHMNSTSAWYAHTDQWRYETVRSDEI ------LSPTAPAGDWSSLSLIDYNIRAERMGWLPS-----APQLR-TNPLQVAAAAKAEG -TEVR-----DYVAREL-----KA---------------GRLEMSCEDPDAPE-NWPRNLF -VWRSNLLGS---SGKGHEYFLKHLLGTDHGVLG--KDLGEEGRRKPVEARWHDKAPEGKL -DLLTCIDFRMSTTAVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-QAAVDPAY -ESKTDWEIFKAIAAKLSEIVPGYLGVE-TDVVQLPLQHDSPGEVAQPR-----VADWKQG -QCDLIPGKTAPAFIAVERDY--PNLYRRFTALGPLMEKAGNGGKGIAWDTKHEVAHL--- ------RALNGTVTDEGPTKGMARIDTAIDAAEVILMLAPETNGEVAVKAWEALSKA---- ------TGREHKHLALPKE----D-EKNRFR-DIAAQPRKIISSPTWSGIESESVCYNAGW -TNVHELIPWRTLT------GRQQLYQDHEWMLAFGEFFLAWRPPVDLKTIT--APATGA- -----------------LGANE---------KHVVLNF-------------------ITPH -QKWGIHSTYSDNLLMLTL------------------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.46_k121_495423_17 rank: A; acis:CBP35_16735 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLSY--FSQPRE--TFS-QGHGQTNGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLK---------HWRA-ALLLAKSPVDA -WANIVENESAKREWQKQRGLGGFVRSTWDEVNQMIAAANVYTIKKH----GPDRI-IGFS -PIPAMSMIS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSSFIIAWGSNVPQTRTPDAH -FLTEVRYKGTKVVSITPDYSEVAKLGDLWMHPKQG-TDAAVAMAMGHVILKEFYFKDGGK -GRSTYFDDYARRYTDLPLLVVLKEKTLPDGRTVMVPDRYVR---------ASDFPGQ-LD -QSNNPDWKTVGYD-ELGQVTLPNGSIGFRW----GADGRADEGLWNLENKE--A------ --------RTGNTVKLKLSVI------E--------DGEQAYDVADVAFPYFGGVQ----- ----------------TPNFTANEQGGDVMVRRVPVSHLELA-GHEAQGRVMVATV----- ----FDLLAGN-YGIDRGL--------PGEEPGGSYDADRPYTPAWQESITGVPREQIIAV -ARQF------ADNADKTHGKSMVIIGAAMNHWYHCD-MNYRGIMNMLMLCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWIRPPRQMNSTSFFYAHTDQWRYEKLGMEEI -------LSPLADKKSYSGSMIDYNVRAERMGWLPS-----APQLK-TSPLQVAKDAAAKG -MDAK-----DYVVQSL-----KD---------------GSLQMSCEDPDHPD-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTTHGVQG---KDLGRDEAKPEEVQWHANAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QAKSDWEIYKGFAKAVSEVSVGHLGVE-KDVVLTPIMHDTAGEMAQPY----GVRDWKKG -DCELIPGKTAPQVTVVERDY--PNLYKRFTALGPLMDKAGNGGKGIGWNTQTEVGQL--- ------GDLNGRVKEEGVTQGMPRIVSDIDATEVVLMLAPETNGHVACKAWEALGKQ---- ------TGRDHVHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYQDHPWMRDFGEGFVSYRPPVHLKALH----EVEG- -------------------------KKPNGNREIALNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGSVVWLSEDDAASAGIVDNDWV-- ----------------ELFNANGAIAARAVVSQRVNPGMVMMYHSQE-------------- ---KIINTP-GSEITGTRGGIHNSVT---RIVLKPTHMIGGYAQ---------YSYGFNYY -GTI-GTNRDEFVLVRKMD-------RVDWLDDEVSDTGAHA------------------- ----- ->lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.30_k121_510322_1 rank: A; hyb:Q5W_04195 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------QG------------------------------------------- ------------------------------------------------------------- -------------------------------------TDAALAMAMGHVVLKEFYFPAN-G -QRSSYFDDYARRYTDLPMLVMLKEQTLPDGSTTLVPDRYLR---------ASDFNGK-LG -QANNPDWKTVAFD-TTGKAVLPNGSIGFRW----GDQGREDAGKWNLESKE--A------ --------RDNGDVKLKLSVL------E-----DGAQDHQVVDVGF---PYFGGQQ----- ----------------TPNFPANAAVGDVNQAKVPAVRLRLG-KAGEERYALVATV----- ----FDLQVAQ-YGIDRGL----------GSGAKNYDDNAPYTPAWQETITGVPRQQVITV -ARQF------ADNADKTHGKSMVIIGAAMNHWYHAD-MNYRGVINLLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWLRPPRQQNSTSFFYAHTDQWRYEKLDVSEI -------VSPLADKAKFGGSMIDYNVRAERMGWLPS-----APQLK-TNPMQVVKDATAAG -MDPK-----DYVVQAL-----RD---------------GSLEMSCEDPDAPQ-NWPRNMF -VWRSNLLGS---SGKGHEYFCKHLLGTENGVQG---KDLGADEAKPTEVKWHKDAPQGKL -DLLVTLDFRMSTTCLYSDIVLPTASW--YEKNDLNTSDMH-PFIHP----L-SAAVDPVW -QSKSDWEIYKGFAKRFSEVCVGHLGVE-KEVVLTPLMHDTAAELAQPF----EVKEWKKG -ECELVPGKTAPQIAVVERDY--PNLYKRFTALGPLMNKLGNGGKGIGWKTEIEVEQL--- ------GQLNGVTREEGVTQGMPRIVSDIDACEVILQLAPETNGHVAVKAWDALGKQ---- ------TGRDHTHLALYRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHPWMVAFGEGFSSYRPPVDLK--T--TDVVQG- -------------------------LRPNGHKEIVLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGTVIWLSEDDAKSAGIQDNDWI-- ----------------ELFNVNGAVAGRAVVSQRVKNGMVMMYHSQE-------------- ---KIINTP-GSEITGVRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMQ-------KVDW---LDTP---------RDDHLVKAVQSQGEN -P--- ->yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_2728883_1 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------LYSANRVKYPLVRGRLLE---------RWRT-ALKTARTPVDA -WATIVENPDARRDYQKVRGMGGFVRSSWDEVNQLIAAANVYTIKKH----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQIWGEQTDVPESADWYNSTYIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAVTPDYSEVAKLADLWLHPKQG-TDAALAMAMGHVALNEFYF----K -QRSPYFDDYARRYTDLPLLVMLKEHILPDGSKTLVPDRYLR---------ASDFNGK-LG -QDNNPEWKTVAFD-AGGRAVLPNGSIGFRW----GAEGRSDAGKWNLENKE--A------ --------RHGAEVKLKLSVI------E--------DGTQAHEVVGVGLPYFGGVS----- ----------------TPHFTANAQQGEVNFVKVPAVRLRLG-KEGEQREALVATV----- ----FDLQVAQ-YGIDRGL----------GSGAKSYDDNAAYTPAWAESITGVPGDQIITV -ARQF------ADNAHKTRGKSMVIIGAAMNHWYHAD-MNYRGVINLLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWIRPPRQMNSTSFFYAHTDQWRYEKLGMEEI -------VSPLADKKLYGGSMIDYNVRAERMGWLPS-----APQLK-TNPLQVVKDATAAG -LDAK-----DYVVRGL-----RD---------------GTLQMSCEDPDAPQ-NWPRNMF -VWRSNLLGS---SGKGHEYFCKHLLGTESGVQG---KDLGKDDARPAEVAWHEHAPEGKL -DLLVTLDFRMSTTCLYSDVVLPTASW--YEKNDLNTSDMH-PFIHP----L-SAAVDPVW -QSRSDWEIYKGFAKAFSEVCIGHLGVE-KEVVLTPIMHDTAGEIAQPF----DVKEWKKG -QCELIPGKTAPQVTVVERDY--PNVFKRFTALGPLMDKLGNGGKGIGWKTGTEVEQL--- ------GQLNGTTQADGPTKGMPQIVTDIDACEVILQLAPETNGHVAVKAWQALGKQ---- ------TGRDHTHLALYRE----D-EKIRYR-DVQAQPRKIISSPTWSGIESETVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHPWMIAFGESMSSYRPPVDLKT----TSGIHN- -------------------------IKGNGNPEILLNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGPVVWLSEDDARLAGVQDNDWV-- ----------------EVFNINGAIAARAVVSQRVNPGMLMMYHAQE-------------- ---KIINTP-GSQITGVRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMS-------KVDW---LDTPR--------DDHLAAAYQAQGENP ----- ->yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_3072591_1 rank: C; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FTLPRE--RSA-DGHGVVTGEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLE------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------------------RWRAALTTARTPVDA -WAT--------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------IVENP------------ ------------------------------------------------------------- ------------------------------------------------------------- -DARRDYQKVRGMG----------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------G---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.19_scaffold_731_2 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FKLPQE--TYS-GRHGVATNEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLE---------RWRA-ALKVAKTPVDA -WALIADDESARRDYQQVRGLGGFVRSSWDEVNQLIASANVYTIKKH----GADRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPSSPQIWGEQTDVAESADWYNSSFIIAWGSNIPQTRTPDAH -FFTEARYKGTKTVAVTPDYSEVAKLSDLWLHPKQG-TDAALAMAMGHVILKEFYFKDGGQ -GRSAYFDDYARRYTDLPLLVMLKEHQLADGSTTLVPDRYLR---------ASDFSGQ-FG -QDNNPEWKTLAFD-TSGNPVLPNGSIGFRW---GEQLDEGELAKWNLESKD--A------ --------RNGQDVKLKLSVV------E--------DGAQPHEIAEVAFPYFGGVE----- ----------------TPNFPANAAQGEINRAKVPTVRLDLVGQGGESRQALVATV----- ----FDLQVAQ-YGIDRGF----------GSGAIDYDDNVPYTPAWQESITGVPRDQVITV -ARQF------ADNADKTHGKSMVIIGAAMNHWYHAD-MNYRGVINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWAPLAFALDWIRPSRQMNGTSFFYAHTDQWRYEKLGVEEV -------LSPLADKAAFGGSMIDYNVRAERMGWLPS-----APQLK-THPMQVVKDASAAG -LDAK-----DYVARAL-----KD---------------GSLQMSCEDPDAPQ-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSNGVQG---KDLGADEAKPTEVKWHAKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTASW--YEKNDLNTSDMH-PFIHP----L-SAAVDPVW -QAKSDWEIYKGFAQAFSEVCVGHLGVE-KEVVLTPLMHDTPAELAQPF----GVQDWKKG -ECALIPGKTAPQVTVVERDY--PNTYKRFTALGPLMNKLGNGGKGIAWKTDLEVTQL--- ------GQLNGVTLEEGVTKGMPKIVTDIDACEVILQLAPETNGHVAVKAWEAQSKA---- ------TGRDHVHLALYRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHEYIPWRTLT------GRQQFYQDHPWMIAFGEGFSSYRPPVDLK-----TTGGLS- -------------------------IKSNGNAEIQLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGTVIWLSEEDATKVGIVDNDWI-- ----------------ELFNSNGAIVGRAVVSQRVKPGMTMMYHSQE-------------- ---KIINTP-GSEITGARGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDWLEEPAGAPASGAGH----------------- ----- ->eastforkpoplarcreek_2019_sw_WHONDRS-S19S_0039_B_bin.13_k121_238651_23 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FKLPRE--AFS-GDHGLTTNEDR------TW-EDAYR -NRWAH------DKVVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLE---------RWRA-ALKVAKTPVDA -WALIAEDDAARRDYQQVRGMGGFVRSSWDEVNQLIASANVYTIKKH----GADRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPSSPQIWGEQTDVAESADWYNSNFIIAWGSNVPQTRTPDAH -FLTEARYKGTKTVAVTPDYSEVAKLSDLWLHPKQG-TDAALAMAMGHVVLKEFYFKDGGK -GRSAYFDDYARRYTDLPLLVMLKEHKLPDGSITLVPDRYLR---------ASDFNGK-LG -QGNNPEWKTVAFD-ADGRAVLPNGSIGFRW---GEKLGEGETPKWNLESKE--A------ --------RHGQDVKLKLSVV------E--------EGEQEHEIAEVAFPYFGGVQ----- ----------------TPNFPANSAQGEINRAKVPAVRLRLG-KEGDERYALVATV----- ----FDLQAAQ-YGIDRGF----------GSGAASYDDNAPYTPAWQEAITGVPRDQVVTV -ARQF------ADNADKTQGRSMVIIGAAMNHWYHSD-MNYRGVINLLMMCGCIGKSGG-G ---WAHYVGQEKLRPQT---GWAPLAFALDWIRPSRQMNSTSFFYAHTDQWRYEKLGMEEV -------ISPLADRKIYDGSMIDYNVRAERMGWLPT-----APQLK-TNPMQVVRDAAAAG -LDAR-----DYVAKAL-----KA---------------GTLQMSCEDPDAPQ-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSNGVQG---KDLGAGDAKPSEVKWHASAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTASW--YEKNDLNTSDMH-PFIHP----L-SAAVDPVW -QSRSDWEIYKGFAKAFSEVCVGHLGVE-KDVVLTPLMHDTPAELAQPF----EVKDWKKG -ECELIPGKTAQQITVVERDY--PNTYKRFTALGPLMNKLGNGGKGIAWKTELEVTQL--- ------GQLNGVTLEEGVTQGMPRIVSDIDACEVILQLAPETNGHVAVKAWDALGKV---- ------TGREHKHLALYRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHEYIPWRTLT------GRQQFYQDHPWMIAFGEGFSSYRPPVDLKT----TAEIAG- -------------------------VKPNGNPEIQLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEEDAAKAGIVDNDWV-- ----------------ELFNVNGAISARAVVSQRVKPGMTLMYHAQE-------------- ---KQINTP-GSEITGMRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDW---LDEPAGTAGSGH---------------- ----- ->cobbmillcreek_2019_sw_WHONDRS-S19S_0090_B_bin.15_k121_168873_1 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FSQPKE--TFS-GDHGLTTGEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPMVRSRLLE---------RWRA-AMKTAKTPVDA -WATIVEDDAARRDYQKVRGMGGFVRSSWDEVNQIIAASNVYTIKKH----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWG--------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->NASQAN2011_265_B_bin.52_k121_959771_6 rank: A; pzh:CX676_21060 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------GEQTDVPESADWYNAGFLMLWGSNVPQTRTPDAH -FYTEVRYRGTKSAVVSPDYSEAAKFGDIWLNPQAG-TDAALAMAMGHVILREYHL----D -RQAEYFEDYARKYTDMPMLVRLE-----DRDGHLVPGRMLR---------AEDFDGK-LG -ETNNPDWKTVAYDEATGQIAVPNGSIGFRW---------GEEGKWNLEQRA--------- ---------KGAEANLRLSQILDGHHDE---------------IVGVDFPYFGGVA----- -----------------TGDFVKCDHPEVLTRNIPARRAKLA-DGSQVLAATVFDL----- -------FCAN-YGLDRGL--------GGKWVSKDFNDDSPYTPAWAEKITGVAREKIIAV -AREF------AGNAEKTHGKSMVILGAGLNHWYHMD-MNYRGIINMLVMCGCIGQEGG-G ---WSHYVGQEKLRPQT---GWAPLAFALDWNRPPRQMNSTSCWYAHTDQWRYETLRAGEI -------LSPTAPEGDWHISLIDYNIRAERMGWLPS-----APQLK-TNPLEVAKAAKAA- ----------GKAIPAYVAEQLKS---------------GALQMSCEDPDAPE-NWPRNLF -VWRSNLLGS---SGKGHEYFLKHLLGTDHGVMG--KDLGEEGGVMPKEAVWHDEAPKGKL -DLLVTIDFRMSTTCVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-QAAVDPAY -ESKSDWEIFKSIARKFSEVAPEVLGVE-TDIVQLPLLHDTPGELAQAH-----VRDWKKG -ECDLIPGKTAPNYIAVERDY--PNLYKKFTSVGPLLEKLGNGGKGINWDTKVEVGHL--- ------RDLNGVVQDEGVSKGMAKLDTAINAAEMILMLAPETNGEVAVKAWEELEKP---- ------TGRHHAHLAEGAH----H-TKIRFR-DVAAQPRKIISSPTWSGIESETVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHLWMRAFGEGFVSYRPPVDLKTI---TKAVNN- -------------------------DAAEGNPHVVLNF-------------------ITPH -QKWGIHSTYTDNLLMLTLNR---------------GGPVVWMSEVDAQKARLVDNDWV-- ----------------EAYNINGALTARVVVSQRIKQGTLFMYHAQE-------------- ---KIVNTP-GSEKTGHRGGIHNSVT---RTTLKPTHMIGGYAQ---------LSYGFNYY -GTV-GSNRDEFVIVRKMK-------KVDWLD-TPATHKVEAAE----------------- ----- ->NASQAN2011_265_B_bin.52_k121_465271_4 rank: C; pzh:CX676_21060 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLNFFQSKELEQ---FS-DGWGQTTRENR------DW-EDVYR -NRWRH------DKIVRSTHG-VNCTGSCSWKIYVKSGIVTWETQQTDYPRTR-----AGL -PNHEPRGCARGASYSWYLYSANRVKNPLIRGALMR---------AWRK--MRPTMTPVAA -WAAIQNDPVLRASYTKTRGKGGFVRATWDEATEIIAAANAYTAKTY----GPDRV-FGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPQTWGEQTDVPESADWYNAGFLMLWGSNVPQTRTPDAH -F----------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.45_k121_975195_1 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLSH--FSAPKE--EFA-DGHGVATGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----ADL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLQ---------HWRA-ALLVAKSPVDA -WASIVENPQARAEWQKQRGLGGFVRSTWEEINQLVASANVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAVAMAMGHVILKEFYF----D -KRSAYFDNYVRRYTDMPNLVQLEERTLPDGRKVMVPGRYLR---------ASDFDGK-LG -QSNNPEWKTVALD-QDDKIVLPNGSIGFRW----GAAEREDLGKWNLENKE--A------ --------RGDTQVTLKLSLM------E----GAKDGSAADYEVGDVGFPYFGGID----- -------------TPNFDANKQSAAVGDVLVRKVPVRRVKLG-KAGEERYALVATV----- ----FDLTVAN-YGVARGL--------PGENAALSYDDDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFA--------------------------------- -----------------------------------------------LDWVRPPRQMNSTS -FFY------------------AH------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------TDQWR--------------------------------- ------------------------------------------------------------- -----------------------Y------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------ERLGVDE------ ------------------------------------------------------------- -------------------------------ILSPL------------------------- --------------ADKSK------------------------------------------ ----- ->NASQAN2015_172_B_bin.54_k121_327740_1 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------IWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAIAMAMGHVILKEFYF----D -KRSAYFDDYVRRYTDMPNLVQLEERTLPDGRQVVVPGRYIR---------ASDFNGK-LG -QDNNPDWKTVALD-QNDKIVLPNGSIGFRW----GAEGRSDEGRWNLENKE--A------ --------RGDGDVKLKLSLM------E--------GEDSEYQVGEVAFPYFGGID----- -------------TPNFHANKQVSAVDDVLVRKVPVRRIKLG-KAGEERYALVATV----- ----FDLTVAN-YGVARGL--------DGETAAKDYEEDVPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNSTSFFYAHTDQWRYEKLGVEEI -------LSPLADKSKFGGSLIDYNVRAERMGWLPS-----APQLQ-TNPMQVVKDAQAVG -MDPK-----EYAIKAL-----QD---------------GSLKMSCEDPDNPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGPEDAKPAEVKWHDKAPEGKL -DLLVTLDFRMSTTCMYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSRSDWEIYKGFAKAFSEVCVGHLGVE-KELMLTPLMHDTPAELAQAF----EVNEWQKG -KCELIPGKTAPQITVVERDY--PSTYKRFTALGPLMAKVGNGGKGIGWNTADEVQQL--- ------GELNGHVRTEGVTKGFPKIETDIDACEVVLQLAPETNGHVAVKAWEALGKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHELIPWRTLT------GRQQFYLDHPWMIAFGEGLTSYRPPVDLKT----VDDMID- -------------------------RKPNGNKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKDAGIVDNDWV-- ----------------ELFNTNGAIAARAVVSQRVNPGMVMMYHAQE-------------- ---KIINTP-GSEISGMRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVIVRKMR-------KIDW---LDNEANNQVQV----------------- ----- ->Yukon_2004-1_F_bin.10_scaffold_678_1 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- -------------------------------------NGKLGQDNNP------EW-KTVAL -DQA--------DRVVL-----PNGSIGFRWGAEGRSD--------------------AGK -WNLEDKEARGG--------NEVKLKLSLM------------------------------- ---------------------------------------------------------EGEG -ADYEVGEVA--------------------------------------------------- ----------------------FPYFGGIDT------------------PNFSANKQASA- -------------------------------------VD---------------------D ------------------VLVR--------------------------------------- ------------------------------------------------------KVPVR-- ------------------------------------------------------------- -------------------------------------RIKLG-KAGEERYALVATV----- ----FDLTAAN-YGVGRGL--------PGEDAAASYDDDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNSTSFFYAHTDQWRYERLGVEEI -------LSPLADKTKFGGSMIDYNVRAERMGWLPS-----APQLQ-TNPMQVVKDAQAQG -MDPK-----EYAVKSL-----KD---------------GSLKMSCEDPDHPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGAEEAKPTEVTWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWEIYKGFAKSFSEVCVGHLGVE-KELLLTPLMHDTPAELAQAF----DVQEWSKG -DCDLIPGVTAPQINVVERDY--PNTYKRFTALGPLLEKHGNGGKGIGWNTDDEVHQL--- ------GELNGKVRAAGVTQGMPKIETDIDACEVVLQLAPETNGHVAVKAWEALGKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYLDHPWMLAFGEGMTTYRPPVDLKT----VDEMLN- -------------------------RRPNGNKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKSAGIVDNDWV-- ----------------ELFNSNGAIAARAVVSQRVNRGMVMMYHAQE-------------- ---KTINTP-GSEITGIRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKML-------KVDW---LDDEAPATVQA----------------- ----- ->cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.17_Ga0451756_0000169_17 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLNY--FSNPKE--AFS-GGHGVTTGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLK---------HWRAALAVA-KSPVDA -WTSIVENPNARLEWQEQRGLGGFVRSTWEEVNQIIASANVYTIKQY----GADRI-IGFS -PIPAMSMIS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAIAMAMGHVILKEFYF----D -KRSAYFDDYVRRYTDMPNLVQLEERTLPDGRKVTVPGRYLR---------ASDFNGK-LG -QDNNPEWKTVALD-QADRMVLPNGSIGFRW----GAEGRSDAGKWNLEDKE--A------ --------RGGNEVKLKLSLM------E--------GEGADYEVGEVAFPYFGGID----- -------------TPNFSANKQASAVDDVLVRKVPVRRIKLG-KAGEERYALVATV----- ----FDLTAAN-YGVGRGL--------PGEDAAASYDDDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNSTSFFYAHTDQWRYERLGVEEI -------LSPLADKTKFGGSMIDYNVRAERMGWLPS-----APQLQ-TNPMQVVKDAQAQG -MDPK-----EYAVKSL-----KD---------------GSLKMSCEDPDHPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGAEEAKPTEVIWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWEIYKGFAKSFSEVCVGHLGVE-KELLLTPLMHDTPAELAQAF----DVQEWSKG -DCDLIPGVTAPQINVVERDY--PNTYKRFTALGPLLEKHGNGGKGIGWNTDDEVHQL--- ------GELNGKVRAAGVTQGMPKIETDIDACEVVLQLAPETNGHVAVKAWEALGKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYLDHPWMLAFGEGMTTYRPPVDLKTV----DEMLN- -------------------------RRPNGNKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKSAGIVDNDWV-- ----------------ELFNSNGAIAARAVVSQRVNRGMVMMYHAQE-------------- ---KTINTP-GSEITGIRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKML-------KVDW---LDDEAPATVQV----------------- ----- ->cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.23_Ga0451756_0000618_5 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLNY--FSNPKE--PFS-GGHGVTTGEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----ADL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLK---------HWRA-ALAVAKSPVDA -WASIVQNEDARREWQQQRGLGGFVRSTWDEVNQLIASANVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWGEQTDVPESADWYNSTYIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAIAMAMGHVILKEFYF----D -KRSAYFDDYVRRYTDMPNLVQLEERTLPDGRKVTVPGRYLR---------ASDFNGK-LG -QDNNPEWKTVALD-QNDRVVLPNGSIGFRW----GAEGRSDAGKWNLENKE--A------ --------RGDSEVKLKLSLM------E--------GEGSEYEVGEVAFPYFGGID----- -------------TPNFSANKQASAVDDVLVRHVPVRRIKLG-KAGEERYALVATV----- ----FDLTAAN-YGVARGL--------PGENAATSYDHDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNSTSFFYAHTDQWRYERLGVEEI -------LSPLADKSKFGGSMIDYNVRAERMGWLPS-----APQLQ-TNPMQVVKDAQAQG -MDPK-----DYAVKAL-----KD---------------GSLKMSCEDPDHPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGAEDAKPTEVTWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWEIYKGFAKAFSEVCVGHLGVE-KELMLMPLMHDTPAELAQAF----DVKEWSKG -ECELIPGKTGPQISVVERDY--PNTYKRFTALGPLMEKAGNGGKGIGWNTTDEVHQL--- ------GELNGKVRAEGVTQGMPNISTDIDACEVVLQLAPETNGHVAVKAWEALSKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYLDHPWMQAFGEGMTSYRPPVDLKT----VDEMID- -------------------------RRPNGNKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKNAGIVDNDWV-- ----------------ELFNSNGAIAARAVVSQRVNPGMVMMYHAQE-------------- ---KTINTP-GSEITGIRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMR-------KVDW---LDGEAPATVQA----------------- ----- ->NASQAN2011_028_B_bin.24_k121_53788_5 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLNY--FTNPKE--PFS-GRHGVTTGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----ADL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLQ---------HWRA-ALAVAKSPVDA -WTSIVQNEDARREWQQQRGLGGFVRSTWDEVNQLIASANVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWGEQTDVPESADWYNSNFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAIAMAMGHVILKEFYF----D -KRSAYFDDYVRRYTDMPNLVQLEERNLPDGRKVMVPGRYLR---------ASDFNGK-LG -QDNNPEWKTVALD-QNDRVVLPNGSIGFRW----GAEGRSDAGKWNLENKEA-------- --------RGDNEVKLKLSLM------E--------GEGSDYEVGEVAFPYFGGID----- -------------TPNFSANKQASAVDDVLVRHVPVRRVKLG-KAGEERYALVATV----- ----FDLTAAN-YGVARGL--------PGENAATSYDHDTPYTPAWQEKITGVKQDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTPLAFALDWVRPPRQMNSTSFFYAHTDQWRYERLGVEEI -------LSPLADKSKFGGSMIDYNVRAERMGWLPS-----APQLQ-TNPMKVVKDALAQG -MDPK-----DYAVKSL-----KD---------------GSLKMSCEDPDHPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGIEDAKPTEVHWHDQAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWEIYKGFAKAFSEVCVGHLGVE-KELMLTPLMHDTPAELAQAF----DVKEWKKG -ECELIPGKTAPQISVVERDY--PNTYKRFTALGPLMEKAGNGGKGIGWNTADEVHQL--- ------GELNGKVRAEGVTKGMPNISTDIDACEVVLQLAPETNGHVAVKAWEALSKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYLDHPWMLAFGEGMTSYRPPVDLKT----VDEMID- -------------------------RKPNGHKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKSAGIVDNDWV-- ----------------ELFNSNGAIAARAVVSQRVNPGMVMMYHAQE-------------- ---KTINTP-GSEITGIRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMR-------KIDW------------------------LDGEAPA -TVQA ->NASQAN2015_227_F_bin.21_scaffold_4919_3 rank: C; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLNY--FTNPKE--PFS-GRHGVTTGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----ADL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLQ---------HWRAALAVA-KSPVDA -WTSIVQNEDARREWQQQRGLGGFVRSTWDEVNQLIASANVYTAKQY-------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->Yukon_2004-1_F_bin.10_scaffold_25058_1 rank: C; rfr:Rfer_2792 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLSY--FSQPRE--SFS-GDHGVTTGEDR------TW-EDAYR -TRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPLVRGRLLK---------LWRE--ARLSMQPVDA -WASIAQSDEKRREYQTVRGLGGFVR------------SNVYTIKKH----GPDRI-VGFS -PIPAMSMVS------YGAGSRYLSL----------------------------------- ----IGGVPLSFYDWYCDLPPASPQVWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAVTPDYSEVAKLSDIWMKPKQG-TDAAVAMAMGHVILKEFYF----P -DGGKPRSAY---FDDMPMLVMLKEHQLPNGDTVMVPDRYVR---------ASDFNGK-LG -AANNPDWKTVAFD-ESGKVVLPNGAIGFRW----GPDGRADEGQWNLEAKE--A------ --------RHGTEVKLKLSVM------E--------GDNPSLETAKVGFPYFGGIV----- -------------SEHFPNNATGDAAKDVLVRTVPVQRISLG-KEGDKREALVATV----- ----FDLQVAN-YGVARGL--------PGELAAKDFNDDTPYTPAWQERITGTPREQLITV -ARQF------AENADKTHGKSMVIIGAAMNHWYHAD-MNYRGVINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNGTSFFYAHTDQWRYEKLGMDEV -------LSPLADKKLYGGSMIDYNVRAERMGWLPS-----APQLK-TNPFQVVKDAEAAG -MSPV-----DYTVKSL-----KD---------------GSLAMSCEDPDHPN-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTTHGVQG--------------------------- --------------------------------KDLGADEAK-------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------PTEVVW------------------------------ -----------------------------------------HKEAPEGKLAL--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----VVTLD---------------------------------------------------- -----------------------------F------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4056_4 rank: C; buq:AC233_31260 narZ; nitrate reductase; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --WRSNILGS---SGKGHEYFLKHLLGTSNGVQG---KDLGPQDAKPTEVKWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SAAVDPAW -QSRSDWEIYKGFAKKFSEVCVGHLGVE-QEVVLTPLMHDSPAELGQPM----GVQDWKRG -DCELIPGKTAPQITVVERDY--PNVFKRFTALGPLMNKVGNGGKGIAWNTQVEVTQL--- ------GQLNGLVREEGVTKGMPKIDTDIDACEVVLQLAPETNGHVAVKAWEALSKA---- ------TGRAHKHLALYRE----D-EKIRFR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHAWMLAFGEGFGSYRPPVDMKA----TALMHN- -------------------------QRPNGQPEILLNF-------------------ITPH -QKWGIHSTYTDNVLMLTLSR---------------GGPIVWLSEDDAKSAGIVDNDWV-- ----------------ELFNVNGAIAARAVVSQRVKPGMVMMYHAQE-------------- ---KIINTP-GSEITHVRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMD-------KIDW---LDTPVG-------AERVTRVQAQGENA- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4528_3 rank: C; metr:BSY238_1272 nitrate reductase, alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLSY----FSQPTEPFS-NEHGITTGEDR------TW-ENAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCQRGASYSWYLYSANRVKHPMVRARLLK---------HWRE--ARLHHDPVDA -WASIMANETKRRDYQQVRGLGGFVRSSWDEVNEIIAAANVHTIKKH----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQIWGEQTDVPESADWYNSSYIIAWGSNVPQTRTPDAH -FFTEVRYKGCKTVAVTPDYSEVAKLADLWMHPKQG-TDAALAMAMGHVILKEFYF----D -RRAAYFDDYARRYTDLPMLVMLREQTLDNGRTVLVPDRLLR---------ASDFNGK-LG -QANNPDWKTIAFD-TTGKAVAPNGSIGFRW----GPEGRADAGRWNLEDKD--A------ --------RTGADTKLKLSVL------EDEHGEGAAQAHEIVEVGF---PYFGGVV----- ----------------NPHFTGNDQGGDVRRIHVPAVRLRLG-KAGEERHALVATV----- ----FDLQAGQ-YGIDRGL----------GTGAKNFDDDAPYTPAWQEAITGVPREQVIAV -ARQF------AENAEKTEGRSMVIIGAAMNHWYHAD-MNYRGVINMLMMCGCIGKSGG-G ---WAHYVGQEKLRPQT---GWTALAFA--------------------------------- -----------------------------------------------LDWIRPPRQQNSTS -FFY------------------AH------------------------------------- ---------------------------TDQWRYE--------------------------- -----------------------------------------------------KLGMDEVL -SPLADKAAFKGSAIDFK------------------------------------------- ------------------------------------------------------------- --------------------------------APQLNVNPIQVAKA--------------- -------------------------ARAA-------------------------------- --------------------G---------------------------------------- ------------------------------------------------------------- ------------------------------------------VDPKDYTVQGLKNGS---- --------------------------------------IDLACHDPDAP------------ -----------------------------QNW----------------------------- -------PRNMFV----------------W------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.3_scaffold_11088_2 rank: A; metr:BSY238_1272 nitrate reductase, alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ----------------------S-------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------D ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------MNYRGVINMLMLCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWIRPPRQMNSTSFFYAHTDQWRYEKLGMDEI -------LSPLADKKAYAGSMIDYNVRAERMGWLPS-----APQLK-TNPLKVVRDASAAG -MDPK-----DYTVKGL-----KD---------------GTLKMSCEDPDHPD-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGRDEAKPSEVVWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWDIYKGFAKKFSEVCVGHLGVE-REMVLSPMMHDSPGELAQPL----DVKDWKRG -EVDLIPGKTAPNMVVVERDY--PNVYKRFTALGPLMNKVGNGGKGIAWNTQTEVKQL--- ------GELNGLITEQGVTCGMPRIDSDIDACEVVLQLAPETNGHVAVKAWQALGKQ---- ------TGIDHTHLALYRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHELIPWRTLT------GRQQFYMDHPWMIAFGEGFTSYRPPVDLKTT---------- ----------AGIHGIKSNGNP----------EILLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKRAGIVDNDWV-- ----------------ELFNINGAIAARAVVSQRVNNGMTLMYHAQE-------------- ---KIINTP-GSEITGIRGGIHNSVT---RVVLKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDW---LDTPADASNPA------------GSHA- ----- ->NASQAN2016_164_F_bin.17_scaffold_8891_2 rank: A; rfr:Rfer_2792 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTY--FSQPRE--SFS-GDHGVTTGEDR------TW-ENAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPLVRGRLLK---------LWRE--ARLSQDPVDA -WASIAQSDAKRKEYQSVRGLGGFVRSSWDEVNEMVAAANVYTIKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQIWGEQTDVPESADWYNS----------------DAH -FFTEVRYKGTKTVAVTPDYSEVAKLSDIWMKPKQG-TDAAVAMAMGHVILKEFYFPDGGK -ARSTYFDDYVRRYTDMPMLVMLKEQTLPSGEVVMVPDRYLR---------ASDFNGK-LG -AANNPEWKTVALD-ESGKVVLPQGAIGFRW----GPDGRADEGQWNLQAKE--A------ --------RHGNDVKLKLTVM------E-----GEQASLETAKVGF---PYFGGIE----- -------------SEHFPNNATGAGANNVLVRTVPVQRIALG-KAGDTREALVATV----- ----FDLQVAN-YGVARGL--------PGELAAKDFNDDTPYTPAWQERITGTPREQLITV -ARQF------ADNADKTHGKSMVIIGAAMNHWYHAD-MNYRGVINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFGLDWIRPPRQMNSTSFFYAHTDQWRYEKLGMEEV -------LSPLADKKAFGGSMIDYNVRAERMGWLPS-----APQLK-TNPLQVVRDAQAAG -MEPK-----DYAVKGL-----KE---------------GTLSMSCEDPDHPD-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSNGVQG---KDMGHDEAKPEEVVWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->NASQAN2015_227_B_bin.17_k121_559871_7 rank: A; rfr:Rfer_2792 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTY--FSQPKE--AFS-GEHGVSTGEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPLVRGRLLK---------LWREARLS--MDPVDA -WASIAQDDAKRKEYQSVRGLGGFVRSGWDEVNEMVAAANIYTIKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYC-------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.12_scaffold_10959_2 rank: A; aon:DEH84_18240 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- --------------------AA-------------------------------DW-VRPSR -QQN--------STSFFYAHT---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------DQWRYEKL----------------- --------------GVNEVLSPLADKAKF-------------------------------- ------------------------------------------------------------- ----------------------------------------GGSMI---------------- ---------------------------D--------------------------------- ------------------------------------------------------------- ----YNVRAER-------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------MGWLPS-----APQLQ-TNPLNLVKEAQAKG -MDAK-----DYAVQSL-----KD---------------GSLKMSCEDPDNPA-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTTHGVQG---KDLGPNDAKPQEVQWHNQAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SAAVDPAW -EARSDWEIYKGFAQKFSEVCVGHLGAE-REVVMTPIMHDTAAELAQPF----GVQEWKKG -EIDLIPGKTAPQIAVVERDY--PNTFKRFTSLGPLMNKLGNGGKGIGWNTQDEVHAL--- ------GELNGTVREEGVSQGMPKIVSDIDASEVVLMLAPETNGHVAVKAWEALGKQ---- ------TGRDHTHLALHRE----D-EKIRYR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHELIPWRTLT------GRQQFYMDHPWMIAFGEGFVSYRPPVDLKT----LDDIKG- -------------------------VKPNGNKEIALNF-------------------ITPH -QKWGIHSTYTDNLLMLTLNR---------------GGPVIWLSEDDAKSAGIVDNDWV-- ----------------ELFNTNGAIAARAVVSQRVNNGMVLMYHAQE-------------- ---KIVNTP-GSEITGTRGGIHNSVT---RVVLKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDWLDDESSNQGVHA------------------- ----- ->NASQAN2016_164_F_bin.17_scaffold_1152_1 rank: C; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- -----------------VTCG---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------------MPKI- ------------------------------------------------------------D ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------TDIDAC------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------EVVLQLAPETNGHVAVKAWKALGKQ---- ------TGLDHTHLALYRE----D-EKIRFR-DIQAQPRKIISSPTWSGIESETVSYNA-- --------------------GYTNVHEMIPWRTR--EGFTTYRPPVDLKT----TAGIQN- -------------------------IKPNGNKEIALNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGSVVWLSETDAKSVGIEDNDWI-- ----------------EVFNINGAIAARAVVSQRVNPGMTLMYHSQE-------------- ---KIINTP-GSEITGMRGGIHNSVT---RIVLKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDW--------------------LEEEAQGENA- ----- ->NASQAN2015_227_F_bin.21_scaffold_2406_1 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------VSYNAGYTNVHEMI---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------PWRTL-------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------T------------------------------------- --------------------GRQQFYMDHPWMTAFGENFSSYRPPVDLKT----TAGIQN- -------------------------IKPNGNKEIALNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGSVVWLSEDDAKSAGIEDNDWI-- ----------------EVFNINGAIAARAVVSQRVNPGMTLMYHSQE-------------- ---KIINTP-GSEITGVRGGIHNSVT---RIVLKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMA-------KVDWLDDEGSSTEPTATHN---------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.10_scaffold_7566_1 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FSSPKE--SFS-DGHGVTTGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTRD-----DL -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLQ---------HWRA-ALAVSKSPVDA -WANIVENTAARSEWQKQRGLGGFVRSTWEEVNQLIASANVYTAKKY----GPDRV-MGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSNFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYSEVAKLADLWMHPKQG-TDAAVAMAMGHVILKEFYF----N -KRSAYFDDYVRRYTDMPNLVQLEERTLPDGRKVMVPGHYLR---------ASDFNGK-LG -QDNNPEWKTVAID-ENDKIVLPNGSIGFRW----GAEGRSDMGKWNLESKEA-------- --------RGDAEVKLKLSLM------E--------GATPDYEVGDVGFPYFGGID----- -------------TPNFNANKQGEAVDDVLVRKVPVRRIKLG-KAGEERYALVATV----- ----FDLTVAN-YGVARGL--------AGENAALSYDDDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTKGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNGTSFFYAHTDQWRYEKLGVEEI -------LSPLADKSKFGGSLIDYNVRAERMGWLPS-----APQLE-TNSFQVVKDAQAAG -MDTK-----DYVVKSL-----KD---------------GSLKMSCEDPDNPK-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTTNGVQG---KDLGAEEAKPTEVQWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSRSDWEIYKGFAQAYSEVCVGHLGVE-KEVVLTPLMHDTPSELAQAF----DVKEWKKG -ECDLIPGKTAPTIAVIERDY--PNTFARFTALGPLMEKAGNGGKGIGWDTKVEVQQL--- ------QSLNGKVHTEGVSKGMAKIVTDIDAAEVILQLAPETNGHVAVKAWEALSKI---- ------TGRDHTHLAIHRE----D-EKIRFR-DVQAQPRKIISSPTWSGI----------- ----------------------------ESETVSYNAGYTNVHE----------------- ----------------------------------MIPWRTLT------------------- ------------------------------------GRQHFYL------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_237162_4 rank: C; deu:DBW_2564 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- --------------------------------TLT-------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------GRQHFYLDHDAYIAFGEHLSTYKPSPT-------------- ----------PEAYGDLRKT-----VNDGHAKMLN---------------------CLTPH -GKWHIHSTYGDTLRMLTLSR---------------GNEPCWLSEEDAAELGIKDNDHV-- ----------------EVYNDHGVYVARACVSARIPKGVCIVYHAVERTYNIP-------- ---KSQIRR-GEHGEPRRGGMNNSFT---RVHLKPNLMCGGYGQ---------FTYHFNYW -GPV-GVNRDTHVLVRKMH-------VVEY------------------------------- ----- ->sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_397025_1 rank: C; mox:DAMO_0778 narG; Nitrate reductase, alpha chain; may be more similar to a nitrite oxidoreductase; K00370 (db=kegg) ------------------------------------------------------------- --------------------MG--------------WIQDLFAPEQR------SW-EDFYR -NRWAH------DKVVRTTHG-VNCTGSCSWNVYVKQGVVTWEMQALDYPTID-----RSI -PNYEPRGCQRGISTSWYIYSPLRVKHPYMRGALLD------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------LWQEARRE--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------------------------HP------------------ ----------DDPVAAW-------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------ASIT----------------------------------- ------------------------------------------------------------- ----- ->AFN37208|Nitrolancea_hollandica_Lb ------------------------------------------------------------- ----------------------------------------------R------QW-EEFYR -NRWQH------DNITRSTHG-VNCTGGCSWMVFVKDGIVTWEMQATDYPLLE-----PSL -PPYEPRGCQRGISASWYVYSPIRVKYPYMRGPLMD---------FWREARAQH-SDPIQA -WASIVQDEQKRQRWQRARGKGGFRRATWDECLELVASSLLYTAKKY----GPDRV-VAFA -PIPAYSYLS------FGAGTRFIQL----------------------------------- ----FGGFTLSFYDWYADLPNSFPEVWGDQTDVCESADWYNSKFIVANGANMNMTRTPDVH -FISEARHNGTKFVVIAPDFSQVAKYSDWWLPVKAG-QDQALWMGIDHVILKEFYI----D -RQVPYFIEYQKRYTDGPMLVKVHP----TKGGAYSMGQFLR---------ANRINRY--K -DVENGNWQLLVWDKQSG-PRLPKGCIGYRW-------AKKETGKWNITMED--A------ --------MDNTPLDPLLSFL---GQHD---------------------AVAEVEF----- ---------------------DIFGTGKVSRRAVPIKYLETS-EGKVAVTTA--------- ----FDLLLAQ-FAVGRPG--------LTGDYPKSYDDDMPYTPAWQEPYTGIGRDTVIRF -AREF------AGNAEATQGRSMVITGASLNHWYNNG-LCYRGPITALILCGCCGRNGG-G ---LNHYVGQEKLTLVA---AWSCWALGKDWVPTSRLQQSSSWHYAHSDQWRYEGDFTEYA --------PIPRETRWAKGHAMDLLASAVRMGWMPS-----YPQFN-RNPLDVVKQAEAAG -AKT------DEQIVKWVVEQVKS---------------KQLKFAIEDVDAPE-NWPRTWL -IWRGNALQS---SAKGAEFFLRHYLGTHDNAIA-----EEHAKGRVKDVTFREPAPRGKM -DLLCQLNFRMDTTATYCDVVLPTAFW--YEKNDLNTTDLH-TFIHP----L-GAATPPAW -ESKTDYEIFKAIAKKVSELAPSVFQGPVKDIVMTPLAHDTPDELSQDYQAGMKVLDWGKG -EIEMIPGKTAPHFKVVERDY--ANIYNQWITFGPKARENGIVGNGEHIDIKPFYDELLEN -PIDAQPDVRHMRCRVWGGQRYPGLEFAEEAANLLLHLSPESNGEVSYHAFKEGEHQ---- ------VGLPLADLAEGVR----G-VRMTYF-DLTRQVRRTLISPCWTGMVNDGRAYAAWC -LNVERLIPWRTLS------GRQHHYMDHPYYIDYGEQLMTHKPKLDPRK----TGDIV-- -------------------------RSPVDDESVVLNY-------------------ITPH -GKWHIHSTYYDNHRLLTLSR---------------GIEPCWLNDKDAARIGVKDNDWV-- ----------------EVYNDNGVMVTRAAVSARVQMGTCMIYHAPE-------------- ---RTISIPKSQVRGNRRGGAHNSLT---RIRINPMQMAGGYAQ---------WTYAWNYW -GPIGIMTRDTHVAVR--------------------------------------------- ----- ->AFN37205|Nitrolancea_hollandica_Lb ------------------------------------------------------------- -----------------------------------------------------QW-EEFYR -NRWQH------DNITRSTHG-VNCTGGCSWMVFVKDGIITWEMQATDYPLLE-----PSL -PPYEPRGCQRGISASWYVYSPIRVKYPYMRGPLMD---------FWREARAQH-SDPIQA -WASIVQDEQKRHRWQRARGKGGFRRATWDECLELVASALLYTAKKY----GPDRV-VAFA -PIPAYSYLS------YGAGSRFIQL----------------------------------- ----FGGFNLSFYDWYADLXNSFPEVWGDQTDVCESADWYNSKFIVSNAANMNMTRTPDVH -FISEARHNGTKFVVLAPDFSQVAKYSDWWIPVKAG-QDQALWMGADHVILKEFYI----D -RQVPYFIEYQKRYTDGPMLVKVHP----TKGGAYSMGQFLR---------ANRINRY--K -DVENGNWQLLVWDKQSG-PRLPKGCIGYRW-------AKKETGKWNITMED--A------ --------MDNTPLDPLLSFL---GQHD---------------------AVAEVEF----- ---------------------DIFGTGKVSRRAVPIKYLETS-EGK----VAVTTA----- ----FDLLLAQ-FAVGRPG--------LTGDYPKSYDDDMPYTPAWQEAYTGIGRDTVIRF -AREF------AGNAEATQGRSMVITGASLNHWYNNG-LCYRGPITALILCGCCGRNGG-G ---LNHYVGQEKLTLVA---AWTCWALGKDWIPPSRLQQTSTWHYANSDQWRYEGDFTDYA --------PIPRETRWAKGHAMDLLASAVRMGWMPS-----YPQFN-RNPFEVVKQAEAAG -AKT------DEQIVKWVVAQLKS---------------KQLRLAIEDVDAPE-NWPRTWL -IWRGNAMQS---SAKGAEFFLRHYLGTHDNAIA-----EEHAKGRVKDVVVREPAPRGKM -DLVCQLNFRMETTATYSDIVLPTAFW--YEKNDLNTTDLH-TFIHP----L-GAATPPAW -ESKTDYEIFKAIAKKVSELAPSVFQGPVKDIVMQPLAHDTPDELSQDYLAEMKVLDWGKG -EVDLIPGKTAPHFKIIERDY--ANLYNQWTSFGPKARENGIVGNGEHIDIKPFYDELLEN -PIDAQPDVRHMRCRVWGGQRYPGLEFAEEAANLLLHLSPESNGEVSYHAFKEGEHQ---- ------VGLPLADLAEGVR----G-VRMTYF-DLTRQVRRTLISPCWTGMVNDGRAYAAWC -LNVERLIPWRTLS------GRQHHYMDHPYYIDYGEQLMTHKPKLD--PRK--TGDIVR- ---------------SPVDDES-----------VVLNY-------------------ITPH -GKWHIHSTYYDNHRMLTLSR---------------GIEPCWLNDKDAARIGVKDNDWV-- ----------------EVYNDNGVMVTRAAVSARVQMGTCMVYHAPERT------------ ----ISIPK-SQVRGNRRGGAHNSLT---RTRINPMQMAGGYAQ---------WTYAFNYW -GPIGIFTRDTHVA----------------------------------------------- ----- ->AFN37207|Nitrolancea_hollandica_Lb ------------------------------------------------------------- ----------------------------------------------R------QW-EEFYR -NRWQH------DNITRSTHG-VNCTGGCSWMVFVKDGIITWEMQATDYPLLE-----PSL -PPYEPRGCQRGISASWYVYSPIRVKYPYMRGPLMD---------FWREARAQH-SDPIQA -WASIVQDEQKRQRWQRARGKGGYRRATWDECLELVASALLYTAKKY----GPDRC-AAFA -PIPAYSYLS------YGAGSRFFQL----------------------------------- ----FGGFNMSFYDWYADLPNSFPEVWGDQTDVCESADWYNSKFIVSNAANLNMTRTADVH -FVSEARHNGTKFVVIAPDFSQVAKYSDWWIPVKAG-QDQALWMGADHVILKEFYI----D -RQVPYFIDYQKRYTDGPMLVKVHQ----TKGGAYSMGQFLR---------ANRINRY--K -DVENGNWQLLVWDKQSGP-RLPKGCVGYRW-------ATKETGKWNISMED--A------ --------MDNTPLDPLLSFL---GQHD---------------------EVAQVEF----- ---------------------DIFGTGKVARRGVPIKYLETS-EGK-VAVTTAFDL----- -------LLAQ-FAVGRPG--------LTGDYPKSYDDDMPYTPAWQEAYTGIGRDTVIRF -AREF------AGNAEATQGRSMVITGASLNHWYNNG-LCYRGPIEAPILTGCCGRNGG-G ---LNHYVGQEKLTLVA---AWTTWALGRDWIPPSRLQQSPVWHYAHSDQWRYEGDFTDYA --------PIPRETRWAKGHAIDLLASAVRMGWMPF-----YPQFN-RNPLEIVKQAEAAG -AKS------DEQIVKWVVGQLKS---------------GNLRYAIEDIDAPE-NWPRTWV -IWRGNAMQS---SAKGAEFFLRHYLGTHDNAVA-----EEHAKGRVKDVVLRDPAPRGKM -DLVCDINFRMETTALYSDMVLPTAMW--YEKNDLNTTDLH-SFIHP----L-GAAVPPVW -EAKTDYEIFKAIAKKVSELAPSVFPQPVKDIISNPLIHDTPDELAQDYLSEMKVLDWGKG -EIDLIPGKTGPHLKIVERDY--VNLYNRWISFGPKARENGISGNGVHIDIKPFYDELLEN -PLDAQPDVRHMRCIEWGGGRYPRLEFAEEAANLLLHLSPETNGEVCYHAFKEEEKQ---- ------IGMPLADLAESIR----G-VRMNYF-DLTRQVRRTMISPCWTGMINDGRAYAAWC -LNVERLVPWRTLS------GRQHHYMDHPYYIDYGEQLMTHKPKLDPRKTG--DIVRSP- ----------VDDES------------------VVLNY-------------------ITPH -GKWHIHSTYYENHRMLTLSR---------------GIEPCWINDKDAARIGIKDNDWV-- ----------------EVYNDNGVMVTRAAVSARVQMGTCMIYHAPERT------------ ----ISIPK-SQVRGNRRGGAHNSLT---RTRINPMQMAGGYAQ---------WTYMFNYW -GPIGIFTRDTHVAVR--------------------------------------------- ----- ->AFN37206|Nitrolancea_hollandica_Lb ------------------------------------------------------------- ----------------------------------------------R------QW-EEFYR -NRWQH------DNITRSTHG-VNCTGGCSWMVFVKDGIITWEMQATDYPLLE-----PSL -PPYEPRGCQRGISASWYVYSPIRVKYPYMRGPLMD---------FWREARAQH-SDPIQA -WASIVQDEQKRQRWQRARGKGGYRRATWDECLELVASALLYTAKKY----GPDRV-TAFA -PIPAYSYVS------FGAGARFIQL----------------------------------- ----FGGFHLSFYDWYADLPNSFPEVWGDQTDVCESADWYNSKFIVSNAANLNMTRTADVH -FVSEARHNGTKFVVLAPDFSQVAKYSDWWIPVKAG-QDQALWMGADHVILKEFYI----D -RQVPYFIEYQKRYTDGPMLVKVHQ----TKGGAYSMGQFLR---------ANRINRY--K -DVENGNWQLLVWDKQSGP-RLPKGCIGYRW-------AKKETGKWNITMED--A------ --------MDNTPLDPLLSFL---GQHD---------------------AVAEVEF----- ---------------------DIFGTGKVSRRAVPIKYLETS-EGK----VAVTTA----- ----FDLLLAQ-FAVGRPG--------LTGDYPKSYDDDMPYTPAWQEGYTGIGRDTVIRF -AREF------AGNAEATQGRSMVITGASLNHWYNNG-LCYRGPITALILCGCCGRNGG-G ---LNHYVGQEKLSLVS---AWQSWALAKDWFPPSRVQQSSTWHYAHSDQWRYEGDFTDYA --------PIPRETRWAKGHAMDLLASAVRMGWMPM-----YPQFN-RNPLELVKQAEAAG -AKS------DEQVVEWVVGQLKS---------------GNLRYAIEDVDAPE-NWPRVWL -IWRGNAFQS---SAKGAEYFLRHYSGTHDNAVA-----EEHAKGRVKDVVFREPAPRGKF -DLLCDLNFRMDTTALYSDIVLPTAMW--YEKNDLNTTDLH-TFIHP----L-GAAVPPVW -EAKSDYEIFKSLAKKVSELAPSVFPQPVKDIVSNPLAHDTPDELSQDYLAEMKVLDWGKG -EIEMIPGKTAPHFKIVERDY--VNFYNRWISYGRKARENGIVGNGVHIDIKPFYDELLEN -PLDAQPDVRHMRCIEWGGQRYPRLEFAEEACNLIMFLAPESNGEVCYHAFKEEEKQ---- ------LGLPLADLAEAVR----G-VRMNFF-DLTRQVRRTLISPCWTGMVNDGRAYSAWC -LNVERLIPWRTLS------GRQHHYMDHPYYIDYGEQLMTHKPKLD--PRK--TGDIVR- ---------------SPVDDES-----------VVLNY-------------------ITPH -GKWHIHSTYYDNHRMLTLSR---------------GIEPCWLNDKDAARIGIKDNDWV-- ----------------EVYNDNGVMVTRAAVSARVQMGTCMIYHAPERT------------ ----ISIPK-SQVRGNRRGGAHNSLT---RTRINPMQMAGGYAQ---------WTYMWNYW -GPIGILTRDTHVAVR--------------------------------------------- ----- ->WP_005004540|Nitrococcus_mobilis ------------------------------------------------------------- --------------------MG--------------WIQDLINPKTR------RW-EEFYR -NRWQH------DNIFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLGRGEGGRGI -PPYEPRGCQRGISASWYVYSPIRVKYPYGKGVLLD---------FWREARSSH-NNPVEA -WSSIVTDENKRKRWQKARGKGGYRRTTWDELLELIASACLYTAQKY----GPDRV-MGFS -PIPAMSMLS------YAAGSRFLQL----------------------------------- ----FGGVNMSFYDWYADLPNSFPEIWGDQTDVCESADWYNSKFIVSMASNLNMTRTPDVH -FISEARHEGAKFVVLAPDFSQVSKYADWWIPVKKG-EDLGLWMAAGHVIYTEFYV----K -RQVPYFIDYVTRYTDMPFLVKLE-----KDGDGYRPGRYLT---------SEEVKKY--K -KQENAAWKQLVFDRKSNEARCPKGQIGHRH---------GKHGQWNLKMEDG-------- --------LDNSPIEPVLSFL--GESDD---------------------VAMVQFY----- ----------------------EFASQTVYKRGVPAKKIDTG-SGSVLVATV--------- ----YDLNMGQ-YAVNRGL---------PGDYPESYDDLKPYTPAWQEQFSGIGRQTVIRF -AREF------AGTAEKTKGRSMVIVGASANHWYHNN-HIYRAAINCLIACGCCGRNGG-G ---MNHYVGQEKLAIVA---PWNALALAGDWGIKPRLQQSPVWHYVNSDSWRYEGSFEEYA --------PSPPNAKWAKGHSVDLVAKSVRMGWMPH-----YPQFN-RSPLEVAREAEKAG -AKD------DKGMADYVVQALKK---------------KNLSFSVDDPDAPE-NWPRVWF -IWRGNAMQS---SAKGAEFFLRHYLGTHDNAVA-----EERAKPHVKHVKFREPAPRGKF -DLVVDINFRMDSTALYSDIVLPTAFW--YEKNDLNSTDLH-SFIHP----L-GQAVPPVW -ESKSDWDIFKAFAKKISEMAPSVFSEPFKDVVAAPLTHDTPDEIAQRD-----VKDWLEG -ECEPIPGKTMPHFRVVERDY--SLLYNKYISLGSAIRENGISGNGCSFPITKQYDELTNQ -PVGGSPDPRHRRAVEWGGKRYPCVEDALDAANVLLYLAPETNGEVAYQAFKSEQEH---- ------CGVPLTDLAEPYR----G-HQVTFY-DLTRQPRRLLCSPVWTGNCGDGRAYSAWT -LQIDRLVPFRTLT------GRQHIYIDHPWYMDFGEHLCTYRPKLDYKKIHDLDNSPID- ------------------------------DKTLILNY-------------------ITPH -GKWNIHSTYKDNHRMLTLSR---------------GMDPVWINDKDAARVGLKDNDWV-- ----------------EVYNDNGVIVTRANVSRRVQSGMCLYYHAVE-------------- ---RTIYIPKSQIRGGRRAGGHNSVT---RTRINPVYLAGGNAQ---------FTYLFNYW -GPTGIMTRDTHVAVRKLE-------KLEW------------------------------- ----- ->Nitrococcus_mobi_EAR23355 ------------------------------------------------------------- --------------------MG--------------WIQDLINPKTR------RW-EEFYR -NRWQH------DNIFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLGRGEGGRGI -PPYEPRGCQRGISASWYVYSPIRVKYPYGKGVLLD---------FWREARSSH-NNPVEA -WSSIVTDENKRKRWQKARGKGGYRRTTWDELLELIASACLYTAQKY----GPDRV-MGFS -PIPAMSMLS------YAAGSRFLQL----------------------------------- ----FGGVNMSFYDWYADLPNSFPEIWGDQTDVCESADWYNSKFIVSMASNLNMTRTPDVH -FISEARHEGAKFVVLAPDFSQVSKYADWWIPVKKG-EDLGLWMAAGHVIYTEFYV----K -RQVPYFIDYVTRYTDMPFLVKLE-----KDGDGYRPGRYLT---------SEEVKKY--K -KQENAAWKQLVFDRKSNEARCPKGQIGHRH---------GKHGQWNLKMED--G------ --------LDNSPIEPVLSFL--GESDD---------------------VAMVQFY----- ----------------------EFASQTVYKRGVPAKKIDTG-SGS----VLVATV----- ----YDLNMGQ-YAVNRGL---------PGDYPESYDDLKPYTPAWQEQFSGIGRQTVIRF -AREF------AGTAEKTKGRSMVIVGASANHWYHNN-HIYRAAINCLIACGCCGRNGG-G ---MNHYVGQEKLAIVA---PWNALALAGDWGIKPRLQQSPVWHYVNSDSWRYEGSFEEYA --------PSPPNAKWAKGHSVDLVAKSVRMGWMPH-----YPQFN-RSPLEVAREAEKAG -AKD------DKGMADYVVQALKK---------------KNLSFSVDDPDAPE-NWPRVWF -IWRGNAMQS---SAKGAEFFLRHYLGTHDNAVA-----EERAKPHVKHVKFREPAPRGKF -DLVVDINFRMDSTALYSDIVLPTAFW--YEKNDLNSTDLH-SFIHP----L-GQAVPPVW -ESKSDWDIFKAFAKKISEMAPSVFSEPFKDVVAAPLTHDTPDEIAQRD-----VKDWLEG -ECEPIPGKTMPHFRVVERDY--SLLYNKYISLGSAIRENGISGNGCSFPITKQYDELTNQ -PVGGSPDPRHRRAVEWGGKRYPCVEDALDAANVLLYLAPETNGEVAYQAFKSEQEH---- ------CGVPLTDLAEPYR----G-HQVTFY-DLTRQPRRLLCSPVWTGNCGDGRAYSAWT -LQIDRLVPFRTLT------GRQHIYIDHPWYMDFGEHLCTYRPKLDYKKIH--DLD---- -------------------------NSPIDDKTLILNY-------------------ITPH -GKWNIHSTYKDNHRMLTLSR---------------GMDPVWINDKDAARVGLKDNDWV-- ----------------EVYNDNGVIVTRANVSRRVQSGMCLYYHAVERT------------ ----IYIPK-SQIRGGRRAGGHNSVT---RTRINPVYLAGGNAQ---------FTYLFNYW -GPTGIMTRDTHVAVRKLE-------KLEW------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_1443778_1 rank: C; mox:DAMO_0778 narG; Nitrate reductase, alpha chain; may be more similar to a nitrite oxidoreductase; K00370 (db=kegg) ------------------------------------------------------------- ---------------------------------MS-WIEDIISPNTR------KW-EEFYR -NRWQY------DKVVRSTHG-VNCTGGCSWAIHVKDGIVVWEMQQLDYPQFN-----KDV -PPYEPRGCQRGISYSWYLYSPIRVKYPIIRGALID---------LFRE------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------E ------------------------------------------------------------- ------------------------------------------------------------- --------KKKCG------------------------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------G ------------------------------------------------------------- -----------------------------------------DPVLA--------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------------------------W--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------------ANLQADDTK------------ ---------------------------RKRYQRA--------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->Nitrobacter_winogradskyi_gb_ABA05326 ------------------------------------------------------------- ---------------------------------MS-WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRVKYPYIRGPLAD---------LWHEAKASY-PDPVQA -WASLVEDEEKRNRIQKARGKGGFRRAKWEELIELIAASCLYTARKH----GPDRV-MGFS -PIPAMSMLS------FAAGTRFLSL----------------------------------- ----FGGGLMSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMASNMNMTRTPDVH -FISEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYI----D -RQVPYFIDYVKRYTDLPFLVELEP-----NGNTYKTGRLLR---------SNRVARY--K -DVENGEWKMLVLDTATGEPRAFKGQVGDRW--------GSTHGKWNLSAED--T------ --------LDNSPIDPVLSFI------D--------QSDGVVQVGFD--DFVNGSV----- -----------------------------VSRGVPVKRIATD-KGE----VLVTTG----- ----FDIMMSQ-FGHSRGL--------EGSFATSYDDEDAPYTPAWQERHTGIGRETAIRF -AREF------ATNAELTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWSTVAMALDWNKPPRVVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPRWAKGHAIDLEAKSVRCGWMPF-----TPNFH-RNPIEVVAEAERAG -AKS------TADIATYVADQVAS---------------KKLDLAINDPDAEE-NWPRVWF -IWRANAIQS---SAKGHEFFLRHYLGAHDNVIA-----EERAKGKTTTVKYRDTAPQGKY -DLVVDINFRMNTTGLYSDIILPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWEIFKLIAKKVSELSPLAFSKPVRDIVLQPLMHDTPDELAQPE-----ILDWAEG -ECKLVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGISAVGVNIPIKKQYDQMLEN -PIMPMPDSRHMRCVEWGGKRYPSLEDVLDACNVVLLCAPVANGEVSYQGFVNEEQH---- ------VGLPLADIAEPTR----G-VSSTFY-DLTRQPRRILTSPCWTGLVNDGRAYSAWC -MNIERLVPWRTLT------GRQSLYLDHQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- --------------------------SRVDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRLLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RIRINPLFLAGGYAQ---------FTYGWNYW -GPTGIFTRDTHVVVRKME-------KVEW------------------------------- ----- ->WP_011314088|Nitrobacter_winogradskyi ------------------------------------------------------------- ---------------------------------MS-WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRVKYPYVRGPLYD---------LWKEAKASH-PDPVQA -WASLVGDEQKRSRIQKARGKGGFRRAKWEELVELIAAAALYTARKY----GPDRV-MGFS -PIPAMSMLS------YAAGSRFLQL----------------------------------- ----FGGVNMSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMAANMNMTRTPDVH -FISEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYI----D -RQVPYFIDYVKRYTDLPFLVELEP-----NGNTYKTGRLLR---------SNRVARY--K -DVENGEWKMLVLDTATGEPRAFKGQVGDRW--------GSTHGKWNLSAED--T------ --------LDNSPIDPVLSFI------D--------QSDGVVQVGFD--DFVNGSV----- -----------------------------VSRGVPVKRIATD-KGE----VLVTTG----- ----FDIMMSQ-FGHSRGL--------EGSFATSYDDEDAPYTPAWQERHTGIGRETAIRF -AREF------ATNAELTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWNTIAMALDWTKPPRVVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPRWAKGHAIDLEAKSVRCGWMPF-----TPHFN-RNPIELAAEAERAG -AKS------TADIVTHVVDQVAS---------------KKVNFAIDDPDAEE-SWPRMWF -IWRGNAIQS---SAKGHEFFLRHYLGAHDNSIA-----EDRAKGKTQRVKYRDTAPRGKY -DLVVDLNFRMNTTSLYSDIVLPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWEIFKLISKKVSELSPLAFSKPVRDVVVQPLMHDTPDELAQPE-----ILDWAEG -ECKPVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGVSAVGVNIPIKKQYDQMLDN -PIMPMPDARHMRCVEWGGKRYPSLEDVLDACNTLLMCAPEANGEVCYQGFHNEEHH---- ------VGLPLVDIAEPTR----G-VSSTFY-DLTRQPRRILTSPCWTGLTNDGRAYSAWC -MNVERLVPWRTLT------GRQSLYLDHQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- --------------------------SRVDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRMLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RTRINPLFLAGGYAQ---------FTYGFNYW -GPTGIFTRDTHVVVRKME-------KLEW------------------------------- ----- ->Nitrobacter_sp_Nb_311A_ZP_01048070 ------------------------------------------------------------- ---------------------------------MS-WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRVKYPYIRGPLYD---------LWREAKASH-PDPVQA -WASLVGDEQKRLRMQKARGKGGFRRAKWEELVELIAAAALYTARKW----GPDRV-MGFS -PIPAMSMLS------YAAGSRFLQL----------------------------------- ----FGGVNMSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMAANMNMTRTPDVH -FIAEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYI----D -RQVPYFIDYVKRYTDLPFLVELEP-----NGNTYKTGRLLR---------AKRVARY--Q -DVENGDWKMLVLDSKTGEPRAFKGQVGDRW--------GSTHGKWNLSAED----TLDNS -PIDPVLSFIDQSDGVVQVGF------D---------------------DFVNGSV----- -----------------------------VSRGVPVKRIATD-KGEVLVTTG--------- ----FDIMMSQ-FGHSRGL--------EGSFATSYDDENAPYTPAWQERHTGIGRETAIRF -AREF------ATNAELTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWNTIAMALDWTKPPRVVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPRWAKGHAIDLQAKAVRSGWMPF-----TPHFN-RNPIELAAEAERAG -AKS------TDDIVTHVVDQVAS---------------KKVNFAIDDPDAEE-SWPRMWF -IWRGNAIQS---SAKGHEFFLRHYLGAHDNSIA-----EDRAKGKTQRVKYRDTAPRGKY -DLVVDLNFRMNTTSLYSDIVLPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWEIFKLIAKKVSELSPLAFSKPVRDVVVQPLMHDTPDELAQPE-----ILDWAEG -ECKPVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGVSAVGVQIPIKKQYDQMLDN -PIMPMPDPRHMRCVEWGGKRYPSLEDVLDACNTLLMCAPEANGEVCYQGFHNEEHH---- ------VGLPLVDIAEPTR----G-VSSTFY-DLTRQPRRILTSPCWTGMTNDGRAYSAWC -MNVERLVPWRTLT------GRQTLYIDSQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- --------------------------SRVDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRMLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RTRINPLFLAGGYAQ---------FTYGFNYW -GPTGIFTRDTHVVVRKME-------KLEW------------------------------- ----- ->A_Nitrobacter_hamburgensis_YP_578638 ------------------------------------------------------------- --------------------MS--------------WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRVKYPYIRGPLLD---------MWREAKASS-ADPVQA -WGALIGDEQKRSRIQKARGKGGFRRAKWEELVELIAAASLHTARKH----GPDRI-MGFS -PIPAMSMLS------FAAGTRFLSL----------------------------------- ----MGGSLMSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMASNMNMTRTPDVH -FISEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYV----D -RQVPYFVDYIKRYTDLPFLVELES-----NGNTYKTGRLLR---------SNRVPRY--K -DVENGDWKMLLLDANSGELRAPKGQVGDRW--------GSVHGKWNLSGED----TLDNS -PLDPVLSFIDRSDDVVQVGF------D---------------------DFANGRI----- -----------------------------VSRGVPVKRVATD-KGEILCATG--------- ----FDIMMSQ-FGISRGL--------EGAFATSYDDEDAPYTPAWQERHTGIGRETAIRF -AREF------ATNAELTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWATVALALDWAKPPRLVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPKWAKGHAIDLEAKAVHNGWMPF-----TPHFN-RNPIEVAAEAERSG -AKN------VQDIETYVVDQVVS---------------KKLQMAIDDPDAAE-NWPRMWF -IWRGNAIQS---SAKGHEFFLRHYLGAHDNAIA-----EDRAKGKAQVVKYHETAPRGKY -DLVIDLNFRMNTTSLYSDIVLPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWEIFKLIGKKVSELAPLAFSKPVRDVVLQPLMHDTPDELAQPE-----ILDWSLG -ECKAVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGISAVGVQIPIKKQYDQMLDN -PIMPMPDPRHMRCVEWGGKRYPSLEDVLDACNTVLLCAPEANGEVCYQAFHNEEHH---- ------VGLPLVDLAEPNR----N-VAATFY-DLTRQPRRIITSPCWTGMVNDGRAYSAWC -MNVERLVPWRTLT------GRQSLYLDHQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- -----SR---------------------VDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRMLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RTRINPLFLAGGYAQ---------FTYGWNYW -GPTGILTRDTHVVVRKME-------KLEW------------------------------- ----- ->B_Nitrobacter_hamburgensis_YP_578186 ---------------------------------------------------------MTTG -LAAGQR--------TEETQMS--------------WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRIKYPYVRGPLLD---------MWREAKASS-ADPVQA -WGALVGDEQKRARMQKARGKGGYRRAKWEELVELIAAASLHTARKH----GPDRI-MGFS -PIPAMSMLS------FAAGTRFLSL----------------------------------- ----MGGSLLSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMASNLNMTRTPDVH -FIAEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYV----D -RQVPYFIDYVKRYTDLPFLVELEP-----NGTTYKTGRLLR---------ARHVPRY--K -DVENGDWKMLLLDANSGELRAPKGQVGDRW--------GSVHGKWNLSGED----TLDNS -PLDPVLSFIDRSDDVVQVGF------D---------------------DFANGRI----- -----------------------------VSRGVPVRRIATD-KGEILCATG--------- ----FDIMMSQ-FGISRGL--------EGAFATSYDDEDAPYTPAWQERHTGIGRETAIRF -AREF------ATTAEYTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWASIALALDWSKPPRVVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPRWAKGHAIDLEAKAVRSGWMPF-----TPHFN-RNPIEVAAEAERAG -AKS------TEDIATHVIDQVAS---------------KKLNLAIEDPDAAE-NWPRLWF -IWRGNAIQS---SAKGHEFFLRHYLGTHDNAIA-----EDRAKGKTHTVKYHDTAPRGKY -DLVVDLNFRMDTSSLYSDIVLPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWDIFKLIAKKVSELAPLAFSKPVRDVVLQPLMHDTPDELAQPE-----ILDWAEG -ECKPVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGVSAVGVNVPIKKQYDQMLDN -PIMPMPDPRHMRCVEWGGKRYPSLEDVLDGCNTVLLCAPEANGEVCYQAFHNEEHH---- ------VGLPLVDLAEPTR----N-VATTFY-DLTRQPRRLLTSPCWTGMMNDGRAYSAWC -MNVERLVPWRTLT------GRQTLYIDHQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- --------------------------SRVDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRMLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RTRINPLFLAGGYAQ---------FTYGWNYW -GPTGILTRDTHVVVRKME-------KLEW------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0000472_14 rank: A; doe:DENOEST_1434 s25dA; putative steroid C25 dehydrogenase-like alpha-subunit; K24713 (db=kegg) --------------------------------------MGQRSTWGVVSESRRRFLVKAGL -ASAAGA--------AINLNLFGCGRSHAPLQHFKGTTAGHFDLGPRTTPKLGNW-QDLYR -QRWTW------DKVVKGSHGWANCRSACEWDLYVKDGIVVREEQSATYEASE-----PGV -PDFNPRGCQKGACYTEVMYGPSRTTVPLKRVG---------------------------- -----------------PRGSGQWEKISWEQAIKEIAQKTVDAVTEF----GTDTVFQDLG -PNFDFGPST--------AGRFKFMYQAGSLFADM-------------------------- ---------WGEI---GDLNFGATMALGAAQIGGSSDEWFLSDFIVVWMMNPSVTQIPDAH -FLYEARYNGTELVVIDPQYSATAIHADQWLPIETG-TDAALGLAVARHLFEVNAI----D -------LPFVREQTDLPLLVRLDTGRFLRETDLNSG------------------GNA--- ----------------------------------------DQLYLWHPQKNAPVFAPGC-- --------TGNTTRKLTLDFE----------------------------APIDGQW----- -------------------------------------TIKLH-DGKEVAIAPVGAL----- ----LKEHLEP-WTFEHTA-----------------------------SVTHLHVDQVKKF -AEGW-----------AKCQRPMVLSSWGSNRFVHSD-LMNRSKILCLMLKGALGKKGT-G ----YQATGIVDMEGFNNAMQMDHEGVR--------------------------------- -------------------------------GRLGALLGIMPPADLFQAVLDIVMQRKTEG -DVAL-----ETEMNYL-----KHHLCSSDVMESNFKAPGYRAAVVKEHEGMLPRSLESYY -QEARQKDWS---QGLPRKAPVKVYFSGGANILRRSNMP-----------QYYKTFIWDEM -QCIVDINPKYSFTGTQSDYILPAAGW--YEKAGIKYTMSYVPYLH-----YCDVAVPPLG -ESKGEWEIFWLLTREMERYA---------------------------------------- ---KEKNLPVLDGCGRGSNDF--KTLHQRYSNQGELGQ----------------------- --------------------------------HDDEKVMKEILHGDATEGMTIEGLKQTGI -AKFTSAGKPVAADAINNP----D-WKGEGV-MTTLTRFTVHKEPWPTYS----------- --------------------GRITSFIDHPWFIEMREQFPIHKDSPKAGG----------- ---------------------------------------------------DYPFQFVSCH -ARWSIHSTWRDTPMMLRLQR---------------GEPLVYINPIDAERVGVKDFEYV-- ----------------EIFNNYGSVRMRVKVAAMVRPGVAYYYHAWE-------------- ---------------PHQFPNHQSFKWLIPGLVNPLYMAGGYGQ---------INHAMNRY -QPG-SAVQDTRIGIR------------PW---HGQATGAHPVKRPEAAATSK-------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001772_1 rank: C; doe:DENOEST_1434 s25dA; putative steroid C25 dehydrogenase-like alpha-subunit; K24713 (db=kegg) --------------------------------------MGNLIKTGIASASRRKFLVMAGA -ASAAGA---------ALSLFGCGRAPLQH--FKGTTASGRFDLGPRTAPKLGNW-QDLYR -QRWTW------DKVAKGSHGWANCRSACEWDLYVKDGVVVREEQSATYEASE-----PGI -PDFNPRGCQKGACYTEVMYGPSRTTVPLKRVG---------------------------- -----------------SRGSGKWEKISWEQAMKEIAQKTVDAAEKW----GTDTIYQDLG -PNFDFGAST--------AGRFKFQF----------------------------------- ---MAGGVFADNWAEIGDLNVGASITTGAAHLGGSSDEWFLSDFIIVWMMNPSVTQIPDAH -FLYEARYNGTELVVIDPQYSATAIHADQWLPLESG-TDAALGLAVARHLLETGAI----D -------LPYIREQTDLPLLARLDTGRFLRESEMVNG------------------GNA--- ----------------------------------------DQLYMWHPQKNAPVPAPGC-- --------LNNTTRNLKLDFE----------------------------PPIDGQW----- -------------------------------------KVKLA-DGKEVGVVPVGAM----- ----LKEHLDS-WTFEHAA-----------------------------KVTHLHIDQIKKF -AEGW-----------AKAQRPMVLSSWGSNRYVHSD-LMNRTKLLLLMLKGAMGKKGA-G ----------YQATGWV-------------------------------------------- ----------------------------------------------DLDGFGNAMQMEKSG -MT------------------------------------GRLAVMLNAM------------ ---------P--------------------------------------------------- ------------------------------------------P------------------ ------------------------------------------------------------- -----------------------KELFNA-------------------------------- --------------------------------VVDIIKKRKTEGDVALEG----------- ----------------ENN----Y-LRTK-------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------LCTSDVVEVNLKSDGY--- -----------------------RAALNKEQKGLYPHELDEYYKEAHD------------- -----------------------------KGWAP--------------------------- -----GLPRKAPPKIFF-------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_3 rank: A; ag:AFF61325 s25dA; steroid C-25 hydroxylase alpha subunit (EC:1.17.99.10); K24713 (db=kegg) -----------------------------------------------MSISRRHFIVGSAV -AVAGVG------------LYS--LRPKKP--VVYPVGVRAPKVAAR-KVHYNDY-SDIWR -EKWKW------DKVVKGTHTRANCCAACSWDVYVRDGIAWREEQAAIYEPHR-----PDV -PDFNPRGCQKGACYTQLQVSEARVKYPLKCVG---------------------------- -----------------ERGEGKWKRVSWDTALDEIADRLIDIAVRDGTESIIFDDTTNVG -YGPE-----------TAGDVRFAAA----------------------------------- ----IQATRLDSWSGVGDMPNGLIQTWGLYNCEGTSDDWYLSDYIVIWVGNPNYTRIPDAH -FLHEARYRGAKLVVVAPDLNPSTAHADLWINVNAE-TDSALALSCAQVMIAEKLY----K -------KDYVLQQTDFPFLVRKDDQRFLRAADMVKG--------------GAD------- ----------------------------------------NALYLWDEAKHAPVIAPGCEG --------DGDGGRIMALGGI------K---------------------PALSGTF----- -------------------------------------KVTTQ-DGKTVEVQTVFDM----- ----IRAKLDAEYTPEQAA-----------------------------KITGLHPNVIRTF -AREM-----------AAAPKAMIIASYGSCKHYHHD-LNQRSFVLLMNLTGNQGQQGG-G ----------YRISAW-----WAMDGLD--------------------------------- -------------------------------QMADSTVPLKDMLRIIPKAIRGLSPRDYEG -LFTEYSDKEGHTPALLFLY--LH---------------GGYKEMWDKPHLQDPALPRPF- ---ADYVQES---IDKGW-SKVHPPLGREPRAYI---FTGGNPLRRWPSPQIAKQHLWPKF -ELVVSVNFRMSTSSLFSDYVLPVAAY--YEKYGIKYAQTYVPYIIT----S-DKATEPLG -ESKSDWETFGLLSKHVAERARVRGVTMVRGL----------------------------- ----------------KDVLFDLSKAYEVHTHHG--------------------KYDP--- ----------------------------TDPEDPIKLMDAIFANSPSIGCNTGREALDMGA -VPVIGTGRPSLIDQNYSP----YDPKDTYW-PHKDFIDKKIAWPTLT------------- --------------------GRQQFYIDHPWFLEGKEHLPTFKPSIHANSKF--PLRMYG- -----------------------------------------------------------GH -NRWSIHAVWRDVKLLLRLQR---------------GQPACWLNPKEAEKRGIKDGDMV-- ----------------RVFNDHGTCECMVKVSAITAPGEVIIYHAW--------------- ----------EPYQFKKWQGNQEPVE---APW-KALHLAGGYAQ---------LHWRVYYH -GPN-HSPRGAPVEVEKIGYEGG-------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_4 rank: C; ag:AFF61325 s25dA; steroid C-25 hydroxylase alpha subunit (EC:1.17.99.10); K24713 (db=kegg) -----------------------------------------------MQISRRGFIVGSAV -AAAGVG--------LYSLKSK--KAVIKPGITLP-DKTPAKKIKYN------DY-SDIWR -EKWKW------DKVVKGTHTRANCCAACSWDVYVRDGIAWREEQNAIYEPPR-----PGI -PDQNPRGCQKGACYTALQLSESRVKYPLKRAG---------------------------- -----------------NRGEGKWKRISWDEALTEIADKLLDIAVAEGTETICFDDLSNTG -YGPETAGDFR-----FSTGMQVSRL----------------------------------- ----------DGWSGVGDMPLGVIQTWGAFNCEGTSDDWFRSDYIVIWLGNPSYTRIPDAH -FLHEARYRGAKLVVVAPDLNATTVHADMWLNVKPE-TDAALGLACAQIMISENLY----K -------KDYVLEQTDFPFLVRKDNQRFLRVSDVVKG--------------GAD------- ----------------------------------------NAFYLWDEAKNAIAMAPGCEG --------DGDGGRSLKLGAL------K---------------------PALSGTR----- -------------------------------------SVKLA-DGSTVECITVFDM----- ----IKERLDKEHTPEQAA-----------------------------KITGLHPNVIRTF -AREM-----------AAAPSAMIIASYGACKHYHSD-LFQRSFILLMNLTGNQGKPGG-G -MRVAAWWGMDGLDAMA----DSTIPMA--------------------------------- -----------------------------------------DMMKIIPKAVRGLTPRDYES -LYTDYSNREGHTPTMVFLY--VH---------------GGYKELWDKPYLQDPNLPRNI- ---SSYMRES---IDKGW-TKVHPPENKSPKAYI---FTGGNPLRRWPSPQIAREKLWPKF -DLVCSVTFKMSTSTLWADYVLPVAAY--YEKYGIKYAQSYVPYIIS----S-DKATEPLG -ESKSDWETFGLMAKKVAERAKARNITMVRGL----------------------------- ----------------DDKPFDVSKVYDFYTGNG--------------------KYDP--- ----------------------------TDPEDPVRLMDEIFAGSPNVACNSAREALQRGA -VPVTGPGRPSLINQNYSD----YDGKDTYW-PHRDFIEKKVAWPTIT------------- --------------------GRQQFYIDHPWFIEGKEALPTHKAPPLATSKF--PLRMYG- -----------------------------------------------------------GH -NRWSIHSIWRDVKLLLRLQR---------------GQPAAWMNPAELQKRGLKDGDMV-- ----------------RVYNDHATFECNIKSSPATAPGEIIVYHAWEPFQFK--------- -----------------KWQSNQEVT---EAPVKGLHLAGGYTQ---------LHFRVYYG -SMH-HTPRGAAVEVEKAPT----------------------------------------- ----- ->NASQAN2015_111_B_bin.76_k121_226837_116 rank: A; sdf:ACG33_10685 putative steroid C25 dehydrogenase (S25dA4); K24713 (db=kegg) -----------------------------------------------MSVSRRQFLAHSAL -AGAALA-----------------LQHGDA------LADALTR-PYR------RI-EDIWR -KKWTW------DRVAHGTHG-TNCAGTCAFNVYIRNGVVWREEQQAEYERSGT----PDV -PDYGPRGCNKGLRHARYMYGKQRVLYPMKRVG---------------------------- -----------------KRGEGKWQRISWDQATREIAEKFIEVAVKH----GPDSITLGSG -TQLAVKMAS------YSALARFSNI----------------------------------- ----TGVTVPEFYSGVGDLPTGFYMTTGLTYLGDTMAAVFKSKCVLVWMANPAVTRIPDAH -FFWEAKYNGTEVVTISPEFTPTAMHSSKWLNIKPG-TDTALAMAMVHTIIEEKLY----D -------AAYIREQTDLPFLVREDNGEFLRAEDLN----------------LVDMLAV--- ---------------------------RENV-----------FYLWDQKTRRIVRAPGTGA -AEAPVGRRRRKFETIALGNI------E---------------------PALEGRW----- -------------------------------------TVETR-TGK-VTVTTVFAL----- ----LRKRATE-HSPEKMS-----------------------------TETGLNPKAMRTV -AREF----------AKAGQRAMIYAGFSACKWLHGD-ILQRSMVLLCALTGATGHEGG-G ---VQMANGPKSRGITS--FAFAGVGAA--------------------------------- ------------------------SRVVASTLWDYD-----HGKMKQLNEKIYGKKLA--- ----------DEFDSHY-----QH------------------------------SLEEDWF -------PQY---GKNGWKMGIFAGENGANWRAS--------------GNRWRTEAF-EKL -EMIVALVPDAGITMHHADIVLPIAHH--YERADIMLQSRH-PYVQV----L-DTAVKPLG -EAVDDFEALRRVSAAISTIAREKATPAIKDD----------------------------- ----------------VDGRTFRRDLKRT-----------------------LELYTM--- ---------------------------DGAIRDSRDIVQFIINATPGIPKMSFAELAAKGI -VRVDESRDSTVW----------NSDESPFHADIAESVHEKR--PYETLT----------- --------------------GRQQFYIDHEWFLKFDEALPVYHPPLKQQGYP--LQMTMG- ------------------------------------------------------------H -ARHGIHSMWRDDSFLVSLQR---------------GEPDIYVNPDDAAARKVRDGDLI-- ----------------EVFNDAGSFVCMAHLSAGIMPGTLYMYHGWD-------------- -------------PTMFRGRQNFAAVIPTAGLVKPTSVAGDYGH---------LGYRVLAY -APN-QTYRDFTCEFKLYS-------RGKV---TAAKARIA-------------------- ----- ->icacos_2019_sw_WHONDRS-S19S_0094_F_bin.26_scaffold_99_5 rank: A; sdf:ACG33_10685 putative steroid C25 dehydrogenase (S25dA4); K24713 (db=kegg) -----------------------------------------------MSVNRRQFLAHSAL -AGAALA-----------------LQHGDA------LADALTR-PYR------RI-EDVWR -KKWTW------DRVAHGTHG-TNCAGTCAFNVYIRNGVVWREEQQAEYERSGT----PDV -PDYGPRGCNKGLRHARYMYGKQRVLYPMKRVG---------------------------- -----------------KRGEGKWQRISWDQATREIAEKFIEVAVKH----GPDSITLGSG -TQLAVKMAS------YSALARFSNI----------------------------------- ----TGVTVPEFYSGVGDLPTGFYMTTGLTYLGDTMAAVFKSKCVLVWMANPAVTRIPDAH -FFWEAKYNGTEVVTISPEFTPTAMHSSKWLNIKPG-TDTALAMAMVNTIIEEKLY----D -------AAYIREQTDLPFLVREDNGEFLRAEDLN----------------LVDMLAV--- ---------------------------RENV-----------FYLWDQKTRRIVQAPGTGA -AEAPVGRRRRKFETIALGNI------E---------------------PALEGRW----- -------------------------------------NVETR-TGK-VTVTTVFAL----- ----LKKRAAE-HSPEKMS-----------------------------AETGLNPNAMRTV -AREF----------AKAGKRAMIYAGFSACKWLHGD-ILQRAMVLLCALTGATGHEGG-G ---VQMANGPKSRGITS--FAFAGVGAA--------------------------------- ------------------------SRVVASTLWDYD-----HGKMKQLNEKIYGKKLA--- ----------DEFDSHY-----QH------------------------------SLKEDWF -------PQY---GKNGWKMGIFAGENGANWRAS--------------GNRWRTEAF-EKL -EMIVALVPDAGITMHHADIVLPIAHH--YERADIMLQSRH-PYVQV----L-DQAVKPLG -EAVDDFEALRRVSAAISAIAREKGTPAIKDD----------------------------- ----------------VDGRTFRRDLKRT-----------------------LELYTM--- ---------------------------DGAIRDSRDIVQFIINATPGIPKMSFAELAAKGI -VRVDESRGSTVW----------NSDESPFHADIAESVHEKR--PYETLT----------- --------------------GRQQFYIDHEWFLKFDEALPVYHPPLKQKGYP--LQMTMG- ------------------------------------------------------------H -ARHGIHSMWRDDSFLVSLQR---------------GEPDIYVNPDDAAARKVRDGDLI-- ----------------EVFNDGGSFICMAHLSAGIMPGTLYMYHGWD-------------- -------------PTMFRGRQNFAAVIPTAGLVKPTSVAGDYGH---------LGYRVLAY -APN-QTYRDFTCEFKLHS-------RGKV---------------------------TAAK -VRIA ->NASQAN2014_190_B_bin.96_k121_3766_2 rank: A; sdf:ACG33_10685 putative steroid C25 dehydrogenase (S25dA4); K24713 (db=kegg) -----------------------------------------------MSVNRRQFLTHSAL -AAGAAL--------ALHHGAA--------------MADALSR-PYR------RI-EDVWR -KKWTW------DRVAHGTHG-TNCAGTCAFNVYIRNGVVWREEQQAEYERSGT----PDV -PDYGPRGCNKGLRHARYMYGKQRVLYPMKRVG---------------------------- -----------------KRGEGKWQRISWDQATREIAEKFIDVAVKH----GPDSITLGSG -TQLAVKMAS------YSALARFSNI----------------------------------- ----TGVTVPEFYSGVGDLPTGFYMTTGLTYLGDTMAAVFKSKCVLVWMANPAVTRIPDAH -FFWEAKYNGTEVVTISPEFTPTAMHSSKWLNIKPG-TDTALAMAMVHTIIDEKLY----D -------AAYIREQTDLPFLVREDNGEFLRAEDLN----------------LVDMLAV--- ---------------------------RENV-----------FYLWDQKTRRMVQAPGTGA -AEAPVGRRRRKFETIALGNI------E---------------------PALEGRW----- -------------------------------------TVQTR-TGK-VAVTTVFAL----- ----LKKRAAE-HSPEKMS-----------------------------DETGLNPNAMRTV -AREF----------AKAGKQAMIYAGFSACKWLHGD-ILQRAMVLLCALTGATGHEGG-G ---VQMANGPKSRGITS--FAFAGVGAA--------------------------------- ------------------------SRVVASTLWDYD-----HGKMKQLNEKIYGKKLA--- ----------DEFDSHY-----QH------------------------------SLKEDWF -------PQY---GKNGWKMGIFAGENGANWRAS--------------GNRWRTEAF-EKL -EMIVALVPDAGITMHHADIVLPIAHH--YERADIMLQSRH-PYVQV----L-DRAVKPLG -EAVDDFEALRRVSAAISAIAREKGTPAIKDD----------------------------- ----------------VDGRTFRRDLKRT-----------------------LELYTM--- ---------------------------DGAIKDSRDIVQFIINATPGIPKMSFAELAAKGI -VRVDESRGSTVW----------NSDESPFHADIAESVHEKR--PYETLT----------- --------------------GRQQFYIDHEWFLKFDEALPIYHPPLKQKGYP--LQMTMG- ------------------------------------------------------------H -ARHGIHSMWRDDSFLVSLQR---------------GEPDIYVNPDDATARNVRDGDLI-- ----------------EVFNDGGSFICMAHVSAGIMPGTVYMYHGWD-------------- -------------PTMFRGRQNFAAVIPTAGLVKPTSVAGDYGH---------LGYRVLAY -APN-QTYRDFTCNFKLHS-------RGKV---------------------------TAAK -VRIA ->greatmiami_2019_sw_WHONDRS-S19S_0099_F_bin.30_scaffold_496_3 rank: A; sdf:ACG33_10685 putative steroid C25 dehydrogenase (S25dA4); K24713 (db=kegg) -----------------------------------------------MSVNRRQFLAHTAL -ASAALA--------LQHGAAM--ADALTR--------------PYR------RI-EDVWR -KKWTW------DRVAHGTHG-TNCAGTCAFNVYIRNGVVWREEQQAEYERSGT----PDV -PDYGPRGCNKGLRHARYMYGKQRVLYPMKRVG---------------------------- -----------------KRGEGKWQRISWDQATREIAEKFIDVAVKH----GPDSITLGSG -TQLAVKMAS------YSALARFSNI----------------------------------- ----TGVTVPEFYSGVGDLPTGFYMTTGLTYLGDTMAAVYKSKCVLVWMANPAVTRIPDAH -FFWEAKYNGTEVVTISPEFTPTAMHSSKWLNIKPG-TDTALAMAMVHTIIEEKLY----D -------AAYIREQTDLPFLVREDNGEFLRAEDLN----------------LVDMLAV--- ---------------------------RENV-----------FYLWDQKTRRMVQAPGTGA -AEAPVGRRRRKFETIALGDI------E---------------------PALEGRW----- -------------------------------------TVQTR-TGK-VTVTTVFAL----- ----LKKRAAD-HSPENMS-----------------------------AETGLNPNAMRTV -AREF----------AKAGKQAMIYAGFSACKWLHGD-ILQRAMVLLCALTGATGHEGG-G ---VQMANGPKSRGITS--FAFAGVGAA--------------------------------- ------------------------SRIVASTLWDYD-----HGKMKQLNEKIYGKKLA--- ----------DEFDSHY-----QH------------------------------SLKEDWF -------PQY---GKNGWKMGIFAGENGANWRASGN--------------RWRTEAF-EKL -EMIVALVPDAGITMHHADIVLPIAHH--YERADIMLQSRH-PYVQV----L-DRAVKPLG -EAVDDFEALRRVSAAISAIAREKGTAAIKDD----------------------------- ----------------VDGRTFRRDLKRT-----------------------LELYTM--- ---------------------------DGAIKDSRDIVQFIINATPGIPKMSFAELAAKGI -VRVDESRGSTVWNSDESP----FHADIA------ESVHEKR--PYETLT----------- --------------------GRQQFYIDHEWFLKFDEALPVYHPPLKQKGYP--LQMTMG- ------------------------------------------------------------H -ARHGIHSMWRDDSFLVSLQR---------------GEPDIYVNPDDAAARNVRDGDLI-- ----------------EVFNDGGSFICMAHLSAGIMPGTLYMYHGWD-------------- -------------PTMFRGRQNFAAVIPTAGLVKPTSVAGDYGH---------LGYRVLAY -APN-QTYRDFTCNFKLHS-------RGKV---TAAKVRIA-------------------- ----- ->providencecreek_2019_sw_WHONDRS-S19S_0007_B_bin.10_k121_1581149_4 rank: A; shal:SHALO_2978 molybdopterin oxidoreductase, alpha subunit (db=kegg) ----------------------------------------------MANSSRRNFLKASG- ---------------FSAAMLAGQGTLFAKTDVIK-VENAKDSYPNA------SFTETNYR -DEFKFTYGEKAEHGYAYHCV--NCQGNCAWEVWGNNGIVTRENQSAKYPAF------GHN -PDFNPRGCNKGVQHSQVMYEKDRILYPMKRIG---------------------------- -----------------ERGKGKWKRISWDEAATEVAQKLYTTM-------------IDPK -KGPAAITVH------AGTGLLTEGRRPSVLRFGT-------------------------- ---QLGASRIYPASYLGDMFTGAAIAYGEGNMGCTYDFMFNVSTSIMWGANPSATRIPDAH -FVWEGKYNGSKIIVITPEYNATAARAHLWVPIKPG-TDSFLAMSIINEMLAKKLY----- ------LPQAVKTYTDLPFLVDAKTKRFIRRSDAEHA------------------------ ---------------HDEKTHHLYE---------------DEFYCWNLKSGKPELMPGTEG -SERKTIMLKDKGWDI-----------D---------------------PALEGEW----- -------------------------------------EMTLQ-GGKKVKVTTVFEL----- ----LKKEASK-YSAKDTQ-----------------------------KITGVHLDVVTEL -ATHI-----------AKDKCVEITTGFSLNKYFNGV----LSIWNIATICGLTGRFGPRG ------------------------------------------------------------- -------------------------------GLNTE------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------NEFQLSG------------------------------------------------ ------LEALSGFAGKYS------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------PRFA-------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------SGFLSEFM------------------------------------------- ------------------------------------------------------------- ----- ->muddycreek_2019_sw_WHONDRS-S19S_0082_B_bin.95_k121_853774_5 rank: A; pmx:PERMA_0657 dimethylsulfide dehydrogenase subunit alpha (Dimethylsulfide dehydrogenase molybdenum subunit) (DMS DH alphasubunit) (DMS DH molybdenum subunit) (db=kegg) -----------------------------------------------MKLTRRTVLQGIAG -ASAATVVGGQD---ALGEAGAPAAKTGKD--VPVIIDDPREHYPNT-----RPV-EDMYR -SEFADTFGDPDDHGTAFHCV--NCQGNCAWQVWIKDGKVTRENQSAAYPAIR-----EDI -PDSNPRGCNKGVQHSQVMYEADRIRYPMKRVG---------------------------- -----------------ERGGGKWERISWDEAIDTIAQKLYRTM-------------VERG -PQGNYVH--------VGAGLLSEARGASIKRMGA-------------------------- ---LLGAVRPYIASYVGDMFPGVSLVYGEGNIGCSYDFMYGTNVQVYWGCNPNTSRIPDAH -YVWEGKYNGSKVIVISPEFNSTAIHADRWIPIKPG-FDGHLAMSLMHELVDKQLY----D -------AELVRKFTDLPMLIREDSGAMLRLSDIDPARAAAEGALAFDAELAEKFGKKAHG -KKDHAEDVFLAVNEVGGKLTAMPGGEGSAL---------GTLR----------------- --------LQDVGWKIT--------------------------------PALSGNW----- -------------------------------------TVTLR-DGKTVRVHTVFDA----- ----LRKELEA-FTPEKTH-----------------------------KLTGVHPTLVRDL -ARDI-----------ALPEVVSVTMGFALGKHFNGM-LTQRAIASLMALTCRMGPRGGLN --TENEWSISGLGGLSGFDGAFKHRFAS--------------------------------- -------------------------------GAVSEH----QLGDGAATSKKAYTDDEIRE -ATG------QDAASYR----------------------AEIAALLEKS-----KNDRGVD -PAKGRFGKPWWDTVETFFIVADARFRRNKSGYR--------------------EAFLDKA -KFFAVADMKMGETARFADIVLPSASH--YEVWDLRVNPGYHRFANIA---QPPKGLEPVG -EAKSEWHIATMLVTRMQEIA---------------------------------------- --------------------L--AEYAR--------------------------------- --------------------------------TKNIGVMHIPDPTHTRDGIRPLDKF---- -------------VELFTD----H------------------------------------- --------------------GKLGT---DKQAVEFALGHV--------------------- ------------------------------------------------------------- -------DQFRGEDLESCYDR----------------GGFLVVNDKGGKT----------- -------------------------------SPLYP------------------------- ------------------------------------------------------------- -----DKPYSTF----------------------------------ENHF----------- ----- ->icacos_2019_sw_WHONDRS-S19S_0094_B_bin.166_k121_1114214_14 rank: A; pmx:PERMA_0657 dimethylsulfide dehydrogenase subunit alpha (Dimethylsulfide dehydrogenase molybdenum subunit) (DMS DH alphasubunit) (DMS DH molybdenum subunit) (db=kegg) -----------------------------------------------MSISRRDALRNLLF -GTVAAG--------VAAKVPTAEAKEFSDPQPVR-VDDPRKSYPDT------QTTEDFYR -AEFQAVRGNPDERGFAYHC--VNCQGNCAFEVWTENGKVTRENQSASYPQLA-----PNL -PDANPRGCNKGSQHSQVMYEADRLLYPMKRAG---------------------------- -----------------ERGSGKWKRISWDEAITEIAENL------------HRGL-VEKG -PSSNYVH--------IGAGVLTEARAASIKRLGSL------------------------- ----IGAVRPYIASYVGDMFPGVTVVYGEGNIGCTYDFVFTTNVAVFWGCNPNTSRIPDAH -YLWEGKYNGSKIIVITPEFNSTAIHADLWVPLKAG-YDGHLALSIIHRIIQRKLF----R -------PEFLKEYTDLPFLVRKDTKELVRLSDVALD--------------AKGFDGA--- ----------------SARLFGEHPH--------------ECFLAFNTKNRKFTAMPGTEG -SGVETLRLQDMDWDI-----------D---------------------PALNGSW----- -------------------------------------KLTLK-DGKQVQVTTAFEL----- ----FKKEVAA-FAPEKVQ-----------------------------KLTGVHPSIVDEL -ATDL-----------TKAKVSLVTMGFAVGKHFNGM-LSQRAIASLTAFCGKLGPEGGLN --TENEWNISGLEGLSGFQGKYQHRFAS--------------------------------- -------------------------------GFVSE-----FMLGEGLEDADALYSDEDMR -RGT------GDSKAEY-----KA---------------KVQALLEQGKNDERYKEGKPYW -T-----------TVENFLLFADSRFRRNKGNYQ--------------------KAFLEKA -KFIAYGDVRANDMAIYADILLPCKTP--YECWDLRTNPGYHRYANIA---YPPPNLKPVG -ESKSEWEIATLVVEKLEALAKQKAAAT--------------------------------- ----------------GEDRY---------------------------------VVIP--- --------------------------------DKTHTQEGVRRLDELVREFTKDGTL-RTD -KDAVEYALEHVDQFKPNDTKSLY-ERGGFL-QLNEKAGKSS--PLYADK-----PYNTFE -NQLFLHQRFDTLT------GRLTFYVDHPLWIAANAHVPTAKQPIRPARHP--------- ------------------------------------------------------FVLMTPH -ARWSIHSTYKTSPILLRLQR---------------GKPCVMINPEIARARGIQDGDTI-- ----------------KMFNELGEVRVMAKLSPACPPDALVMEHGWE-------------- ---------------PFMYDGKKGHNLIIGDMLNLLELTDGWGH-------LKFGTNWDGN -----QHAYESTMDIAKA------------------------------------------- ----- ->riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.130_k121_990031_60 rank: A; sul:SYO3AOP1_1175 molydopterin dinucleotide-binding region (db=kegg) -----------------------------------------------MTVSRRDLLKAAAL -GSVAIGSNTLAKNAFTEPIPQKEAKDI----PVI-VEDPRASYLNTK-----SI-EDMYR -REFAETFGEKKDHGYAYHCV--NCQGNCAWQVWTKDGKVTRENQSASYPQIA-----PNI -PDYNPRGCNKGVQHSQIMYEQDRLLYPMKRVG---------------------------- -----------------PRGEGKWKRISWDEAITEVSENLYNTMQE---K----------- --GPAGNYIH------IGAGVLTEGRAASVKRLGT-------------------------- ---LLGAVRPYIASYVGDMFPGVSTVYGEGNIGCTYDFIFKTNVAIFWGCNPNTSRIPDAH -FLWEGKYNGSKIVVISPEYNSTAIHADLWVPIKPG-YDGHLAMAVLNEIVFKKMY----N -------ESFVKEFTDLPLLVRKDNKELVRFAEIDTKDSNFD---------SKSSEKL--- --------------LKKILKRELKEHEVF--------------LAWNQKTNKMTVLPGSEG -SPVETLRLKDRGWNI-----------N---------------------PALSGTW----- -------------------------------------KIKLK-DGHTVEVTTVFDL----- ----FKQELKK-FDPLRMH-----------------------------AVTGVHPTIVSEL -ARDM-----------IVPKNTLVTMGFSLGKYFNGM-LIQRAISALTAISGRLGESGGLN -T-ENEWNITGLSGLSGFEGKYQHRFAS--------------------------------- -------------------------------GFVSE-----YMLGDNLNDYDHLYAEAEIK -EST------GLGKKQY-----RE---------------KIEKIVKDG------ANDEGFK -NGKPYWTTM---ETFLLFADAR--FRRNKGSYK--------------------EAFLKKA -KFIAYGDYRMSDFCNYADILLPCKSH--YEVWDIRTNPG---YHRFANIAYPPANLKNVG -EAKSEWEISTLIAEKIQDIA------------------LKKYKS--------------SG -DKKAIHVPDTTHTQTGFRAL--DEVVNEFTIGG---------------------KVR--- --------------------------------SDKDAVEYMLEHVDQFKPNSTKTMY-ERG -GFLVLNDKAGKSSPLYSN----K-PYNT------FESNKLLYQPFETLT----------- --------------------GRLTFYVDHHLWIETGAHIPTARNPIRPKK----------- ----------------------------------------------------FPFVLMTPH -ARWSIHSTYKTSKILQRLQR---------------GKPYIMINPKVAEAKGIKDGDEV-- ----------------KMFNDLGETFLMAKITPSAPEHSLVMEHGWEPFMYKNKVGH---- ----------------------NALV---GDMINLLELSDGWGH-------LKFGTNWDGN -----QHAYETTVDIVKA------------------------------------------- ----- diff --git a/bin/adjectives.py b/bin/adjectives.py index ed408e96..f829d57a 100755 --- a/bin/adjectives.py +++ b/bin/adjectives.py @@ -1,19 +1,25 @@ #!/usr/bin/env python """Contains main entry point to the program and helper functions""" + import os import ast import click import polars as pl +from pathlib import Path from rule_parser.src.rules import evaluate_rules_on_anno from utils.excel import write_summarized_genomes_to_xlsx +from utils.logger import get_logger -class PythonLiteralOption(click.Option): +logger = get_logger(filename=Path(__file__).stem) + +class PythonLiteralOption(click.Option): def type_cast_value(self, ctx, value): try: return ast.literal_eval(value) - except: + except Exception as e: + logger.error(e) raise click.BadParameter(value) @@ -24,10 +30,9 @@ def get_assets_path(local_path): :param local_path: :returns: """ - abs_snake_path = os.path.join(os.path.dirname( - os.path.abspath(__file__)), - "assets", - local_path) + abs_snake_path = os.path.join( + os.path.dirname(os.path.abspath(__file__)), "assets", local_path + ) return abs_snake_path @@ -55,11 +60,25 @@ def get_assets_path(local_path): @click.command() -@click.option('--annotations', type=click.Path(exists=True), required=True, help="One of only 2 required files. Path to a DRAM annotations file.") -@click.option('-o', '--output', type=click.Path(), default='traits.xlsx', help="Path for the output table. A true false table created by this script.") -@click.option('--rules_tsv', type=click.Path(exists=True), - default=get_assets_path('traits_rules.tsv'), - help="This is an optional path to a rules file with strict formatting. It will over write the original rules file that is stored with the script.") +@click.option( + "--annotations", + type=click.Path(exists=True), + required=True, + help="One of only 2 required files. Path to a DRAM annotations file.", +) +@click.option( + "-o", + "--output", + type=click.Path(), + default="traits.xlsx", + help="Path for the output table. A true false table created by this script.", +) +@click.option( + "--rules_tsv", + type=click.Path(exists=True), + default=get_assets_path("traits_rules.tsv"), + help="This is an optional path to a rules file with strict formatting. It will over write the original rules file that is stored with the script.", +) # @click.option('-a', '--adjectives_list', default="", callback=validate_comma_separated, help="A comma seperated list of adjectives ('adj1,adj2,adj3'), by name, to evaluate. This limits the number of adjectives that are evaluated and is faster.") # @click.option('-p', '--plot_adjectives', multiple=True, default=[], help="A list of adjectives, by name, to plot. This limits the number of adjectives that are plotted and is probably needed for speed.") # @click.option('-g', '--plot_genomes', multiple=True, @@ -85,13 +104,15 @@ def get_assets_path(local_path): # " available, you can pass these names to limit the" # " adjectives that are evaluated") # @click.argument('-p', type=click.Path(exists=True)) -def evaluate(annotations:str, output:str, - rules_tsv:str=get_assets_path('traits_rules.tsv'), - # adjectives_list:list=None, plot_adjectives:list=None, - # plot_genomes:list=None,plot_path:str=None, - # debug_ids_by_fasta_to_tsv:str=None, - # strainer_tsv:str=None, strainer_type='pgtb' - ): +def evaluate( + annotations: str, + output: str, + rules_tsv: str = get_assets_path("traits_rules.tsv"), + # adjectives_list:list=None, plot_adjectives:list=None, + # plot_genomes:list=None,plot_path:str=None, + # debug_ids_by_fasta_to_tsv:str=None, + # strainer_tsv:str=None, strainer_type='pgtb' +): """Using a DRAM annotations file make a table of adjectives.""" rules = pl.read_csv(rules_tsv, separator="\t") @@ -99,34 +120,33 @@ def evaluate(annotations:str, output:str, sample_col = "input_fasta" group_by_col = "topic_ecosystem" if group_by_col not in rules.columns: - rules = rules.with_columns( - pl.lit("traits").alias(group_by_col) - ) + rules = rules.with_columns(pl.lit("traits").alias(group_by_col)) for name, data in rules.group_by(group_by_col): dfs[name[0]] = evaluate_rules_on_anno( rules=data.lazy(), annotations_path=annotations, sample_col=sample_col, parent_col="alias", - rules_col="rule" + rules_col="rule", ) write_summarized_genomes_to_xlsx( df=None, output_file=output, group_by=group_by_col, sort_order_columns=sample_col, - extra_frames=dfs + extra_frames=dfs, ) + # Maybe someday we will add all of this back in? - # if plot_path is not None: - # rules.plot_cause(plot_path, adjectives=plot_adjectives, - # genomes=plot_genomes, show_steps=False - # ) - # if strainer_tsv is not None: - # strainer_data = get_positive_genes(rules, annotations, adjectives) - # strainer_data.to_csv(strainer_tsv, sep='\t') +# if plot_path is not None: +# rules.plot_cause(plot_path, adjectives=plot_adjectives, +# genomes=plot_genomes, show_steps=False +# ) +# if strainer_tsv is not None: +# strainer_data = get_positive_genes(rules, annotations, adjectives) +# strainer_data.to_csv(strainer_tsv, sep='\t') # @click.command() @@ -159,4 +179,4 @@ def evaluate(annotations:str, output:str, # rules.plot_rule(plot_path) if __name__ == "__main__": - evaluate() \ No newline at end of file + evaluate() diff --git a/bin/assets/forms/amg_database.20220928.tsv b/bin/assets/forms/amg_database.20220928.tsv old mode 100755 new mode 100644 index 42b93eae..36bf891e --- a/bin/assets/forms/amg_database.20220928.tsv +++ b/bin/assets/forms/amg_database.20220928.tsv @@ -277,4 +277,4 @@ K01599 EC:4.1.1.37 PF01208 Uroporphyrinogen decarboxylase (URO-D) Roux et al. PF13385 Concanavalin A-like lectin; extracellular arabinase Emerson et al. 2018 FALSE K01779 EC:5.1.1.13 racD; aspartate Racmase Trubl et al. 2018 FALSE PF01786 Plastoquinol terminal oxidase (PTOX) Sullivan et al. 2010; Ignacio?Espinoza et al. 2012; Roux et al. 2016 FALSE - PF01077; PF03460 rdsrA; reverse-acting dissimilatory sulfite reductase (alpha subunit) Anantharaman et al. 2014 FALSE \ No newline at end of file + PF01077; PF03460 rdsrA; reverse-acting dissimilatory sulfite reductase (alpha subunit) Anantharaman et al. 2014 FALSE diff --git a/bin/assets/forms/db_description_builder.py b/bin/assets/forms/db_description_builder.py deleted file mode 100755 index c9b4d7d9..00000000 --- a/bin/assets/forms/db_description_builder.py +++ /dev/null @@ -1,964 +0,0 @@ -""" -*DRAM v1/early v2 DB description builder script* - -Contains most of the backend for the DRAM_setup.py script, used to setup databases for each user. -""" -from os import path, mkdir -from datetime import datetime -from shutil import move, rmtree, copyfile -from glob import glob -import gzip -from collections import defaultdict -import logging -import tarfile - -from skbio import read as read_sequence -from skbio import write as write_sequence - -from dram2.utils.database_handler import DatabaseHandler -from db_utils import ( - run_process, - download_file, - merge_files, - remove_prefix, - setup_logger, -) - -NUMBER_OF_VIRAL_FILES = 2 - - -DEFAULT_DBCAN_RELEASE = "10" -DEFAULT_DBCAN_DATE = "07292021" -DEFAULT_UNIREF_VERSION = "90" -DEFAULT_VOGDB_VERSION = "latest" -DFLT_OUTPUT_DIR = "." -LOGGER = logging.getLogger("database_processing.log") -DEFAULT_MMMSPRO_DB_NAME = "db" - -from dram2.camper_kit import download as download_camper_tar_gz -from dram2.camper_kit import process as process_camper_tar_gz -from dram2.camper_kit import DOWNLOAD_OPTIONS as CAMPER_DOWNLOAD_OPTIONS -from dram2.camper_kit import PROCESS_OPTIONS as CAMPER_PROCESS_OPTIONS -from dram2.camper_kit import DRAM_SETTINGS as CAMPER_DRAM_SETTINGS -from dram2.fegenie_kit import download as download_fegenie_tar_gz -from dram2.fegenie_kit import process as process_fegenie_tar_gz -from dram2.fegenie_kit import DOWNLOAD_OPTIONS as FEGENIE_DOWNLOAD_OPTIONS -from dram2.fegenie_kit import PROCESS_OPTIONS as FEGENIE_PROCESS_OPTIONS -from dram2.fegenie_kit import DRAM_SETTINGS as FEGENIE_DRAM_SETTINGS -from dram2.sulphur_kit import download as download_sulphur_tar_gz -from dram2.sulphur_kit import process as process_sulphur_tar_gz -from dram2.sulphur_kit import DOWNLOAD_OPTIONS as SULPHUR_DOWNLOAD_OPTIONS -from dram2.sulphur_kit import PROCESS_OPTIONS as SULPHUR_PROCESS_OPTIONS -from dram2.sulphur_kit import DRAM_SETTINGS as SULPHUR_DRAM_SETTINGS - -KEGG_CITATION = "Kanehisa, M., Furumichi, M., Sato, Y., Ishiguro-Watanabe, M., and Tanabe, M.; KEGG: integrating viruses and cellular organisms. Nucleic Acids Res. 49, D545-D551 (2021)." -GENE_KO_LINK_CITATION = "" -KOFAM_CITATION = "" -UNIREF_CITATION = "" -PFAM_CITATION = "" -DBCAN_CITATION = "" -VOGDB_CITATION = "" -VIRAL_REFSEQ_CITATION = "" -PEPTIDASE_CITATION = "" -DRAM_CITATION = "" -# TODO: check if dbcan or pfam is down, raise appropriate error -# TODO: upgrade to pigz? - - -def get_iso_date(): - return datetime.today().strftime("%Y%m%d") - - -def download_pfam_hmm(output_dir=".", logger=LOGGER, verbose=True): - pfam_hmm = path.join(output_dir, "Pfam-A.hmm.dat.gz") - link_path = ( - "ftp://ftp.ebi.ac.uk/pub/databases/Pfam/current_release/Pfam-A.hmm.dat.gz" - ) - logger.debug(f"Downloading Pfam from: {link_path}") - download_file(link_path, logger, pfam_hmm, verbose=verbose) - return pfam_hmm - - -def download_dbcan( - output_dir=".", - logger=LOGGER, - dbcan_hmm=None, - version=DEFAULT_DBCAN_RELEASE, - verbose=True, -): - dbcan_hmm = path.join(output_dir, f"dbCAN-HMMdb-V{version}.txt") - if int(version) < int(DEFAULT_DBCAN_RELEASE): - link_path = ( - f"http://bcb.unl.edu/dbCAN2/download/Databases/dbCAN-HMMdb-V{version}.txt" - ) - else: - link_path = f"http://bcb.unl.edu/dbCAN2/download/dbCAN-HMMdb-V{version}.txt" - - logger.debug(f"Downloading dbCAN from: {link_path}") - download_file(link_path, logger, dbcan_hmm, verbose=verbose) - return dbcan_hmm - - -def download_dbcan_fam_activities( - output_dir=".", - logger=LOGGER, - version=DEFAULT_DBCAN_RELEASE, - upload_date=DEFAULT_DBCAN_DATE, - verbose=True, -): - dbcan_fam_activities = path.join( - output_dir, f"CAZyDB.{upload_date}.fam-activities.txt" - ) - link_path = f"https://bcb.unl.edu/dbCAN2/download/Databases/V{version}/CAZyDB.{upload_date}.fam-activities.txt" - logger.info(f"Downloading dbCAN family activities from : {link_path}") - download_file(link_path, logger, dbcan_fam_activities, verbose=verbose) - return dbcan_fam_activities - - -def download_dbcan_subfam_ec( - output_dir=".", - logger=LOGGER, - version=DEFAULT_DBCAN_RELEASE, - upload_date=DEFAULT_DBCAN_DATE, - verbose=True, -): - dbcan_subfam_ec = path.join(output_dir, f"CAZyDB.{upload_date}.fam.subfam.ec.txt") - link_path = ( - f"https://bcb.unl.edu/dbCAN2/download/Databases/" - f"V{version}/CAZyDB.{upload_date}.fam.subfam.ec.txt" - ) - logger.info(f"Downloading dbCAN sub-family encumber from : {link_path}") - download_file(link_path, logger, dbcan_subfam_ec, verbose=verbose) - return dbcan_subfam_ec - - -def download_kofam_hmm(output_dir=".", logger=LOGGER, verbose=False): - kofam_profile_tar_gz = path.join(output_dir, "kofam_profiles.tar.gz") - download_file( - "ftp://ftp.genome.jp/pub/db/kofam/profiles.tar.gz", - logger, - kofam_profile_tar_gz, - verbose=verbose, - ) - return kofam_profile_tar_gz - - -def generate_modified_kegg_fasta(kegg_fasta, gene_ko_link_loc=None): - """ - Takes kegg fasta file and gene ko link file, adds kos not already in headers to headers - Whish I knew about this, oh well I may split this out. - """ - genes_ko_dict = defaultdict(list) - if gene_ko_link_loc is not None: - if gene_ko_link_loc.endswith(".gz"): - gene_ko_link_fh = gzip.open(gene_ko_link_loc, "rt") - else: - gene_ko_link_fh = open(gene_ko_link_loc) - for line in gene_ko_link_fh: - gene, ko = line.strip().split() - genes_ko_dict[gene].append(remove_prefix(ko, "ko:")) - for seq in read_sequence(kegg_fasta, format="fasta"): - new_description = seq.metadata["description"] - for ko in genes_ko_dict[seq.metadata["id"]]: - if ko not in new_description: - new_description += "; %s" % ko - seq.metadata["description"] = new_description - yield seq - - -def process_kegg( - kegg_loc, - output_dir, - logger, - gene_ko_link_loc=None, - download_date=None, - threads=10, - verbose=True, -): - if download_date is None: - download_date = get_iso_date() - if gene_ko_link_loc is not None: - # add KOs to end of header where KO is not already there - kegg_mod_loc = path.join(output_dir, "kegg.mod.fa") - write_sequence( - generate_modified_kegg_fasta(kegg_loc, gene_ko_link_loc), - format="fasta", - into=kegg_mod_loc, - ) - else: - kegg_mod_loc = kegg_loc - # make mmseqsdb from modified kegg fasta - kegg_mmseqs_db = path.join(output_dir, "kegg.%s.mmsdb" % download_date) - make_mmseqs_db( - kegg_mod_loc, - kegg_mmseqs_db, - logger, - create_index=True, - threads=threads, - verbose=verbose, - ) - LOGGER.info("KEGG database processed") - return {"kegg": kegg_mmseqs_db} - - -def process_kofam_hmm( - kofam_profile_tar_gz, - output_dir=DFLT_OUTPUT_DIR, - logger=LOGGER, - threads=1, - verbose=False, -): - kofam_profiles = path.join(output_dir, "kofam_profiles") - mkdir(kofam_profiles) - run_process( - ["tar", "-xzf", kofam_profile_tar_gz, "-C", kofam_profiles], - logger, - verbose=verbose, - ) - merged_kofam_profiles = path.join(output_dir, "kofam_profiles.hmm") - merge_files( - glob(path.join(kofam_profiles, "profiles", "*.hmm")), merged_kofam_profiles - ) - run_process(["hmmpress", "-f", merged_kofam_profiles], logger, verbose=verbose) - LOGGER.info("KOfam database processed") - return {"kofam_hmm": merged_kofam_profiles} - - -def download_kofam_ko_list(output_dir=".", logger=LOGGER, verbose=False): - kofam_ko_list_gz = path.join(output_dir, "kofam_ko_list.tsv.gz") - download_file( - "ftp://ftp.genome.jp/pub/db/kofam/ko_list.gz", - logger, - kofam_ko_list_gz, - verbose=verbose, - ) - return kofam_ko_list_gz - - -def download_pfam(output_dir=".", logger=LOGGER, verbose=True): - pfam_full_zipped = path.join(output_dir, "Pfam-A.full.gz") - download_file( - "ftp://ftp.ebi.ac.uk/pub/databases/Pfam/current_release/Pfam-A.full.gz", - logger, - pfam_full_zipped, - verbose=verbose, - ) - return pfam_full_zipped - - -def download_viral( - output_dir=".", logger=LOGGER, viral_files=NUMBER_OF_VIRAL_FILES, verbose=True -): - """Can only download newest version""" - # download all of the viral protein files, need to know the number of files - # TODO: Make it so that you don't need to know number of viral files in refseq viral - - faa_base_name = "viral.%s.protein.faa.gz" - viral_faa_glob = path.join(output_dir, faa_base_name % "*") - for number in range(viral_files): - number += 1 - refseq_url = ( - "ftp://ftp.ncbi.nlm.nih.gov/refseq/release/viral/viral.%s.protein.faa.gz" - % number - ) - refseq_faa = path.join(output_dir, faa_base_name % number) - download_file(refseq_url, logger, refseq_faa, verbose=verbose) - - # then merge files from above - merged_viral_faas = path.join(output_dir, "viral.merged.protein.faa.gz") - run_process( - ["cat %s > %s" % (" ".join(glob(viral_faa_glob)), merged_viral_faas)], - logger, - shell=True, - ) - return merged_viral_faas - - -def download_uniref( - output_dir=".", - logger=LOGGER, - version=DEFAULT_UNIREF_VERSION, - threads=10, - verbose=True, -): - uniref_fasta_zipped = path.join(output_dir, "uniref%s.fasta.gz" % version) - uniref_url = ( - "https://ftp.uniprot.org/pub/databases/uniprot/uniref/uniref%s/uniref%s.fasta.gz" - % (version, version) - ) - download_file(uniref_url, logger, uniref_fasta_zipped, verbose=verbose) - return uniref_fasta_zipped - - -def download_peptidase(output_dir=".", logger=LOGGER, verbose=True): - peptidase_faa = path.join(output_dir, "merops_peptidases_nr.faa") - merops_url = "ftp://ftp.ebi.ac.uk/pub/databases/merops/current_release/pepunit.lib" - download_file(merops_url, logger, peptidase_faa, verbose=verbose) - return peptidase_faa - - -def download_vogdb( - output_dir=".", logger=LOGGER, version=DEFAULT_VOGDB_VERSION, verbose=True -): - vog_hmm_targz = path.join(output_dir, "vog.hmm.tar.gz") - vogdb_url = f"http://fileshare.csb.univie.ac.at/vog/{version}/vog.hmm.tar.gz" - download_file(vogdb_url, logger, vog_hmm_targz, verbose=verbose) - return vog_hmm_targz - - -def process_kofam_ko_list( - kofam_ko_list_gz, output_dir=".", logger=LOGGER, threads=1, verbose=False -): - # TODO: fix this so that it is gunzipped to the path - kofam_ko_list = path.join(output_dir, "kofam_ko_list.tsv") - run_process( - ["gunzip", "-c", kofam_ko_list_gz], - logger, - save_output=kofam_ko_list, - verbose=verbose, - ) - LOGGER.info("KOfam ko list processed") - return {"kofam_ko_list": kofam_ko_list} - - -def process_uniref( - uniref_fasta_zipped, - output_dir=".", - logger=LOGGER, - version=DEFAULT_UNIREF_VERSION, - threads=10, - verbose=True, -): - uniref_mmseqs_db = path.join( - output_dir, "uniref%s.%s.mmsdb" % (version, get_iso_date()) - ) - make_mmseqs_db( - uniref_fasta_zipped, - uniref_mmseqs_db, - logger, - create_index=True, - threads=threads, - verbose=verbose, - ) - LOGGER.info("UniRef database processed") - return {"uniref": uniref_mmseqs_db} - - -def process_mmspro( - full_alignment, - output_dir, - logger=LOGGER, - db_name=DEFAULT_MMMSPRO_DB_NAME, - threads=10, - verbose=True, -): - mmseqs_msa = path.join(output_dir, "%s.mmsmsa" % db_name) - run_process( - ["mmseqs", "convertmsa", full_alignment, mmseqs_msa], logger, verbose=verbose - ) - mmseqs_profile = path.join(output_dir, "%s.mmspro" % db_name) - run_process( - [ - "mmseqs", - "msa2profile", - mmseqs_msa, - mmseqs_profile, - "--match-mode", - "1", - "--threads", - str(threads), - ], - logger, - verbose=verbose, - ) - tmp_dir = path.join(output_dir, "tmp") - run_process( - [ - "mmseqs", - "createindex", - mmseqs_profile, - tmp_dir, - "-k", - "5", - "-s", - "7", - "--threads", - str(threads), - ], - logger, - verbose=verbose, - ) - return mmseqs_profile - - -def process_pfam( - pfam_full_zipped, output_dir=".", logger=LOGGER, threads=10, verbose=True -): - pfam_profile = process_mmspro( - pfam_full_zipped, output_dir, logger, "pfam", threads, verbose - ) - LOGGER.info("PFAM database processed") - return {"pfam": pfam_profile} - - -def process_dbcan(input, output_dir, logger=LOGGER, verbose=True, threads=1): - output = path.join(output_dir, path.basename(input)) - move(input, output) - run_process(["hmmpress", "-f", output], logger, verbose=verbose) - LOGGER.info("dbCAN database processed") - return {"dbcan": output} - - -def process_viral( - merged_viral_faas, - output_dir=".", - logger=LOGGER, - viral_files=NUMBER_OF_VIRAL_FILES, - threads=10, - verbose=True, -): - refseq_viral_mmseqs_db = path.join( - output_dir, "refseq_viral.%s.mmsdb" % get_iso_date() - ) - make_mmseqs_db( - merged_viral_faas, - refseq_viral_mmseqs_db, - logger, - create_index=True, - threads=threads, - verbose=verbose, - ) - LOGGER.info("RefSeq viral database processed") - return {"viral": refseq_viral_mmseqs_db} - - -def process_peptidase( - peptidase_faa, output_dir=".", logger=LOGGER, threads=10, verbose=True -): - peptidase_mmseqs_db = path.join(output_dir, "peptidases.%s.mmsdb" % get_iso_date()) - make_mmseqs_db( - peptidase_faa, - peptidase_mmseqs_db, - logger, - create_index=True, - threads=threads, - verbose=verbose, - ) - LOGGER.info("MEROPS database processed") - return {"peptidase": peptidase_mmseqs_db} - - -def process_vogdb( - vog_hmm_targz, - output_dir=".", - logger=LOGGER, - version=DEFAULT_VOGDB_VERSION, - threads=1, - verbose=True, -): - hmm_dir = path.join(output_dir, "vogdb_hmms") - mkdir(hmm_dir) - vogdb_targz = tarfile.open(vog_hmm_targz) - vogdb_targz.extractall(hmm_dir) - vog_hmms = path.join(output_dir, f"vog_{version}_hmms.txt") - merge_files(glob(path.join(hmm_dir, "VOG*.hmm")), vog_hmms) - run_process(["hmmpress", "-f", vog_hmms], logger, verbose=verbose) - LOGGER.info("VOGdb database processed") - return {"vogdb": vog_hmms} - - -def download_vog_annotations( - output_dir, logger=LOGGER, version=DEFAULT_VOGDB_VERSION, verbose=True -): - vog_annotations = path.join(output_dir, "vog_annotations_%s.tsv.gz" % version) - download_file( - "http://fileshare.csb.univie.ac.at/vog/%s/vog.annotations.tsv.gz" % version, - logger, - vog_annotations, - verbose=verbose, - ) - return vog_annotations - - -def download_genome_summary_form( - output_dir, logger=LOGGER, branch="master", verbose=True -): - genome_summary_form = path.join( - output_dir, "genome_summary_form.%s.tsv" % get_iso_date() - ) - download_file( - "https://raw.githubusercontent.com/WrightonLabCSU/DRAM/%s/data/genome_summary_form.tsv" - % branch, - logger, - genome_summary_form, - verbose=verbose, - ) - return genome_summary_form - - -def download_module_step_form(output_dir, logger=LOGGER, branch="master", verbose=True): - function_heatmap_form = path.join( - output_dir, "module_step_form.%s.tsv" % get_iso_date() - ) - download_file( - "https://raw.githubusercontent.com/WrightonLabCSU/DRAM/%s/data/module_step_form.tsv" - % branch, - logger, - function_heatmap_form, - verbose=verbose, - ) - return function_heatmap_form - - -def download_etc_module_database( - output_dir, logger=LOGGER, branch="master", verbose=True -): - etc_module_database = path.join( - output_dir, "etc_mdoule_database.%s.tsv" % get_iso_date() - ) - download_file( - "https://raw.githubusercontent.com/WrightonLabCSU/DRAM/%s/data/etc_module_database.tsv" - % branch, - logger, - etc_module_database, - verbose=verbose, - ) - return etc_module_database - - -def download_function_heatmap_form( - output_dir, logger=LOGGER, branch="master", verbose=True -): - function_heatmap_form = path.join( - output_dir, "function_heatmap_form.%s.tsv" % get_iso_date() - ) - download_file( - "https://raw.githubusercontent.com/WrightonLabCSU/DRAM/%s/data/function_heatmap_form.tsv" - % branch, - logger, - function_heatmap_form, - verbose=verbose, - ) - return function_heatmap_form - - -def download_amg_database(output_dir, logger=LOGGER, branch="master", verbose=True): - amg_database = path.join(output_dir, "amg_database.%s.tsv" % get_iso_date()) - download_file( - "https://raw.githubusercontent.com/WrightonLabCSU/DRAM/%s/data/amg_database.tsv" - % branch, - logger, - amg_database, - verbose=verbose, - ) - return amg_database - - -def check_file_exists(*paths): - for i in paths: - if i is None: - continue - elif path.isfile(i): - continue - else: - raise ValueError(f"Database location does not exist: {i}") - - -def prepare_databases( - output_dir, - loggpath=None, - kegg_loc=None, - gene_ko_link_loc=None, - kofam_hmm_loc=None, - kofam_ko_list_loc=None, - kegg_download_date=None, - uniref_loc=None, - uniref_version=DEFAULT_UNIREF_VERSION, - pfam_loc=None, - pfam_hmm_loc=None, - dbcan_loc=None, - dbcan_fam_activities: str = None, - dbcan_subfam_ec: str = None, - dbcan_version=DEFAULT_DBCAN_RELEASE, - dbcan_date=DEFAULT_DBCAN_DATE, - viral_loc=None, - peptidase_loc=None, - vogdb_loc=None, - vogdb_version=DEFAULT_VOGDB_VERSION, - vog_annotations=None, - genome_summary_form_loc=None, - module_step_form_loc=None, - etc_module_database_loc=None, - function_heatmap_form_loc=None, - amg_database_loc=None, - camper_tar_gz_loc=None, - number_of_viral_files=NUMBER_OF_VIRAL_FILES, - fegenie_tar_gz_loc=None, - sulphur_tar_gz_loc=None, - skip_uniref=False, - keep_database_files=False, - branch="master", - threads=10, - verbose=True, - select_db=None, - clear_config=False, -): - - dram_settings = { - "kegg": { - "name": "KEGG db", - "description_db_updated": "Unknown, or Never", - "citation": KEGG_CITATION, - }, - "gene_ko_link": {"name": "KEGG Gene KO link", "citation": KEGG_CITATION}, - "kofam_hmm": {"name": "KOfam db", "citation": KOFAM_CITATION}, - "kofam_ko_list": {"name": "KOfam KO list", "citation": KOFAM_CITATION}, - "uniref": { - "name": "UniRef db", - "description_db_updated": "Unknown, or Never", - "citation": UNIREF_CITATION, - }, - "pfam": {"name": "Pfam db", "citation": PFAM_CITATION}, - "pfam_hmm": { - "name": "Pfam hmm dat", - "description_db_updated": "Unknown, or Never", - "citation": PFAM_CITATION, - }, - "dbcan": {"name": "dbCAN db", "citation": DBCAN_CITATION}, - "dbcan_fam_activities": { - "name": "dbCAN family activities", - "citation": DBCAN_CITATION, - }, - "dbcan_subfam_ec": { - "name": "dbCAN subfamily EC numbers", - "citation": DBCAN_CITATION, - }, - "vogdb": {"name": "VOGDB db", "citation": VOGDB_CITATION}, - "vog_annotations": { - "name": "VOG annotations", - "description_db_updated": "Unknown, or Never", - "citation": VOGDB_CITATION, - }, - "viral": { - "name": "RefSeq Viral db", - "description_db_updated": "Unknown, or Never", - "citation": VIRAL_REFSEQ_CITATION, - }, - "peptidase": { - "name": "MEROPS peptidase db", - "description_db_updated": "Unknown, or Never", - "citation": PEPTIDASE_CITATION, - }, - "genome_summary_form": {"name": "Genome summary form"}, - "module_step_form": {"name": "Module step form"}, - "function_heatmap_form": {"name": "Function heatmap form"}, - "amg_database": {"name": "AMG database"}, - "etc_module_database": {"name": "ETC module database"}, - } - dram_settings.update(CAMPER_DRAM_SETTINGS) - dram_settings.update(FEGENIE_DRAM_SETTINGS) - dram_settings.update(SULPHUR_DRAM_SETTINGS) - database_settings = { - "kegg": {}, - "gene_ko_link": {}, - "kofam_hmm": {}, - "kofam_ko_list": {}, - "uniref": {"version": uniref_version}, - "pfam": {}, - "pfam_hmm": {}, - "dbcan": {"version": dbcan_version}, - "dbcan_fam_activities": {"version": dbcan_version, "upload_date": dbcan_date}, - "dbcan_subfam_ec": {"version": dbcan_version, "upload_date": dbcan_date}, - "vogdb": {"version": vogdb_version}, - "vog_annotations": {"version": vogdb_version}, - "viral": {}, - "peptidase": {}, - "genome_summary_form": {"branch": branch}, - "module_step_form": {"branch": branch}, - "function_heatmap_form": {"branch": branch}, - "amg_database": {"branch": branch}, - "etc_module_database": {"branch": branch}, - } - database_settings.update(CAMPER_DOWNLOAD_OPTIONS) - database_settings.update(FEGENIE_DOWNLOAD_OPTIONS) - database_settings.update(SULPHUR_DOWNLOAD_OPTIONS) - process_settings = { - "kegg": {}, - "gene_ko_link": {}, - "kofam_hmm": {}, - "kofam_ko_list": {}, - "uniref": {"version": uniref_version}, - "pfam": {}, - "pfam_hmm": {}, - "dbcan": {}, - "dbcan_fam_activities": {}, - "dbcan_subfam_ec": {}, - "vogdb": {}, - "vog_annotations": {}, - "viral": {"viral_files": number_of_viral_files}, - "peptidase": {}, - "genome_summary_form": {}, - "module_step_form": {}, - "function_heatmap_form": {}, - "amg_database": {}, - "etc_module_database": {}, - } - process_settings.update(CAMPER_PROCESS_OPTIONS) - process_settings.update(FEGENIE_PROCESS_OPTIONS) - process_settings.update(SULPHUR_PROCESS_OPTIONS) - - # setup temp, logging, and db_handler - if not path.isdir(output_dir): - mkdir(output_dir) - temporary = path.join(output_dir, "database_files") - mkdir(temporary) - main_log = path.join(output_dir, "database_processing.log") - setup_logger(LOGGER, *[(main_log, loggpath) if loggpath is not None else main_log]) - db_handler = DatabaseHandler(logger=LOGGER) - if clear_config or select_db is None: - db_handler.clear_config() - - db_handler.config["log_path"] = main_log - db_handler.write_config() - LOGGER.info("Starting the process of downloading data") - - if skip_uniref: - LOGGER.info("Skipping UniRef") - del database_settings["uniref"] - - locs = { - i.removesuffix("_loc"): j - for i, j in locals().items() - if i.endswith("_loc") and j is not None - } - download_functions = { - i.removeprefix("download_"): j - for i, j in globals().items() - if callable(j) and i.startswith("download_") - } - process_functions = { - i.removeprefix("process_"): j - for i, j in globals().items() - if callable(j) and i.startswith("process_") - } - functions = { - i: j for i, j in globals().items() if callable(j) and i.startswith("download_") - } - - # Check any specified paths exist - missing_user_inputs = [i for i in locs if not path.exists(i)] - if len(missing_user_inputs) > 1: - raise ValueError( - f"The fallowing user provided paths don't seem to exist: {missing_user_inputs}" - ) - - un_obtainable = [ - i for i in database_settings if i not in locs and i not in download_functions - ] - - for i in un_obtainable: - LOGGER.info( - f"The {i}_loc argument was not used to specify a downloaded {i} file, and dram can not" - " download it its self. So it is assumed that the user wants to set up DRAM without it" - ) - del database_settings[i] - - # check inputs - if skip_uniref and uniref_loc is not None: - raise ValueError( - "Cannot skip UniRef processing and provide a location of UniRef." - " Skipping UniRef will cause provided UniRef file to not be used." - ) - - if select_db is not None: - miss_name = [i for i in select_db if i not in database_settings] - user_inputs = [i for i in locs if i not in select_db] - if len(miss_name) > 0: - LOGGER.error( - "Only the databases in the db list can be pased to select_db, " - f"you passed {miss_name} which is/are not in the list." - ) - raise ValueError("Bad user input, see log") - - if len(user_inputs) > 0: - LOGGER.error( - f"The user provided location for {user_inputs}, but required it not be used by proving" - f" the select_db argument for other databases. This would suggest that the" - " user may have made a mistake and so this error is rased." - ) - raise ValueError("Bad user input, see log") - - database_settings = {i: database_settings[i] for i in select_db} - - LOGGER.info("Database preparation started") - - # Download DBs - for i, j in database_settings.items(): - if locs.get(i) is None: - LOGGER.info(f"Downloading {i}") - if i in process_functions: - locs[i] = download_functions[i](temporary, LOGGER, **j, verbose=verbose) - else: - locs[i] = download_functions[i]( - output_dir, LOGGER, **j, verbose=verbose - ) - j["Download time"] = datetime.now().strftime("%m/%d/%Y, %H:%M:%S") - j["Origin"] = "Downloaded by DRAM" - else: - j = {k: "Unknown" for k in j} - j["Download time"] = "Unknown" - j["Origin"] = "Provided by user" - j["Original path"] = locs[i] - if i not in process_functions: - LOGGER.info(f"Copying {locs[i]} to output_dir") - locs[i] = copyfile( - locs[i], path.join(output_dir, path.basename(locs[i])) - ) - - LOGGER.info("All raw data files were downloaded successfully") - - # Process databases - for i in locs: - processed_locs = {} - if i in process_functions: - LOGGER.info(f"Processing {i}") - processed_locs = process_functions[i]( - locs[i], - output_dir, - LOGGER, - threads=threads, - verbose=verbose, - **process_settings[i], - ) - else: - processed_locs = {i: locs[i]} - for k, v in processed_locs.items(): - final_dest = path.join(output_dir, path.basename(v)) - if v != final_dest: - for db_file in glob("%s*" % v): - move(db_file, path.join(output_dir, path.basename(db_file))) - v = path.join(output_dir, path.basename(v)) - # update_dram_forms the settings per OUTPUT fill, including the process_settings - # and database_settings, which are per input file. - if db_handler.config.get("setup_info") is None: - db_handler.config["setup_info"] = {} - db_handler.config["setup_info"][k] = { - **dram_settings[k], - **process_settings[i], - **database_settings[i], - } - db_handler.set_database_paths(**{f"{k}_loc": v}) - db_handler.write_config() - LOGGER.info(f"Moved {k} to final destination, configuration updated") - - LOGGER.info("Populating the description db, this may take some time") - db_handler.config["description_db"] = path.realpath( - path.join(output_dir, "description_db.sqlite") - ) - db_handler.write_config() - db_handler.populate_description_db( - db_handler.config["description_db"], select_db, update_config=False - ) - # todo make db handler such that the destruction on success write_config - db_handler.write_config() - LOGGER.info("DRAM description database populated") - - if not keep_database_files: - rmtree(temporary) - LOGGER.info("Database preparation completed") - - -def update_dram_forms(output_dir, branch="master"): - if not path.isdir(output_dir): - mkdir(output_dir) - form_locs = dict() - form_locs["genome_summary_form_loc"] = download_genome_summary_form( - output_dir, branch - ) - form_locs["module_step_form_loc"] = download_module_step_form(output_dir, branch) - form_locs["etc_module_database_loc"] = download_etc_module_database( - output_dir, branch - ) - form_locs["function_heatmap_form_loc"] = download_function_heatmap_form( - output_dir, branch - ) - form_locs["amg_database_loc"] = download_amg_database(output_dir, branch) - db_handler = DatabaseHandler() - db_handler.set_database_paths(**form_locs) - - -""" - -os.system("DRAM.py annotate -i /home/projects-wrighton-2/DRAM/development_flynn/release_validation/data_sets/15_soil_genomes/all_data/Cytophaga_hutchinsonii_ATCC_33406.fasta -o test_15soil --use_camper --use_fegenie") -import os -os.system('DRAM-setup.py prepare_databases --output_dir /home/projects-wrighton-2/DRAM/dram_data/dram1.4_final_06_21_22/ --kegg_loc /home/Database/KEGG/kegg-all-orgs_20220603/kegg-all-orgs_unique_reheader_20220603.pep --threads 40') -os.system('DRAM-setup.py -h ') - version print DRAM version - prepare_databases Download and process databases for annotation - set_database_locations - Set database locations for already processed databases - update_description_db - Update description database - update_dram_forms Update DRAM distillate and liquor forms - print_config Print database locations - import_config Import CONFIG file - export_config Export CONFIG file -os.system('DRAM-setup.py print_config') -os.system('DRAM-setup.py export_config') -os.system('DRAM-setup.py import_config --config_loc dram2/CONFIG') -os.system('DRAM-setup.py set_database_locations') -os.system('DRAM-setup.py update_description_db') - -os.system('DRAM-setup.py prepare_databases --output_dir download_test') -os.system('DRAM-setup.py prepare_databases --output_dir download_test' -os.system('DRAM-setup.py prepare_databases --output_dir download_test --select_db vogdb') - ' --kegg_loc KEGG_LOC /home/Database/KEGG/kegg-all-orgs_20220129/kegg-all-orgs_unique_reheader_20220129.pep" ' # KEGG protein file, should be a single .pep, please merge all KEGG pep files (default: None) - '--threads 30' Number of threads to use building mmseqs2 databases (default: 10) - # '--gene_ko_link_loc ' # KEGG gene ko link, can be gzipped or not - '--kofam_hmm_loc' # hmm file for KOfam (profiles.tar.gz) (default: None) - '--kofam_ko_list_loc' # KOfam ko list file (ko_list.gz) (default: None) - ' --gene_ko_link_loc' # GENE_KO_LINK_LOC KEGG gene ko link, can be gzipped or not (default: None) - ' --kegg_download_date' # Date KEGG was download to include in database name (default: None) - ' --uniref_loc' # File path to uniref, if already downloaded (uniref90.fasta.gz) (default: None) - ' --uniref_version' # UniRef version to download (default: 90) - ' --skip_uniref' # Do not download and process uniref90. Saves time and memory usage and does not impact DRAM distillation - ' --pfam_loc' # File path to pfam-A full file, if already downloaded (Pfam-A.full.gz) (default: None) - ' --pfam_hmm' # pfam hmm .dat file to get PF descriptions, if already downloaded (Pfam-A.hmm.dat.gz) (default: None) - ' --dbcan_loc' # File path to dbCAN, if already downloaded (dbCAN-HMMdb-V9.txt) (default: None) - ' --dbcan_fam_activities' # CAZY family activities file, if already downloaded (CAZyDB.07302020.fam-activities.txt) (default: None) - ' --dbcan_version' # version of dbCAN to use (default: 10) - ' --vogdb_loc' # hmm file for vogdb, if already downloaded (vog.hmm.tar.gz) (default: None) - ' --vog_annotations_loc' # vogdb annotations file, if already downloaded (vog.annotations.tsv.gz) (default: None) - ' --viral_loc' # File path to merged viral protein faa, if already downloaded (viral.x.protein.faa.gz) (default: None) - ' --peptidase_loc' # File path to MEROPS peptidase fasta, if already downloaded (pepunit.lib) (default: None) - ' --genome_summary_form_loc' # File path to genome summary form,if already downloaded (default: None) - ' --module_step_form_loc' # File path to module step form, ifalready downloaded (default: None) - ' --etc_module_database_loc' # File path to etc module database, if already downloaded (default: None) - ' --function_heatmap_form_loc' # File path to function heatmap form, if already downloaded (default: None) - ' --amg_database_loc' # File path to amg database, if already downloaded (default: None) - ' --branch' # git branch from which to download forms; THIS SHOULD NOT BE CHANGED BY REGULAR USERS (default: master) - ' --keep_database_files' # Keep unporcessed database files (default: False) - - - - - - - - - - - - - - - - - - - - - - -) -""" \ No newline at end of file diff --git a/bin/assets/forms/db_utils.py b/bin/assets/forms/db_utils.py deleted file mode 100755 index fc9595bb..00000000 --- a/bin/assets/forms/db_utils.py +++ /dev/null @@ -1,287 +0,0 @@ -""" -*Old DRAM v1/early v2 DB utils code* - - -General utility, available to all dram tools -""" -import subprocess -from dataclasses import dataclass -from urllib.request import urlopen, urlretrieve -from urllib.error import HTTPError, URLError -from typing import Optional -from pathlib import Path -import logging - -# from os import getenv -import pandas as pd - - -def export_posible_path( - path: Optional[Path], relative_path: Optional[Path] = None -) -> Optional[str]: - if path is None: - return None - out_path = path.absolute() - if relative_path is not None and relative_path in out_path.parents: - out_path = out_path.relative_to(relative_path) - return out_path.as_posix() - - -def import_posible_path( - path: Optional[str], relative_path: Optional[Path] = None -) -> Optional[Path]: - if path is None: - return None - out_path = Path(path) - if relative_path is None: - return out_path.absolute() - return (relative_path / out_path).absolute() - - -@dataclass -class Fasta: - """ - The Fasta Class - --------------- - - Store your data and access it safly - """ - - name: str - origin: Path - tmp_dir: Path - faa: Path - fna: None | Path - gff: None | Path - mmsdb: None | Path - - def export(self, output_dir): - return ( - self.name, - export_posible_path(self.origin), - export_posible_path(self.tmp_dir, output_dir), - export_posible_path(self.faa, output_dir), - export_posible_path(self.fna, output_dir), - export_posible_path(self.gff, output_dir), - export_posible_path(self.mmsdb, output_dir), - ) - - @classmethod - def import_strings( - cls, - relative_path: Path, - name: str, - origin: str, - tmp_dir: str, - faa: str, - fna: str, - gff: str, - mmsdb: str, - ): - ob = cls( - name, - import_posible_path(origin), - import_posible_path(tmp_dir, relative_path), - import_posible_path(faa, relative_path), - import_posible_path(fna, relative_path), - import_posible_path(gff, relative_path), - import_posible_path(mmsdb, relative_path), - ) - return ob - - def get_fna(self) -> Path: - """ - Get the fna and handel it not existing - - :returns: - :raises ValueError: - """ - if self.fna is None: - raise ValueError( - "The fna file is not defined, did you import allready called faa files?" - ) - return self.fna - - def get_gff(self) -> Path: - """ - Get the gff and handel it not existing - - :returns: - :raises ValueError: - """ - if self.gff is None: - raise ValueError( - "The gff file is not defined, did you import allready called faa files?" - ) - return self.gff - - def get_mmsdb(self) -> Path: - """ - Get the mmsdb and handel it not existing - - :returns: - :raises ValueError: - """ - if self.mmsdb is None: - raise ValueError( - "The mmsdb file is not defined, are you trying to skip or develop the annotate pipeline?" - ) - return self.gff - - -class DramUsageError(Exception): - "Raised when dram is not used corectly, usally it means you are missing a step" - pass - - -def get_package_path(local_path: Path): - """ - Locate the package data or non python files - - :param local_path: - :returns: - """ - abs_snake_path = Path(__file__).parent.parent.absolute() / local_path - return abs_snake_path - - -def download_file( - url: str, - output_file: Path, - logger: logging.Logger, - alt_urls: None | list[str] = None, -): - """ - Download a file, probably a database - - :param url: - :param output_file: - :param logger: - :param alt_urls: - :returns: - :raises URLError: - """ - # TODO: catching error 4 and give error message to retry or retry automatically - links = [url] if alt_urls is None else [url] + alt_urls - for link in links: - logger.debug("downloading %s" % url) - try: - urlretrieve(link, output_file) - return - except BaseException as error: - # BaseException is good http was to exact - logger.warning(f"Something went wrong with the download of the url: {link}") - logger.warning(error) - raise URLError( - "DRAM whas not able to download a key database, check the logg for details" - ) - # run_process(['wget', '-O', output_file, url], verbose=verbose) - - -def get_annotation_ids_by_row(data, logger): - # functions = {i: j for i, j in ID_FUNCTION_DICT.items() if i in data.columns} - # missing = [i for i in ID_FUNCTION_DICT if i not in data.columns] - logger.info( - "Note: the fallowing id fields " - f"were not in the annotations file and are not being used: {missing}," - f" but these are {list(functions.keys())}" - ) - out = data.apply( - lambda x: { - i - for k, v in functions.items() - if not pd.isna(x[k]) - for i in v(str(x[k])) - if not pd.isna(i) - }, - axis=1, - ) - return out - - -# def get_all_annotation_ids(data, logger): -# data = get_ids_from_annotations_by_row(data, logger) -# data.apply(list) -# out = Counter(chain(*data.values)) -# return out - - -def run_process( - command, - logger, - shell: bool = False, - capture_stdout: bool = True, - save_output: str = None, - check: bool = False, - stop_on_error: bool = True, - verbose: bool = False, -) -> str: - """ - Standardization of parameters for using subprocess.run, provides verbose mode and option to run via shell - """ - # TODO just remove check - try: - results = subprocess.run( - command, - check=check, - shell=shell, - stdout=subprocess.PIPE, - stderr=subprocess.PIPE, - text=True, - ) - except subprocess.CalledProcessError as error: - logger.critical(f"The subcommand {command} experienced an error") - if stop_on_error: - raise error - if results.returncode != 0: - logger.critical( - f"The subcommand {command} experienced an error: {results.stderr}" - ) - logging.debug(results.stdout) - if stop_on_error: - raise subprocess.SubprocessError( - f"The subcommand {' '.join(command)} experienced an error, see the log for more info." - ) - - if save_output is not None: - with open(save_output, "w") as out: - out.write(results.stdout) - - if capture_stdout: - return results.stdout - - -def merge_files(files_to_merge, outfile, has_header=False): - """It's in the name, if has_header assumes all files have the same header""" - with open(outfile, "w") as outfile_handle: - if has_header: - outfile_handle.write(open(files_to_merge[0]).readline()) - for file in files_to_merge: - with open(file) as f: - if has_header: - _ = f.readline() - outfile_handle.write(f.read()) - - -def divide_chunks(l, n): - # looping till length l - for i in range(0, len(l), n): - yield l[i: i + n] - - -def remove_prefix(text, prefix): - if text.startswith(prefix): - return text[len(prefix):] - return text # or whatever - - -def remove_suffix(text, suffix): - if text.endswith(suffix): - return text[: -1 * len(suffix)] - return text # or whatever - - -def get_ordered_uniques(seq): - seen = set() - seen_add = seen.add - return [x for x in seq if not (x in seen or seen_add(x) or pd.isna(x))] diff --git a/bin/assets/forms/distill_ag_Jan252024.slk b/bin/assets/forms/distill_ag_Jan252024.slk old mode 100755 new mode 100644 diff --git a/bin/assets/forms/distill_sheets/custom_distill/test-1-multiple-gene-id.tsv b/bin/assets/forms/distill_sheets/custom_distill/test-1-multiple-gene-id.tsv old mode 100755 new mode 100644 diff --git a/bin/assets/forms/distill_sheets/custom_distill/test-3-EC.tsv b/bin/assets/forms/distill_sheets/custom_distill/test-3-EC.tsv old mode 100755 new mode 100644 diff --git a/bin/assets/forms/distill_sheets/distill_ag.tsv b/bin/assets/forms/distill_sheets/distill_ag.tsv old mode 100755 new mode 100644 index b863d049..fa63efc6 --- a/bin/assets/forms/distill_sheets/distill_ag.tsv +++ b/bin/assets/forms/distill_sheets/distill_ag.tsv @@ -1,235 +1,235 @@ gene_id gene_description pathway topic_ecosystem category subcategory note reference -K00531 nitrogenase delta subunit [EC:1.18.6.1] [RN:R05185] Nitrogen fixation, nitrogen => ammonia ag Nitrogen Cycling N2 Fixation -K02586 nitrogenase molybdenum-iron protein [EC:1.18.6.1] [RN:R05185] Nitrogen fixation, nitrogen => ammonia ag Nitrogen Cycling N2 Fixation -K02588 nitrogenase iron protein [RN:R05185] Nitrogen fixation, nitrogen => ammonia ag Nitrogen Cycling N2 Fixation -K02591 nitrogenase molybdenum-iron protein [EC:1.18.6.1] [RN:R05185] Nitrogen fixation, nitrogen => ammonia ag Nitrogen Cycling N2 Fixation -K22896 vanadium-dependent nitrogenase [EC:1.18.6.2] [RN:R12084] Nitrogen fixation, nitrogen => ammonia ag Nitrogen Cycling N2 Fixation -K22897 vanadium-dependent nitrogenase [EC:1.18.6.2] [RN:R12084] Nitrogen fixation, nitrogen => ammonia ag Nitrogen Cycling N2 Fixation -K22898 vanadium nitrogenase delta subunit [EC:1.18.6.2] [RN:R12084] Nitrogen fixation, nitrogen => ammonia ag Nitrogen Cycling N2 Fixation -K22899 vanadium nitrogenase iron protein [RN:R12084] Nitrogen fixation, nitrogen => ammonia ag Nitrogen Cycling N2 Fixation -K00370 narG, nitrate reductase, alpha subunit [EC:1.7.99.-] [RN:R00798] nitrate → nitrite ag Nitrogen Cycling N Reduction -K00371 narH, nitrate reductase, beta subunit [EC:1.7.99.-] [RN:R00798] nitrate → nitrite ag Nitrogen Cycling N Reduction -K00374 narI, nitrate reductase, gamma subunit [EC:1.7.99.-] [RN:R00798] nitrate → nitrite ag Nitrogen Cycling N Reduction -K02567 periplasmic nitrate reductase NapA [EC:1.7.99.-] [RN:R00798] nitrate → nitrite ag Nitrogen Cycling N Reduction -K02568 cytochrome c-type protein NapB [RN:R00798] nitrate → nitrite ag Nitrogen Cycling N Reduction -K00368 nitrite reductase (NO-forming) [EC:1.7.2.1] [RN:R00783 R00785] nitrite → nitric oxide ag Nitrogen Cycling N Reduction -K15864 nitrite reductase (NO-forming) [EC:1.7.2.1] [RN:R00783 R00785] nitrite → nitric oxide ag Nitrogen Cycling N Reduction -K15877 fungal nitric oxide reductase (CYP55) [EC:1.7.1.14] nitric oxide → nitrous oxide ag Nitrogen Cycling NO to N2O -K04561 nitric oxide reductase [EC:1.7.2.5] [RN:R00294] nitric oxide → nitrous oxide ag Nitrogen Cycling NO to N2O -K00376 nitrous-oxide reductase [EC:1.7.2.4] [RN:R02804] nitrous oxide → nitrogen gas ag Nitrogen Cycling N2O to N2 -K02575 NRT; MFS transporter= NNP family= nitrate/nitrite transporter Nitrate/nitrite assimilation ag Nitrogen Cycling N Reduction -K00367 narB, assimilatory nitrate reductase [EC:1.7.7.2] Assimilatory nitrate reduction =Nitrate → nitrite ag Nitrogen Cycling N Reduction -K10534 nr, assimilatory nitrate reductase [EC:1.7.7.2] Assimilatory nitrate reduction =Nitrate → nitrite ag Nitrogen Cycling N Reduction -K00372 assimilatory nitrate reductase [EC:1.7.99.-] [RN:R00798] Assimilatory nitrate reduction =Nitrate → nitrite ag Nitrogen Cycling N Reduction -K00360 assimilatory nitrate reductase [EC:1.7.99.-] [RN:R00798] Assimilatory nitrate reduction =Nitrate → nitrite ag Nitrogen Cycling N Reduction -K17877 nirA, ferredoxin-nitrite reductase [EC:1.7.7.1] Assimilatory nitrate reduction= Nitrite → ammonium ag Nitrogen Cycling N Reduction -K00366 assimilatory nitrite reductase [EC:1.7.7.1] [RN:R00790] Assimilatory nitrate reduction= Nitrite → ammonium ag Nitrogen Cycling N Reduction -K26139 nasE, nitrite reductase FAD-binding subunit [EC:1.7.1.-] Assimilatory nitrate reduction= Nitrite → ammonium ag Nitrogen Cycling N Reduction -K26138 nasD, nitrite reductase NADH-binding subunit [EC:1.7.1.-] Assimilatory nitrate reduction= Nitrite → ammonium ag Nitrogen Cycling N Reduction -K00361 nirB, NADH-nitrite reductase large subunit [EC:1.7.1.15] Assimilatory nitrate reduction= Nitrite → ammonium ag Nitrogen Cycling N Reduction -K00370 narG, nitrate reductase alpha subunit [EC:1.7.99.-] Dissimilatory nitrate reduction = nitrate → ammonia (via Nar system) ag Nitrogen Cycling N Reduction -K00371 narH, nitrate reductase beta subunit [EC:1.7.99.-] Dissimilatory nitrate reduction = nitrate → ammonia (via Nar system) ag Nitrogen Cycling N Reduction -K00374 narI, nitrate reductase gamma subunit [EC:1.7.99.-] Dissimilatory nitrate reduction = nitrate → ammonia (via Nar system) ag Nitrogen Cycling N Reduction -K02567 napA, periplasmic nitrate reductase catalytic subunit [EC:1.7.99.-] Dissimilatory nitrate reduction = nitrate → ammonia (via Nap system) ag Nitrogen Cycling N Reduction -K02568 napB, cytochrome c-type subunit of periplasmic nitrate reductase Dissimilatory nitrate reduction = nitrate → ammonia (via Nap system) ag Nitrogen Cycling N Reduction -K00362 nrfA, cytochrome c nitrite reductase large subunit [EC:1.7.2.2] Dissimilatory nitrate reduction = nitrite → ammonia (via Nrf complex) ag Nitrogen Cycling N Reduction -K00363 nrfH, cytochrome c nitrite reductase small subunit Dissimilatory nitrate reduction = nitrite → ammonia (via Nrf complex) ag Nitrogen Cycling N Reduction -K03385 nirB, nitrite reductase (NADH) large subunit [EC:1.7.1.15] Dissimilatory nitrate reduction = nitrite → ammonia (via NirBD complex) ag Nitrogen Cycling N Reduction -K15876 nirD, nitrite reductase (NADH) small subunit [EC:1.7.1.15] Dissimilatory nitrate reduction = nitrite → ammonia (via NirBD complex) ag Nitrogen Cycling N Reduction -K28504 ammonia monooxygenase subunit C [EC:1.14.99.39] [RN:R00148] Nitrification = ammonia => hydroxylamine ag Nitrogen Cycling Aerobic Ammonium Oxidation -K28504 ammonia monooxygenase [EC:1.14.99.39] [RN:R00148] Nitrification = ammonia => hydroxylamine ag Nitrogen Cycling Aerobic Ammonium Oxidation -K10945 ammonia monooxygenase [EC:1.14.99.39] [RN:R00148] Nitrification = ammonia => hydroxylamine ag Nitrogen Cycling Aerobic Ammonium Oxidation -K10946 ammonia monooxygenase [EC:1.14.99.39] [RN:R00148] Nitrification = ammonia => hydroxylamine ag Nitrogen Cycling Aerobic Ammonium Oxidation -K10535 hydroxylamine oxidase [EC:1.7.2.6] [RN:R10164] Nitrification= hydroxylamine => nitrite ag Nitrogen Cycling Aerobic Ammonium Oxidation -K15864 nirS; hydroxylamine reductase, anammox Nitrite → nitric oxide ag Nitrogen Cycling Anaerobic Ammonium -K20932 hydrazine synthase subunit [EC:1.7.2.7] Nitric oxide + ammonium → hydrazine (HZS complex) ag Nitrogen Cycling Anaerobic Ammonium -K20935 hydrazine dehydrogenase [EC:1.7.2.8] Hydrazine → dinitrogen gas (N₂) ag Nitrogen Cycling Anaerobic Ammonium -K00368 nirK, nitrite reductase (NO-forming) [EC:1.7.2.1] Nitrite → nitric oxide ag Nitrogen Cycling Anaerobic Ammonium Oxidation -K20933 hzsB, hydrazine synthase subunit B [EC:1.7.2.7] Nitric oxide + ammonium → hydrazine (HZS complex) ag Nitrogen Cycling Anaerobic Ammonium Oxidation -K20934 hzsC, hydrazine synthase subunit C [EC:1.7.2.7] Nitric oxide + ammonium → hydrazine (HZS complex) ag Nitrogen Cycling Anaerobic Ammonium Oxidation -K01428 ureC, urease subunit alpha (largest alpha unit of protein structure) Urea → CO₂ + NH₃ ag Nitrogen Cycling Mineralization -K01429 ureB, urease subunit beta Urea → CO₂ + NH₃ ag Nitrogen Cycling Mineralization -K01430 ureA, urease subunit gamma Urea → CO₂ + NH₃ ag Nitrogen Cycling Mineralization +K00531 nitrogenase delta subunit [EC:1.18.6.1] [RN:R05185] Nitrogen fixation, nitrogen => ammonia ag Nitrogen Cycling N2 Fixation +K02586 nitrogenase molybdenum-iron protein [EC:1.18.6.1] [RN:R05185] Nitrogen fixation, nitrogen => ammonia ag Nitrogen Cycling N2 Fixation +K02588 nitrogenase iron protein [RN:R05185] Nitrogen fixation, nitrogen => ammonia ag Nitrogen Cycling N2 Fixation +K02591 nitrogenase molybdenum-iron protein [EC:1.18.6.1] [RN:R05185] Nitrogen fixation, nitrogen => ammonia ag Nitrogen Cycling N2 Fixation +K22896 vanadium-dependent nitrogenase [EC:1.18.6.2] [RN:R12084] Nitrogen fixation, nitrogen => ammonia ag Nitrogen Cycling N2 Fixation +K22897 vanadium-dependent nitrogenase [EC:1.18.6.2] [RN:R12084] Nitrogen fixation, nitrogen => ammonia ag Nitrogen Cycling N2 Fixation +K22898 vanadium nitrogenase delta subunit [EC:1.18.6.2] [RN:R12084] Nitrogen fixation, nitrogen => ammonia ag Nitrogen Cycling N2 Fixation +K22899 vanadium nitrogenase iron protein [RN:R12084] Nitrogen fixation, nitrogen => ammonia ag Nitrogen Cycling N2 Fixation +K00370 narG, nitrate reductase, alpha subunit [EC:1.7.99.-] [RN:R00798] nitrate → nitrite ag Nitrogen Cycling N Reduction +K00371 narH, nitrate reductase, beta subunit [EC:1.7.99.-] [RN:R00798] nitrate → nitrite ag Nitrogen Cycling N Reduction +K00374 narI, nitrate reductase, gamma subunit [EC:1.7.99.-] [RN:R00798] nitrate → nitrite ag Nitrogen Cycling N Reduction +K02567 periplasmic nitrate reductase NapA [EC:1.7.99.-] [RN:R00798] nitrate → nitrite ag Nitrogen Cycling N Reduction +K02568 cytochrome c-type protein NapB [RN:R00798] nitrate → nitrite ag Nitrogen Cycling N Reduction +K00368 nitrite reductase (NO-forming) [EC:1.7.2.1] [RN:R00783 R00785] nitrite → nitric oxide ag Nitrogen Cycling N Reduction +K15864 nitrite reductase (NO-forming) [EC:1.7.2.1] [RN:R00783 R00785] nitrite → nitric oxide ag Nitrogen Cycling N Reduction +K15877 fungal nitric oxide reductase (CYP55) [EC:1.7.1.14] nitric oxide → nitrous oxide ag Nitrogen Cycling NO to N2O +K04561 nitric oxide reductase [EC:1.7.2.5] [RN:R00294] nitric oxide → nitrous oxide ag Nitrogen Cycling NO to N2O +K00376 nitrous-oxide reductase [EC:1.7.2.4] [RN:R02804] nitrous oxide → nitrogen gas ag Nitrogen Cycling N2O to N2 +K02575 NRT; MFS transporter= NNP family= nitrate/nitrite transporter Nitrate/nitrite assimilation ag Nitrogen Cycling N Reduction +K00367 narB, assimilatory nitrate reductase [EC:1.7.7.2] Assimilatory nitrate reduction =Nitrate → nitrite ag Nitrogen Cycling N Reduction +K10534 nr, assimilatory nitrate reductase [EC:1.7.7.2] Assimilatory nitrate reduction =Nitrate → nitrite ag Nitrogen Cycling N Reduction +K00372 assimilatory nitrate reductase [EC:1.7.99.-] [RN:R00798] Assimilatory nitrate reduction =Nitrate → nitrite ag Nitrogen Cycling N Reduction +K00360 assimilatory nitrate reductase [EC:1.7.99.-] [RN:R00798] Assimilatory nitrate reduction =Nitrate → nitrite ag Nitrogen Cycling N Reduction +K17877 nirA, ferredoxin-nitrite reductase [EC:1.7.7.1] Assimilatory nitrate reduction= Nitrite → ammonium ag Nitrogen Cycling N Reduction +K00366 assimilatory nitrite reductase [EC:1.7.7.1] [RN:R00790] Assimilatory nitrate reduction= Nitrite → ammonium ag Nitrogen Cycling N Reduction +K26139 nasE, nitrite reductase FAD-binding subunit [EC:1.7.1.-] Assimilatory nitrate reduction= Nitrite → ammonium ag Nitrogen Cycling N Reduction +K26138 nasD, nitrite reductase NADH-binding subunit [EC:1.7.1.-] Assimilatory nitrate reduction= Nitrite → ammonium ag Nitrogen Cycling N Reduction +K00361 nirB, NADH-nitrite reductase large subunit [EC:1.7.1.15] Assimilatory nitrate reduction= Nitrite → ammonium ag Nitrogen Cycling N Reduction +K00370 narG, nitrate reductase alpha subunit [EC:1.7.99.-] Dissimilatory nitrate reduction = nitrate → ammonia (via Nar system) ag Nitrogen Cycling N Reduction +K00371 narH, nitrate reductase beta subunit [EC:1.7.99.-] Dissimilatory nitrate reduction = nitrate → ammonia (via Nar system) ag Nitrogen Cycling N Reduction +K00374 narI, nitrate reductase gamma subunit [EC:1.7.99.-] Dissimilatory nitrate reduction = nitrate → ammonia (via Nar system) ag Nitrogen Cycling N Reduction +K02567 napA, periplasmic nitrate reductase catalytic subunit [EC:1.7.99.-] Dissimilatory nitrate reduction = nitrate → ammonia (via Nap system) ag Nitrogen Cycling N Reduction +K02568 napB, cytochrome c-type subunit of periplasmic nitrate reductase Dissimilatory nitrate reduction = nitrate → ammonia (via Nap system) ag Nitrogen Cycling N Reduction +K00362 nrfA, cytochrome c nitrite reductase large subunit [EC:1.7.2.2] Dissimilatory nitrate reduction = nitrite → ammonia (via Nrf complex) ag Nitrogen Cycling N Reduction +K00363 nrfH, cytochrome c nitrite reductase small subunit Dissimilatory nitrate reduction = nitrite → ammonia (via Nrf complex) ag Nitrogen Cycling N Reduction +K03385 nirB, nitrite reductase (NADH) large subunit [EC:1.7.1.15] Dissimilatory nitrate reduction = nitrite → ammonia (via NirBD complex) ag Nitrogen Cycling N Reduction +K15876 nirD, nitrite reductase (NADH) small subunit [EC:1.7.1.15] Dissimilatory nitrate reduction = nitrite → ammonia (via NirBD complex) ag Nitrogen Cycling N Reduction +K28504 ammonia monooxygenase subunit C [EC:1.14.99.39] [RN:R00148] Nitrification = ammonia => hydroxylamine ag Nitrogen Cycling Aerobic Ammonium Oxidation +K28504 ammonia monooxygenase [EC:1.14.99.39] [RN:R00148] Nitrification = ammonia => hydroxylamine ag Nitrogen Cycling Aerobic Ammonium Oxidation +K10945 ammonia monooxygenase [EC:1.14.99.39] [RN:R00148] Nitrification = ammonia => hydroxylamine ag Nitrogen Cycling Aerobic Ammonium Oxidation +K10946 ammonia monooxygenase [EC:1.14.99.39] [RN:R00148] Nitrification = ammonia => hydroxylamine ag Nitrogen Cycling Aerobic Ammonium Oxidation +K10535 hydroxylamine oxidase [EC:1.7.2.6] [RN:R10164] Nitrification= hydroxylamine => nitrite ag Nitrogen Cycling Aerobic Ammonium Oxidation +K15864 nirS; hydroxylamine reductase, anammox Nitrite → nitric oxide ag Nitrogen Cycling Anaerobic Ammonium +K20932 hydrazine synthase subunit [EC:1.7.2.7] Nitric oxide + ammonium → hydrazine (HZS complex) ag Nitrogen Cycling Anaerobic Ammonium +K20935 hydrazine dehydrogenase [EC:1.7.2.8] Hydrazine → dinitrogen gas (N₂) ag Nitrogen Cycling Anaerobic Ammonium +K00368 nirK, nitrite reductase (NO-forming) [EC:1.7.2.1] Nitrite → nitric oxide ag Nitrogen Cycling Anaerobic Ammonium Oxidation +K20933 hzsB, hydrazine synthase subunit B [EC:1.7.2.7] Nitric oxide + ammonium → hydrazine (HZS complex) ag Nitrogen Cycling Anaerobic Ammonium Oxidation +K20934 hzsC, hydrazine synthase subunit C [EC:1.7.2.7] Nitric oxide + ammonium → hydrazine (HZS complex) ag Nitrogen Cycling Anaerobic Ammonium Oxidation +K01428 ureC, urease subunit alpha (largest alpha unit of protein structure) Urea → CO₂ + NH₃ ag Nitrogen Cycling Mineralization +K01429 ureB, urease subunit beta Urea → CO₂ + NH₃ ag Nitrogen Cycling Mineralization +K01430 ureA, urease subunit gamma Urea → CO₂ + NH₃ ag Nitrogen Cycling Mineralization K01426 Amidase, amiE [EC:3.5.1.4] R–CONH₂ → NH₃ + R–COOH ag Nitrogen Cycling Mineralization Ekenler and Tabatabai, "Arylamidase and Amidohydrolases in Soils as Affected by Liming and Tillage Systems." -K01455 Formamidase [EC:3.5.1.49] Formamide → NH₃ + formic acid ag Nitrogen Cycling Mineralization -K18282 CynD, cyanide dihydratase [EC:3.5.5.1] Hydrogen cyanide → formamide → NH₃ ag Nitrogen Cycling Mineralization -K01207   N-acetyl-β-D-glucosaminidase (NAGase) [EC 3.2.1.52] Hydrolyzes chitin oligomers into N-acetylglucosamine monomers ag Nitrogen Cycling Mineralization -K01183 ChiC, chitinase [EC:3.2.1.14] Hydrolyzes β-1,4 linkages in chitin polymers ag Nitrogen Cycling Mineralization -K03791 Putative chitinase Hydrolyzes chitin or chitooligosaccharides ag Nitrogen Cycling Mineralization -K13381 ChiA, chitinase Degrades crystalline chitin into soluble oligomers ag Nitrogen Cycling Mineralization -K20547 ChiB, basic endochitinase B Degrades internal β-1,4 linkages in chitin polymers ag Nitrogen Cycling Mineralization -K17523 Chitinase-like enzyme [EC:3.2.1.14] Additional chitin-degrading hydrolase ag Nitrogen Cycling Mineralization -K17524 Chitinase-like enzyme [EC:3.2.1.14] Additional chitin-degrading hydrolase ag Nitrogen Cycling Mineralization -K17525 Chitinase-like enzyme [EC:3.2.1.14] Additional chitin-degrading hydrolase ag Nitrogen Cycling Mineralization +K01455 Formamidase [EC:3.5.1.49] Formamide → NH₃ + formic acid ag Nitrogen Cycling Mineralization +K18282 CynD, cyanide dihydratase [EC:3.5.5.1] Hydrogen cyanide → formamide → NH₃ ag Nitrogen Cycling Mineralization +K01207   N-acetyl-β-D-glucosaminidase (NAGase) [EC 3.2.1.52] Hydrolyzes chitin oligomers into N-acetylglucosamine monomers ag Nitrogen Cycling Mineralization +K01183 ChiC, chitinase [EC:3.2.1.14] Hydrolyzes β-1,4 linkages in chitin polymers ag Nitrogen Cycling Mineralization +K03791 Putative chitinase Hydrolyzes chitin or chitooligosaccharides ag Nitrogen Cycling Mineralization +K13381 ChiA, chitinase Degrades crystalline chitin into soluble oligomers ag Nitrogen Cycling Mineralization +K20547 ChiB, basic endochitinase B Degrades internal β-1,4 linkages in chitin polymers ag Nitrogen Cycling Mineralization +K17523 Chitinase-like enzyme [EC:3.2.1.14] Additional chitin-degrading hydrolase ag Nitrogen Cycling Mineralization +K17524 Chitinase-like enzyme [EC:3.2.1.14] Additional chitin-degrading hydrolase ag Nitrogen Cycling Mineralization +K17525 Chitinase-like enzyme [EC:3.2.1.14] Additional chitin-degrading hydrolase ag Nitrogen Cycling Mineralization K01150 ednA, deoxyribonuclease I [EC:3.1.21.1] Extracellular nuclease; degrades DNA to release organic N ag Nitrogen Cycling Mineralization Sieradzki et al., "Expression of Macromolecular Organic Nitrogen Degrading Enzymes Identifies Potential Mediators of Soil Organic N Availability to an Annual Grass." -A01 Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic -A02 Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic -A05 Endopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic -A08 Endopeptidase, the bacterial signal peptidase II Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic -A11 Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic -A22 Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic -A24 Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic -A26 Membrane-inserted endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic -A28 Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic -A31 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic -A32 PerP peptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic -A37 Pepstatin-insensitive aspartic endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic -C01 Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C02 Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C10 Bacterial cysteine endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C11 Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C110 Cysteine endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C113 IgdE peptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C13 Asparaginyl endopeptidases and glycosylphosphatidylinositol:protein transamidase Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C14 Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C15 Omega peptidases that release an N-terminal pyroglutamate residue Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C19 Ubiquitinyl hydrolases Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C25 Cysteine endopeptidases from bacteria, notably gingipain R (##C25001##) and gingipain K (##C25002##) Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C26 Omega peptidase gamma-glutamyl hydrolase Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C39 Bacteriocin-processing endopeptidases from bacteria Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C40 Bacterial cell-wall modifying enzymes Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C44 Self-processing precursor of amidophosphoribosyltransferase Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C45 Autolytic endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C46 C-terminal, intein-like domains of the hedgehog proteins, which mediate autolytic cleavage of the proteins Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C47 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C51 Endopeptidases that hydrolyse bacterial cell-wall crosslinking peptides Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C56 PfpI endopeptidase of {Pyrococcus furiosus} Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C59 Cys-dependent Ntn-hydrolases Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C60 Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C66 Bacterial endopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C69 Dipeptidases and aminopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C82 Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C83 Exopeptidases some of which also have transferase activity Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C89 Self-cleaving precursor protein Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -C93 LapG peptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine -G01 Endopeptidases from fungi Extracellular peptidases ag Nitrogen Cycling Mineralization Glutamic -M01 Aminopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M02 Metallo-exopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M03 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M04 Metalloendopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M05 Metalloendopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M06 Metalloendopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M07 Metalloendopeptidase, snapalysin Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M08 Metallo-endopeptidase leishmanolysin and its homologues Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M09 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M10 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M11 A metallo-endopeptidase, gametolysin Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M12 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M13 Metalloendopeptidases restricted to action on substrates smaller than proteins Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M14 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M15 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M16 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M17 Aminopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M18 Metalloaminopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M19 Dipeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M20 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M23 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M24 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M26 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M28 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M30 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M32 Metallocarboxypeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M34 Highly-selective bacterial endopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M35 Fungal metalloendopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M36 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M38 An omega peptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M41 ATP-dependent metalloendopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M42 Metalloaminopeptidases some of which also have acylaminoacylpeptidase activity Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M43 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M44 Metalloendopeptidase from the pox viruses Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M48 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M49 Dipeptidylpeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M50 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M54 Aminopeptidases, sometimes termed archaelysins or archaemetzincins Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M55 Aminopeptidase and a number of uncharacterised putative peptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M56 Membrane-bound bacterial endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M57 Endopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M60 Metalloendopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M61 Aminopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M64 Highly selective metalloendopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M66 A single metallopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M67 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M72 Metallo-endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M73 Metallo-endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M74 Murein endopeptidase MepA Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M75 Metalloendopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M76 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M78 Metallo-endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M79 Specialised endopeptidases that typically cleave a C-terminal tripeptide from an isoprenylated protein Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M81 Metallopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M82 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M84 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M85 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M86 Poly-gamma-glutamyl hydrolases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M88 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M93 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M96 signaling peptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M97 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -M98 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo -N04 Tsh-associated self-cleaving domain Extracellular peptidases ag Nitrogen Cycling Mineralization Asparagine -N10 Extracellular peptidases ag Nitrogen Cycling Mineralization Asparagine -N11 Self-cleaving proteins Extracellular peptidases ag Nitrogen Cycling Mineralization Asparagine -P01 Aminopeptidases and self-processing proteins Extracellular peptidases ag Nitrogen Cycling Mineralization Mixed -S01 Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S06 Serine endopeptidases of bacteria Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S08 Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S09 Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S10 Carboxypeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S11 Serine-type D-Ala-D-Ala carboxypeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S12 Serine-type D-Ala-D-Ala carboxypeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S13 Peptidases that cleave D-Ala bonds, acting either as carboxypeptidases or as atypical 'endopeptidases' Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S14 Endopeptidase Clp and its homologues Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S15 Xaa-Pro dipeptidyl peptidase and its homologues Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S16 Endopeptidases, mostly ATP-dependent Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S24 Two-domain proteins that undergo autolysis, separating the functional domains Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S26 Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S28 Exopeptidases that hydrolyse prolyl bonds, and are known only from eukaryotes Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S33 Exopeptidases that act at the N-terminus of peptides Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S37 Tripeptidyl-peptidase from {Streptomyces} Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S41 Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S45 Self-cleaving precursor proteins of N-terminal nucleophile acylases Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S46 Dipeptidyl-peptidases from bacteria Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S49 Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S50 Polyprotein processing endopeptidases from double-stranded RNA viruses Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S51 Exopeptidases that hydrolyse alpha-aspartyl bonds Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S53 Acid-acting endopeptidases and a tripeptidyl-peptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S54 Membrane-bound serine endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S55 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S59 Autolytic endopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S60 Endopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S66 Bacterial LD-carboxypeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -S73 Serine endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Serine -T01 Extracellular peptidases ag Nitrogen Cycling Mineralization Threonine -T02 N-terminal nucleophile hydrolases Extracellular peptidases ag Nitrogen Cycling Mineralization Threonine -T03 Self-processing proteins that express aminopeptidase as well as aminotransferase activities in their mature forms Extracellular peptidases ag Nitrogen Cycling Mineralization Threonine -T05 Self-processing ornithine acetyltransferase precursor Extracellular peptidases ag Nitrogen Cycling Mineralization Threonine -T07 CwpV (Clostridium difficile) self-cleaving threonine peptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Threonine -U32 Endopeptidases from bacteria Extracellular peptidases ag Nitrogen Cycling Mineralization Unknown -U62 Microcin-processing peptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Unknown -U69 Self-processing peptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Unknown -U72 Isopeptidase and endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Unknown -U73 Extracellular peptidases ag Nitrogen Cycling Mineralization Unknown -U74 neprosin Extracellular peptidases ag Nitrogen Cycling Mineralization Unknown -K01428 ureC, urease subunit alpha (largest aplha unit of protein structure) (EC 3.5.1.5) Urea Degradation ag Nitrogen Cycling Urea Transformation -K01429 ureB, urease subunit beta (EC 3.5.1.5) Urea Degradation ag Nitrogen Cycling Urea Transformation -K01430 ureA, urease subunit gamma (EC 3.5.1.5) Urea Degradation ag Nitrogen Cycling Urea Transformation -K10944 ammonia monooxygenase [EC:1.14.99.39] [RN:R00148] Nitrification= ammonia => nitrite ag Nitrogen Cycling Ammonium Transformation -K10945 ammonia monooxygenase [EC:1.14.99.39] [RN:R00148] Nitrification= ammonia => nitrite ag Nitrogen Cycling Ammonium Transformation -K10946 ammonia monooxygenase [EC:1.14.99.39] [RN:R00148] Nitrification= ammonia => nitrite ag Nitrogen Cycling Ammonium Transformation -K10535 hydroxylamine oxidase [EC:1.7.2.6] [RN:R10164] Nitrification= ammonia => nitrite ag Nitrogen Cycling Ammonium Transformation -K00261 glutamate dehydrogenase, gdhA alpha-ketoglutarate + NH3 -> glutamate ag Nitrogen Cycling Assimilation Addtion/Retention -K01915 glutamine synthetase glnA, [EC: 6.3.1.2] NH3 + glutamate -> Glutamine; GS pathway ag Nitrogen Cycling Addtion/Retention Addtion/Retention -K00982 glnE; regulator regulator of GS, up or down based on N abundnace ag Nitrogen Cycling Addtion/Retention Addtion/Retention -K00266 gltD; subunit GOGAT pathway ag Nitrogen Cycling Addtion/Retention Addtion/Retention -K19338 Nac protein; N assimilation regulator gltBDF repressor ag Nitrogen Cycling Addtion/Retention Addtion/Retention -K01914 asnA Asparagine synthase A ammonium dependent; expression is repressed under N-limiting conditions ag Nitrogen Cycling Addtion/Retention Addtion/Retention -K01953 asnB Asparagine synthase B glutamine dependent ag Nitrogen Cycling Addtion/Retention Addtion/Retention -K01916  efg (nadE), ammonium-dependent NAD synthetase ag Nitrogen Cycling Addtion/Retention Addtion/Retention -K01956  carA, subunit of carbamoyl phosphate synthetase Carbamoyl phosphate syntheized from bicarbonate, ATP, and glutamine ag Nitrogen Cycling Addtion/Retention Addtion/Retention -K01955 carB, subunit of carbamoyl phosphate synthetase Carbamoyl phosphate syntheized from bicarbonate, ATP, and glutamine ag Nitrogen Cycling Addtion/Retention Addtion/Retention -K03320 amtB, ammonia transporter transmembrane transporter and extracellular NH4+ sensor; expressed in low NH4+ ag Nitrogen Cycling Addtion/Retention -K00370 nxrA, nitrite oxidoreductase, alpha subunit [EC:1.7.99.4] [RN:R00798] nitrite => nitrate ag Nitrogen Cycling Aerobic Nitrate -K00371 nxrB, nitrite oxidoreductase, beta subunit [EC:1.7.99.4] [RN:R00798] nitrite => nitrate ag Nitrogen Cycling Aerobic Nitrate +A01 Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic +A02 Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic +A05 Endopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic +A08 Endopeptidase, the bacterial signal peptidase II Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic +A11 Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic +A22 Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic +A24 Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic +A26 Membrane-inserted endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic +A28 Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic +A31 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic +A32 PerP peptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic +A37 Pepstatin-insensitive aspartic endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Aspartic +C01 Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C02 Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C10 Bacterial cysteine endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C11 Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C110 Cysteine endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C113 IgdE peptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C13 Asparaginyl endopeptidases and glycosylphosphatidylinositol:protein transamidase Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C14 Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C15 Omega peptidases that release an N-terminal pyroglutamate residue Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C19 Ubiquitinyl hydrolases Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C25 Cysteine endopeptidases from bacteria, notably gingipain R (##C25001##) and gingipain K (##C25002##) Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C26 Omega peptidase gamma-glutamyl hydrolase Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C39 Bacteriocin-processing endopeptidases from bacteria Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C40 Bacterial cell-wall modifying enzymes Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C44 Self-processing precursor of amidophosphoribosyltransferase Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C45 Autolytic endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C46 C-terminal, intein-like domains of the hedgehog proteins, which mediate autolytic cleavage of the proteins Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C47 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C51 Endopeptidases that hydrolyse bacterial cell-wall crosslinking peptides Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C56 PfpI endopeptidase of {Pyrococcus furiosus} Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C59 Cys-dependent Ntn-hydrolases Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C60 Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C66 Bacterial endopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C69 Dipeptidases and aminopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C82 Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C83 Exopeptidases some of which also have transferase activity Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C89 Self-cleaving precursor protein Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +C93 LapG peptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Cysteine +G01 Endopeptidases from fungi Extracellular peptidases ag Nitrogen Cycling Mineralization Glutamic +M01 Aminopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M02 Metallo-exopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M03 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M04 Metalloendopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M05 Metalloendopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M06 Metalloendopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M07 Metalloendopeptidase, snapalysin Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M08 Metallo-endopeptidase leishmanolysin and its homologues Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M09 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M10 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M11 A metallo-endopeptidase, gametolysin Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M12 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M13 Metalloendopeptidases restricted to action on substrates smaller than proteins Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M14 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M15 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M16 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M17 Aminopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M18 Metalloaminopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M19 Dipeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M20 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M23 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M24 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M26 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M28 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M30 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M32 Metallocarboxypeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M34 Highly-selective bacterial endopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M35 Fungal metalloendopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M36 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M38 An omega peptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M41 ATP-dependent metalloendopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M42 Metalloaminopeptidases some of which also have acylaminoacylpeptidase activity Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M43 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M44 Metalloendopeptidase from the pox viruses Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M48 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M49 Dipeptidylpeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M50 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M54 Aminopeptidases, sometimes termed archaelysins or archaemetzincins Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M55 Aminopeptidase and a number of uncharacterised putative peptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M56 Membrane-bound bacterial endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M57 Endopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M60 Metalloendopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M61 Aminopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M64 Highly selective metalloendopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M66 A single metallopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M67 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M72 Metallo-endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M73 Metallo-endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M74 Murein endopeptidase MepA Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M75 Metalloendopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M76 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M78 Metallo-endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M79 Specialised endopeptidases that typically cleave a C-terminal tripeptide from an isoprenylated protein Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M81 Metallopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M82 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M84 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M85 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M86 Poly-gamma-glutamyl hydrolases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M88 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M93 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M96 signaling peptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M97 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +M98 Extracellular peptidases ag Nitrogen Cycling Mineralization Metallo +N04 Tsh-associated self-cleaving domain Extracellular peptidases ag Nitrogen Cycling Mineralization Asparagine +N10 Extracellular peptidases ag Nitrogen Cycling Mineralization Asparagine +N11 Self-cleaving proteins Extracellular peptidases ag Nitrogen Cycling Mineralization Asparagine +P01 Aminopeptidases and self-processing proteins Extracellular peptidases ag Nitrogen Cycling Mineralization Mixed +S01 Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S06 Serine endopeptidases of bacteria Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S08 Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S09 Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S10 Carboxypeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S11 Serine-type D-Ala-D-Ala carboxypeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S12 Serine-type D-Ala-D-Ala carboxypeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S13 Peptidases that cleave D-Ala bonds, acting either as carboxypeptidases or as atypical 'endopeptidases' Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S14 Endopeptidase Clp and its homologues Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S15 Xaa-Pro dipeptidyl peptidase and its homologues Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S16 Endopeptidases, mostly ATP-dependent Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S24 Two-domain proteins that undergo autolysis, separating the functional domains Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S26 Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S28 Exopeptidases that hydrolyse prolyl bonds, and are known only from eukaryotes Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S33 Exopeptidases that act at the N-terminus of peptides Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S37 Tripeptidyl-peptidase from {Streptomyces} Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S41 Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S45 Self-cleaving precursor proteins of N-terminal nucleophile acylases Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S46 Dipeptidyl-peptidases from bacteria Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S49 Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S50 Polyprotein processing endopeptidases from double-stranded RNA viruses Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S51 Exopeptidases that hydrolyse alpha-aspartyl bonds Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S53 Acid-acting endopeptidases and a tripeptidyl-peptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S54 Membrane-bound serine endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S55 Endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S59 Autolytic endopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S60 Endopeptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S66 Bacterial LD-carboxypeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +S73 Serine endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Serine +T01 Extracellular peptidases ag Nitrogen Cycling Mineralization Threonine +T02 N-terminal nucleophile hydrolases Extracellular peptidases ag Nitrogen Cycling Mineralization Threonine +T03 Self-processing proteins that express aminopeptidase as well as aminotransferase activities in their mature forms Extracellular peptidases ag Nitrogen Cycling Mineralization Threonine +T05 Self-processing ornithine acetyltransferase precursor Extracellular peptidases ag Nitrogen Cycling Mineralization Threonine +T07 CwpV (Clostridium difficile) self-cleaving threonine peptidase Extracellular peptidases ag Nitrogen Cycling Mineralization Threonine +U32 Endopeptidases from bacteria Extracellular peptidases ag Nitrogen Cycling Mineralization Unknown +U62 Microcin-processing peptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Unknown +U69 Self-processing peptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Unknown +U72 Isopeptidase and endopeptidases Extracellular peptidases ag Nitrogen Cycling Mineralization Unknown +U73 Extracellular peptidases ag Nitrogen Cycling Mineralization Unknown +U74 neprosin Extracellular peptidases ag Nitrogen Cycling Mineralization Unknown +K01428 ureC, urease subunit alpha (largest aplha unit of protein structure) (EC 3.5.1.5) Urea Degradation ag Nitrogen Cycling Urea Transformation +K01429 ureB, urease subunit beta (EC 3.5.1.5) Urea Degradation ag Nitrogen Cycling Urea Transformation +K01430 ureA, urease subunit gamma (EC 3.5.1.5) Urea Degradation ag Nitrogen Cycling Urea Transformation +K10944 ammonia monooxygenase [EC:1.14.99.39] [RN:R00148] Nitrification= ammonia => nitrite ag Nitrogen Cycling Ammonium Transformation +K10945 ammonia monooxygenase [EC:1.14.99.39] [RN:R00148] Nitrification= ammonia => nitrite ag Nitrogen Cycling Ammonium Transformation +K10946 ammonia monooxygenase [EC:1.14.99.39] [RN:R00148] Nitrification= ammonia => nitrite ag Nitrogen Cycling Ammonium Transformation +K10535 hydroxylamine oxidase [EC:1.7.2.6] [RN:R10164] Nitrification= ammonia => nitrite ag Nitrogen Cycling Ammonium Transformation +K00261 glutamate dehydrogenase, gdhA alpha-ketoglutarate + NH3 -> glutamate ag Nitrogen Cycling Assimilation Addtion/Retention +K01915 glutamine synthetase glnA, [EC: 6.3.1.2] NH3 + glutamate -> Glutamine; GS pathway ag Nitrogen Cycling Addtion/Retention Addtion/Retention +K00982 glnE; regulator regulator of GS, up or down based on N abundnace ag Nitrogen Cycling Addtion/Retention Addtion/Retention +K00266 gltD; subunit GOGAT pathway ag Nitrogen Cycling Addtion/Retention Addtion/Retention +K19338 Nac protein; N assimilation regulator gltBDF repressor ag Nitrogen Cycling Addtion/Retention Addtion/Retention +K01914 asnA Asparagine synthase A ammonium dependent; expression is repressed under N-limiting conditions ag Nitrogen Cycling Addtion/Retention Addtion/Retention +K01953 asnB Asparagine synthase B glutamine dependent ag Nitrogen Cycling Addtion/Retention Addtion/Retention +K01916  efg (nadE), ammonium-dependent NAD synthetase ag Nitrogen Cycling Addtion/Retention Addtion/Retention +K01956  carA, subunit of carbamoyl phosphate synthetase Carbamoyl phosphate syntheized from bicarbonate, ATP, and glutamine ag Nitrogen Cycling Addtion/Retention Addtion/Retention +K01955 carB, subunit of carbamoyl phosphate synthetase Carbamoyl phosphate syntheized from bicarbonate, ATP, and glutamine ag Nitrogen Cycling Addtion/Retention Addtion/Retention +K03320 amtB, ammonia transporter transmembrane transporter and extracellular NH4+ sensor; expressed in low NH4+ ag Nitrogen Cycling Addtion/Retention +K00370 nxrA, nitrite oxidoreductase, alpha subunit [EC:1.7.99.4] [RN:R00798] nitrite => nitrate ag Nitrogen Cycling Aerobic Nitrate +K00371 nxrB, nitrite oxidoreductase, beta subunit [EC:1.7.99.4] [RN:R00798] nitrite => nitrate ag Nitrogen Cycling Aerobic Nitrate K07093 phoX, Alkaline phosphatase X ag Other Nutrients Siles et al., ìDistribution of Phosphorus Cycling Genes across Land Uses and Microbial Taxonomic Groups Based on Metagenome and Genome Mining.î K09474 phoN, Acid phosphatase class A ag Other Nutrients Siles et al., ìDistribution of Phosphorus Cycling Genes across Land Uses and Microbial Taxonomic Groups Based on Metagenome and Genome Mining.î K03788 aphA, Acid phosphatase class B ag Other Nutrients Siles et al., ìDistribution of Phosphorus Cycling Genes across Land Uses and Microbial Taxonomic Groups Based on Metagenome and Genome Mining.î @@ -243,518 +243,518 @@ K06163 phnJ, CñP lyase multienzyme complex ag Other Nutrients Siles et al., K05781 phnK, CñP lyase multienzyme complex ag Other Nutrients Siles et al., ìDistribution of Phosphorus Cycling Genes across Land Uses and Microbial Taxonomic Groups Based on Metagenome and Genome Mining.î K05780 phnL, CñP lyase multienzyme complex ag Other Nutrients Siles et al., ìDistribution of Phosphorus Cycling Genes across Land Uses and Microbial Taxonomic Groups Based on Metagenome and Genome Mining.î K06162 phnM, CñP lyase multienzyme complex ag Other Nutrients Siles et al., ìDistribution of Phosphorus Cycling Genes across Land Uses and Microbial Taxonomic Groups Based on Metagenome and Genome Mining.î -K04103 ipdC [EC:4.1.1.74] Indole-3-pyruvate → IAA ag Rhizosphere Transformations Auxin (IAA) -K00466 iaaM [EC:1.13.12.3] Tryptophan → IAM → IAA ag Rhizosphere Transformations Auxin (IAA) -K21801  iaaH [EC:3.5.1.4] Tryptophan → IAM → IAA ag Rhizosphere Transformations Auxin (IAA) -K01426 amiE [EC:3.5.1.4] IAM → IAA ag Rhizosphere Transformations Auxin (IAA) -K03397 iaaL [EC:6.3.2.20] Conjugates IAA → IAA-Lys (inactivation) ag Rhizosphere Transformations Auxin (IAA) -K10760 ipt [EC:2.5.1.112] Isopentenyl-AMP → cytokinins ag Rhizosphere Transformations Cytokinins -K00279 ckx [EC:1.5.99.12] Cytokinin degradation ag Rhizosphere Transformations Cytokinins -K04121 ks [EC:4.2.3.19] ent-kaurene synthase (ent-copalyl diphosphate → ent-kaurene; early GA biosynthesis) ag Rhizosphere Transformations Gibberellins -K20657  cps/ks [EC:5.5.1.13] ent-copalyl diphosphate / ent-kaurene synthase (bifunctional) ag Rhizosphere Transformations Gibberellins -K27636 cps/ks [EC:4.2.3.19] ent-copalyl diphosphate / ent-kaurene / ent-beyerene synthase ag Rhizosphere Transformations Gibberellins -K21719  cyp701A [EC:1.14.14.86] ent-Kaurene → GA intermediates ag Rhizosphere Transformations Gibberellins -K04123    cyp88A [EC:1.14.13.79] ent-Kaurenoic acid → GA12 ag Rhizosphere Transformations Gibberellins -K01505 acdS [EC:3.5.99.7] ACC → α-ketobutyrate + NH3 ag Rhizosphere Transformations ACC Deaminase -K21815  efe [EC:1.13.12.19] L-arginine → ethylene ag Rhizosphere Transformations AA Derivatives -K09840 abaA-like [EC:1.13.11.51] Mevalonate pathway → ABA ag Rhizosphere Transformations AA Derivatives -K09843 cyp707A-like [EC:1.14.13.93] ABA → phaseic acid ag Rhizosphere Transformations AA Derivatives -K01851 pchA [EC:5.4.4.2] Chorismate → salicylic acid ag Rhizosphere Transformations Phenolics -K04781 pchB [EC:4.2.99.21] Chorismate → salicylic acid ag Rhizosphere Transformations Phenolics -K00480 nahG [EC:1.14.13.1] Salicylic acid → catechol ag Rhizosphere Transformations Phenolics -K00454 lox [EC:1.13.11.12] Linolenic acid → hydroperoxides ag Rhizosphere Transformations AA Derivatives -K01723  aos [EC:4.2.1.92] Hydroperoxides → OPDA ag Rhizosphere Transformations AA Derivatives -K09591 det2-like [EC:1.3.1.-] Steroid metabolism → brassinolide-like compounds ag Rhizosphere Transformations AA Derivatives -K09587  dwrf [EC:1.14.-.-] Steroid metabolism → brassinolide-like compounds ag Rhizosphere Transformations AA Derivatives -K22944   cyaA [EC:4.6.1.1] ATP → cAMP (adenylate cyclase) ag Rhizosphere Transformations Nucleotides/Sides -K01769 gya [EC:4.6.1.2] GTP → cGMP (guanylate cyclase ag Rhizosphere Transformations Nucleotides/Sides -K00108 betA; choline dehydrogenase (EC 1.1.99.1) Glycine betaine biosynthesis from choline ag Stressors Methyl-related Compatible Solutes -K00130 betB; betaine-aldehyde dehydrogenase (EC 1.2.1.8) Glycine betaine biosynthesis from betaine-aldehyde ag Stressors Methyl-related Compatible Solutes -K02000 proV; glycine-betaine/proline transport system ATP-binding protein Glycine betaine/proline transport ag Stressors Methyl-related Compatible Solutes -K02001 proW; glycine-betaine/proline transport system permease protein Glycine betaine/proline transport ag Stressors Methyl-related Compatible Solutes -K02002 proX; glycine-betaine/proline transport system substrate-binding protein Glycine betaine/proline transport ag Stressors Methyl-related Compatible Solutes -K02168 betP; choline/glycine/proline betaine transport protein Glycine betaine/choline/proline transport ag Stressors Methyl-related Compatible Solutes -K03451 betT/BCCT; choline/carnitine/betaine/glycine transporter Choline/betaine transport (BCCT family) ag Stressors Methyl-related Compatible Solutes -K03607 proQ; ProP effector (proline/betaine regulation) Regulation of proline/betaine transport (ProP system) ag Stressors Methyl-related Compatible Solutes -K03762 proP; MFS transporter for proline/betaine Proline/betaine transport (ProP system) ag Stressors Methyl-related Compatible Solutes -K05020 opuD; glycine-betaine transporter Glycine betaine uptake ag Stressors Methyl-related Compatible Solutes -K05245 caiT; L-carnitine/gamma-butyrobetaine antiporter L-carnitine transport (osmoprotectant role) ag Stressors Methyl-related Compatible Solutes -K05845 opuC; osmoprotectant transport system substrate-binding protein Osmoprotectant transport (OpuC system) ag Stressors Methyl-related Compatible Solutes -K05846 opuBD; osmoprotectant transport system permease protein Osmoprotectant transport (OpuC system) ag Stressors Methyl-related Compatible Solutes -K05847 opuA; osmoprotectant transport system ATP-binding protein Osmoprotectant transport (OpuC system) ag Stressors Methyl-related Compatible Solutes -K10036 glnH; glutamine transport system substrate-binding protein Glutamine transport (osmotic adjustment role) ag Stressors Methyl-related Compatible Solutes -K10037 glnP; glutamine transport system permease protein Glutamine transport (osmotic adjustment role) ag Stressors Methyl-related Compatible Solutes -K10038 glnQ; glutamine transport system ATP-binding protein Glutamine transport (osmotic adjustment role) ag Stressors Methyl-related Compatible Solutes -K11440 betA; choline dehydrogenase (alternate) Glycine betaine biosynthesis from choline ag Stressors Methyl-related Compatible Solutes -K18896 gsmT; glycine/sarcosine N-methyltransferase Glycine → sarcosine → dimethylglycine synthesis ag Stressors Methyl-related Compatible Solutes -K18897 dmt; sarcosine/dimethylglycine N-methyltransferase Dimethylglycine → betaine synthesis ag Stressors Methyl-related Compatible Solutes -K00697 otsA (EC 2.4.1.15) Trehalose biosynthesis ag Stressors Sugar Compatible Solutes (Trehalose) -K01087 otsB (EC 3.1.3.12) Trehalose biosynthesis ag Stressors Sugar Compatible Solutes (Trehalose) -K01236 treZ (EC 3.2.1.141) Trehalose biosynthesis ag Stressors Sugar Compatible Solutes (Trehalose) -K06044 treY (EC 5.4.99.15) Trehalose biosynthesis ag Stressors Sugar Compatible Solutes (Trehalose) -K05342 treP (EC 2.4.1.64) Trehalose metabolism ag Stressors Sugar Compatible Solutes (Trehalose) -K05343 treS (EC 5.4.99.16) Trehalose metabolism ag Stressors Sugar Compatible Solutes (Trehalose) -K00009 mtlD (EC 1.1.1.17) Mannitol biosynthesis ag Stressors Sugar Compatible Solutes (Mannitol) -K02798 mtlA Mannitol transport ag Stressors Sugar Compatible Solutes (Mannitol) -K05947 mpgS (EC 2.4.1.217) Mannosyl-3-phosphoglycerate biosynthesis ag Stressors Sugar Compatible Solutes (Mannosyl glycerate) -K17314 treV Trehalose transport ag Stressors Sugar Compatible Solutes (Trehalose) -K02781 srlA; sorbitol transporter subunit II A Sorbitol transport ag Stressors Sugar Compatible Solutes (Sorbitol) -K02782 srlB; sorbitol transporter subunit II B Sorbitol transport ag Stressors Sugar Compatible Solutes (Sorbitol) -K02783 srlE; sorbitol transporter subunit II E Sorbitol transport ag Stressors Sugar Compatible Solutes (Sorbitol) -K10109 malF; maltose transport system permease protein Maltose transport ag Stressors Sugar Compatible Solutes (Maltose) -K10110 malG; maltose transport system permease protein Maltose transport ag Stressors Sugar Compatible Solutes (Maltose) -K10111 malK; maltose/maltodextrin transport system ATP-binding protein Maltose transport ag Stressors Sugar Compatible Solutes (Maltose) -K10227 smoE; sorbitol/mannitol transport system substrate-binding protein Sorbitol/mannitol transport ag Stressors Sugar Compatible Solutes (Sorbitol / Mannitol) -K10228 smoF; sorbitol/mannitol transport system permease protein Sorbitol/mannitol transport ag Stressors Sugar Compatible Solutes (Sorbitol / Mannitol) -K10229 sorbitol/mannitol transport system permease protein Sorbitol/mannitol transport ag Stressors Sugar Compatible Solutes (Sorbitol / Mannitol) -K10230 sorbitol/mannitol transport system ATP-binding protein Sorbitol/mannitol transport ag Stressors Sugar Compatible Solutes (Sorbitol / Mannitol) -K03782 katG [EC:1.11.1.21] Catalase–peroxidase ag Stressors -K04564 sodA [EC:1.15.1.1] Superoxide dismutase (Mn-dependent) ag Stressors -K04565 sodB [EC:1.15.1.1] Superoxide dismutase (Fe-dependent) ag Stressors -K01920 gshA [EC:6.3.2.2] Glutamate–cysteine ligase (first step in glutathione biosynthesis) ag Stressors -K01921 gshB [EC:6.3.2.3] Glutathione synthase (second step in glutathione biosynthesis) ag Stressors -K05909 mco [EC:1.10.3.2] Multicopper oxidase (laccase; oxidizes phenolics, triazines, and aromatics) ag Stressors -K00421 lcc [EC:1.10.3.2] Laccase (multicopper oxidase; lignin and aromatic oxidation) ag Stressors -K05910 npr [EC:1.11.1.1] NADH peroxidase (reduces hydrogen peroxide via NADH) ag Stressors -K00431 lip [EC:1.11.1.14] Lignin peroxidase (oxidizes lignin and aromatic compounds via H₂O₂) ag Stressors -K00799 gst [EC:2.5.1.18] Glutathione S-transferase (conjugates glutathione to xenobiotics for detoxification) ag Stressors -K00697 otsA [EC:2.4.1.15] Trehalose-6-phosphate synthase (trehalose biosynthesis) ag Stressors -K01087 otsB [EC:3.1.3.12] Trehalose-6-phosphate phosphatase (trehalose biosynthesis) ag Stressors -K00147 proA [EC:1.2.1.41] γ-Glutamyl phosphate reductase (proline biosynthesis) ag Stressors -K00931 proB [EC:2.7.2.11] Glutamate 5-kinase (proline biosynthesis) ag Stressors -K00286 proC [EC:1.5.1.2] Pyrroline-5-carboxylate reductase (proline biosynthesis) ag Stressors -K00006 gpd1 [EC:1.1.1.8] Glycerol-3-phosphate dehydrogenase (NAD⁺-dependent) ag Stressors -K00111 gpd2 [EC:1.1.5.3] Glycerol-3-phosphate dehydrogenase (quinone-dependent) ag Stressors -K00108 betA [EC:1.1.99.1] Choline dehydrogenase (glycine betaine biosynthesis) ag Stressors -K00130 betB [EC:1.2.1.8] Betaine aldehyde dehydrogenase (glycine betaine biosynthesis) ag Stressors -K16566 exoY Exopolysaccharide production protein ExoY (succinoglycan) ag Stressors Exopolysaccharide Production -K16557 exoA Succinoglycan biosynthesis glycosyltransferase ag Stressors Exopolysaccharide Production -K16556 exoM Succinoglycan biosynthesis mannosyltransferase ag Stressors Exopolysaccharide Production -K16555 exoO Succinoglycan biosynthesis protein ag Stressors Exopolysaccharide Production -K19290 alg8 Mannuronan synthase (alginate biosynthesis) ag Stressors Exopolysaccharide Production -K19291 alg44 Mannuronan polymer co-polymerase (alginate biosynthesis) ag Stressors Exopolysaccharide Production -K19293 algX Alginate biosynthesis protein ag Stressors Exopolysaccharide Production -K19295 algJ Alginate O-acetyltransferase complex protein ag Stressors Exopolysaccharide Production -K20997 pslA Psl polysaccharide biosynthesis protein ag Stressors Exopolysaccharide Production -K21001 pslH Psl polysaccharide biosynthesis protein ag Stressors Exopolysaccharide Production -K21154 pssM Exopolysaccharide glucosyl ketal-pyruvate-transferase ag Stressors Exopolysaccharide Production -K25902 pssA Acidic exopolysaccharide biosynthesis protein ag Stressors Exopolysaccharide Production -K25904 pssE Exopolysaccharide biosynthesis glucuronosyltransferase ag Stressors Exopolysaccharide Production -K25906 pssS Exopolysaccharide biosynthesis glucosyltransferase ag Stressors Exopolysaccharide Production -K19290 alg8 Mannuronan synthase (alginate biosynthesis) ag Stressors Biofilm Formation -K19291 alg44 Mannuronan co-polymerase (alginate biosynthesis) ag Stressors Biofilm Formation -K19293 algX Alginate biosynthesis protein AlgX ag Stressors Biofilm Formation -K19294 algI Alginate O-acetyltransferase complex protein AlgI ag Stressors Biofilm Formation -K19295 algJ Alginate O-acetyltransferase complex protein AlgJ ag Stressors Biofilm Formation -K19296 algF Alginate O-acetyltransferase complex protein AlgF ag Stressors Biofilm Formation -K11936 pgaC / icaA Poly-β-1,6-N-acetyl-D-glucosamine synthase (PGA/ICA matrix) ag Stressors Biofilm Formation -K11937 pgaD Biofilm PGA synthesis protein ag Stressors Biofilm Formation -K21001 pslH Psl polysaccharide biosynthesis protein ag Stressors Biofilm Formation -K20997 pslA Psl polysaccharide biosynthesis protein ag Stressors Biofilm Formation -K25205 pslC Psl polysaccharide biosynthesis protein ag Stressors Biofilm Formation -K21461 icaD Poly-β-1,6-N-acetyl-D-glucosamine synthesis protein ag Stressors Biofilm Formation -K01045 opd/mpd/pah/ophC2 [EC:3.1.8.1] Carbamates ag Stressors Pesticides -K14449 mcd [EC:3.1.1.88] Carbamates ag Stressors Pesticides -K25604 cehA [EC:3.5.1.137] Triazines ag Stressors Pesticides -K05394  atzA [EC:3.8.1.8] Triazines ag Stressors Pesticides -K03382 atzB [EC:3.5.99.3] Triazines ag Stressors Pesticides -K08710 atzC [EC:3.5.99.4] Triazines ag Stressors Pesticides -K05394 trzN [EC:3.8.1.8] Organochlorines ag Stressors Pesticides -K15236  linA [EC:4.5.1.-] Organochlorines ag Stressors Pesticides -K01563 linB [EC:3.8.1.5] Organochlorines ag Stressors Pesticides -K15237 "linC [EC:1.3.1.-] " Phenoxy herbicides ag Stressors Pesticides -K06912 tfdA [EC:1.14.11.-] Phenoxy herbicides ag Stressors Pesticides -K08719 tfdB [EC:1.14.13.2] Pyrethroids ag Stressors Pesticides -K08722 tfdF [EC:5.5.1.5] Pyrethroids ag Stressors Pesticides -K20992 pytH [EC:3.1.1.-] Pyrethroids ag Stressors Pesticides -K20993 estP [EC:3.1.1.88] Glyphosate ag Stressors Pesticides -K17842 gox [EC:1.13.11.59] Glyphosate ag Stressors Pesticides -K23996 phnY [EC:1.14.11.71] Methylphosphonate hydroxylase (oxidizes methylphosphonate to phosphate intermediates) ag Stressors Pesticides -K06164 phnI [EC:2.7.8.37] Alpha-D-ribose-1-methylphosphonate-5-triphosphate synthase subunit (C–P lyase complex) ag Stressors Pesticides -K06165 phnH [EC:2.7.8.37] Alpha-D-ribose-1-methylphosphonate-5-triphosphate synthase subunit (C–P lyase complex) ag Stressors Pesticides -K06166 phnG [EC:2.7.8.37] Alpha-D-ribose-1-methylphosphonate-5-triphosphate synthase subunit (C–P lyase complex) ag Stressors Pesticides -K05780 phnL [EC:2.7.8.37] Alpha-D-ribose-1-methylphosphonate-5-triphosphate synthase subunit (C–P lyase complex) ag Stressors Pesticides -K06162 phnM [EC:3.6.1.63] Alpha-D-ribose-1-methylphosphonate-5-triphosphate diphosphatase (hydrolyzes phosphonate intermediates) ag Stressors Pesticides -K06163 phnJ [EC:4.7.1.1] C–P lyase catalytic subunit (cleaves C–P bond in phosphonates including glyphosate) ag Stressors Pesticides -K06167 phnP [EC:3.1.4.55] Phosphoribosyl-1,2-cyclic phosphate phosphodiesterase (final phosphonate degradation step) ag Stressors Pesticides -K01560  Haloacid dehalogenases [EC:3.8.1.2] Broad (various pesticides) ag Stressors Pesticides -K03930 estA [EC:3.1.1.1] Carboxylesterase (broad-spectrum hydrolase acting on xenobiotic organoesters and pesticides) ag Stressors Pesticides -K00163 pyruvate dehydrogenase E1 component [EC:1.2.4.1] pyruvate → acetyl-CoA v1 ag Carbon Processing SCFA and alcohol conversions -K00174 2-oxoglutarate/2-oxoacid ferredoxin oxidoreductase subunit alpha [EC:1.2.7.3, 1.2.7.11] pyruvate → acetyl-CoA v2 ag Carbon Processing SCFA and alcohol conversions -K00656 formate C-acetyltransferase [EC:2.3.1.54] pyruvate → acetyl-CoA + formate v3 ag Carbon Processing SCFA and alcohol conversions -K00625 phosphate acetyltransferase [EC:2.3.1.8] [RN:R00230] acetate, pt 1 ag Carbon Processing SCFA and alcohol conversions -K00925 acetate kinase [EC:2.7.2.1] [RN:R00315] acetate, pt 1 ag Carbon Processing SCFA and alcohol conversions -K01905 acetate-CoA ligase (ADP-forming) subunit alpha acetate, pt 2 ag Carbon Processing SCFA and alcohol conversions -K01067 acetyl-CoA hydrolase [EC:3.1.2.1] acetate, pt 3 ag Carbon Processing SCFA and alcohol conversions -K00016 L-lactate dehydrogenase [EC:1.1.1.27] lactate (L) ag Carbon Processing SCFA and alcohol conversions -K00101 L-lactate dehydrogenase (cytochrome) [EC:1.1.2.3] lactate (L) ag Carbon Processing SCFA and alcohol conversions -K03778 D-lactate dehydrogenase [EC:1.1.1.28] lactate (D) ag Carbon Processing SCFA and alcohol conversions -K03777 D-lactate dehydrogenase (quinone/cytochrome variants) [EC:1.1.5.12, EC:1.1.2.4] lactate (D) ag Carbon Processing SCFA and alcohol conversions -K00634 phosphate butyryltransferase [EC:2.3.1.19] butyrate, pt 1 ag Carbon Processing SCFA and alcohol conversions -K00929 butyrate kinase [EC:2.7.2.7] butyrate, pt 2 ag Carbon Processing SCFA and alcohol conversions -K01896 medium-chain acyl-CoA synthetase [EC:6.2.1.2] butyrate, pt 2 ag Carbon Processing SCFA and alcohol conversions -K19697 propionate kinase [EC:2.7.2.15] propionate, pt 1 ag Carbon Processing SCFA and alcohol conversions -K01026 propionate CoA-transferase [EC:2.8.3.1] propionate, pt 2 ag Carbon Processing SCFA and alcohol conversions -K00001 alcohol dehydrogenase [EC:1.1.1.1] alcohol production ag Carbon Processing SCFA and alcohol conversions -K00121 alcohol dehydrogenase [EC:1.1.1.1] alcohol production ag Carbon Processing SCFA and alcohol conversions -K04072 alcohol dehydrogenase [EC:1.1.1.1] alcohol production ag Carbon Processing SCFA and alcohol conversions -K13951 alcohol dehydrogenase [EC:1.1.1.1] alcohol production ag Carbon Processing SCFA and alcohol conversions -K13952 alcohol dehydrogenase [EC:1.1.1.1] alcohol production ag Carbon Processing SCFA and alcohol conversions -K13953 alcohol dehydrogenase [EC:1.1.1.1] alcohol production ag Carbon Processing SCFA and alcohol conversions -K13954 alcohol dehydrogenase [EC:1.1.1.1] alcohol production ag Carbon Processing SCFA and alcohol conversions -K13980 alcohol dehydrogenase [EC:1.1.1.1] alcohol production ag Carbon Processing SCFA and alcohol conversions -K18857 alcohol dehydrogenase [EC:1.1.1.1] alcohol production ag Carbon Processing SCFA and alcohol conversions -K00192 cdhA; anaerobic carbon-monoxide dehydrogenase, CODH/ACS complex subunit alpha [EC:1.2.7.4] [RN:R07157] Acetyl-CoA pathway, CO2 => acetyl-CoA ag Carbon Processing CO2 Fixation -K00195 cdhB; anaerobic carbon-monoxide dehydrogenase, CODH/ACS complex subunit epsilon [RN:R07157] Acetyl-CoA pathway, CO2 => acetyl-CoA ag Carbon Processing CO2 Fixation -K00193 cdhC; acetyl-CoA decarbonylase/synthase, CODH/ACS complex subunit beta [EC:2.3.1.169] [RN:R09096 R10219] Acetyl-CoA pathway, CO2 => acetyl-CoA ag Carbon Processing CO2 Fixation -K00197 cdhE; acetyl-CoA decarbonylase/synthase, CODH/ACS complex subunit gamma [EC:2.1.1.245] [RN:R09096 R10219] Acetyl-CoA pathway, CO2 => acetyl-CoA ag Carbon Processing CO2 Fixation -K00194 cdhD; acetyl-CoA decarbonylase/synthase, CODH/ACS complex subunit delta [EC:2.1.1.245] [RN:R09096 R10219] Acetyl-CoA pathway, CO2 => acetyl-CoA ag Carbon Processing CO2 Fixation -K10944 particulate methane monooxygenase subunit A (pmoA) [EC:1.14.18.3] Methane oxidation = methane => methanol ag Carbon Processing CH4 oxidation -K10945 particulate methane monooxygenase subunit B (pmoB) [EC:1.14.18.3] Methane oxidation = methane => methanol ag Carbon Processing CH4 oxidation -K10946 particulate methane monooxygenase subunit C (pmoC) [EC:1.14.18.3] Methane oxidation = methane => methanol ag Carbon Processing CH4 oxidation -K16157 soluble methane monooxygenase hydroxylase alpha subunit (mmoX) [EC:1.14.13.25] Methane oxidation = methane => methanol ag Carbon Processing CH4 oxidation -K16158 soluble methane monooxygenase hydroxylase beta subunit (mmoY) [EC:1.14.13.25] Methane oxidation = methane => methanol ag Carbon Processing CH4 oxidation -K16159 soluble methane monooxygenase hydroxylase gamma subunit (mmoZ) [EC:1.14.13.25] Methane oxidation = methane => methanol ag Carbon Processing CH4 oxidation -K16160 soluble methane monooxygenase component B (mmoB) [EC:1.14.13.25] Methane oxidation = methane => methanol ag Carbon Processing CH4 oxidation -K16161 soluble methane monooxygenase reductase component (mmoC) [EC:1.14.13.25] Methane oxidation = methane => methanol ag Carbon Processing CH4 oxidation -K16162 soluble methane monooxygenase regulatory protein (mmoD) [EC:1.14.13.25] Methane oxidation = methane => methanol ag Carbon Processing CH4 oxidation -GH94 GH94 cellobiose phosphorylase (EC 2.4.1.20); laminaribiose phosphorylase (EC 2.4.1.31); cellodextrin phosphorylase (EC 2.4.1.49); chitobiose phosphorylase (EC 2.4.1.-); cyclic beta-1,2-glucan synthase (EC 2.4.1.-); cellobionic acid phosphorylase (EC 2.4.1.321); beta-1,2-oligoglucan phosphorylase (EC 2.4.1.-) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY -GH1 GH1 beta-glucosidase (EC 3.2.1.21); beta-galactosidase (EC 3.2.1.23); beta-mannosidase (EC 3.2.1.25); beta-glucuronidase (EC 3.2.1.31); beta-xylosidase (EC 3.2.1.37); beta-D-fucosidase (EC 3.2.1.38); phlorizin hydrolase (EC 3.2.1.62); exo-beta-1,4-glucanase (EC 3.2.1.74); 6-phospho-beta-galactosidase (EC 3.2.1.85); 6-phospho-beta-glucosidase (EC 3.2.1.86); strictosidine beta-glucosidase (EC 3.2.1.105); lactase (EC 3.2.1.108); amygdalin beta-glucosidase (EC 3.2.1.117); prunasin beta-glucosidase (EC 3.2.1.118); vicianin hydrolase (EC 3.2.1.119); raucaffricine beta-glucosidase (EC 3.2.1.125); thioglucosidase (EC 3.2.1.147); beta-primeverosidase (EC 3.2.1.149); isoflavonoid 7-O-beta-apiosyl-beta-glucosidase (EC 3.2.1.161); ABA-specific beta-glucosidase (EC 3.2.1.175); DIMBOA beta-glucosidase (EC 3.2.1.182); beta-glycosidase (EC 3.2.1.-); hydroxyisourate hydrolase (EC 3.-.-.-) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY -GH2 GH2 beta-galactosidase (EC 3.2.1.23) ; beta-mannosidase (EC 3.2.1.25); beta-glucuronidase (EC 3.2.1.31); alpha-L-arabinofuranosidase (EC 3.2.1.55); mannosylglycoprotein endo-beta-mannosidase (EC 3.2.1.152); exo-beta-glucosaminidase (EC 3.2.1.165); alpha-L-arabinopyranosidase (EC 3.2.1.-); beta-galacturonidase (EC 3.2.1.-); beta-xylosidase (EC 3.2.1.37); beta-D-galactofuranosidase (EC 3.2.1.146); Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY -GH3 GH3 beta-glucosidase (EC 3.2.1.21); xylan 1,4-beta-xylosidase (EC 3.2.1.37); beta-glucosylceramidase (EC 3.2.1.45); beta-N-acetylhexosaminidase (EC 3.2.1.52); alpha-L-arabinofuranosidase (EC 3.2.1.55); glucan 1,3-beta-glucosidase (EC 3.2.1.58); glucan 1,4-beta-glucosidase (EC 3.2.1.74); isoprimeverose-producing oligoxyloglucan hydrolase (EC 3.2.1.120); coniferin beta-glucosidase (EC 3.2.1.126); exo-1,3-1,4-glucanase (EC 3.2.1.-); beta-N-acetylglucosaminide phosphorylases (EC 2.4.1.-) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY -GH5 GH5 endo-beta-1,4-glucanase / cellulase (EC 3.2.1.4); endo-beta-1,4-xylanase (EC 3.2.1.8); beta-glucosidase (EC 3.2.1.21); beta-mannosidase (EC 3.2.1.25); beta-glucosylceramidase (EC 3.2.1.45); glucan beta-1,3-glucosidase (EC 3.2.1.58); licheninase (EC 3.2.1.73); exo-beta-1,4-glucanase / cellodextrinase (EC 3.2.1.74); glucan endo-1,6-beta-glucosidase (EC 3.2.1.75); mannan endo-beta-1,4-mannosidase (EC 3.2.1.78); cellulose beta-1,4-cellobiosidase (EC 3.2.1.91); steryl beta-glucosidase (EC 3.2.1.104); endoglycoceramidase (EC 3.2.1.123); chitosanase (EC 3.2.1.132); beta-primeverosidase (EC 3.2.1.149); xyloglucan-specific endo-beta-1,4-glucanase (EC 3.2.1.151); endo-beta-1,6-galactanase (EC 3.2.1.164); hesperidin 6-O-alpha-L-rhamnosyl-beta-glucosidase (EC 3.2.1.168); beta-1,3-mannanase (EC 3.2.1.-); arabinoxylan-specific endo-beta-1,4-xylanase (EC 3.2.1.-); mannan transglycosylase (EC 2.4.1.-); lichenase / endo-beta-1,3-1,4-glucanase (EC 3.2.1.73); beta-glycosidase (EC 3.2.1.-); endo-beta-1,3-glucanase / laminarinase (EC 3.2.1.39); beta-N-acetylhexosaminidase (EC 3.2.1.52); chitosanase (EC 3.2.1.132); beta-D-galactofuranosidase (EC 3.2.1.146); Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY -GH9 GH9 endoglucanase (EC 3.2.1.4); endo-beta-1,3(4)-glucanase / lichenase-laminarinase (EC 3.2.1.6); beta-glucosidase (EC 3.2.1.21); lichenase / endo-beta-1,3-1,4-glucanase (EC 3.2.1.73); exo-beta-1,4-glucanase / cellodextrinase (EC 3.2.1.74); cellobiohydrolase (EC 3.2.1.91); xyloglucan-specific endo-beta-1,4-glucanase / endo-xyloglucanase (EC 3.2.1.151); exo-beta-glucosaminidase (EC 3.2.1.165) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY -GH16 GH16 xyloglucan:xyloglucosyltransferase (EC 2.4.1.207); keratan-sulfate endo-1,4-beta-galactosidase (EC 3.2.1.103); endo-1,3-beta-glucanase / laminarinase (EC 3.2.1.39); endo-1,3(4)-beta-glucanase (EC 3.2.1.6); licheninase (EC 3.2.1.73); beta-agarase (EC 3.2.1.81); kappa;-carrageenase (EC 3.2.1.83); xyloglucanase (EC 3.2.1.151); endo-beta-1,3-galactanase (EC 3.2.1.181); [retaining] beta-porphyranase (EC 3.2.1.178); hyaluronidase (EC 3.2.1.35); endo-beta-1,4-galactosidase (EC 3.2.1.-); chitin beta-1,6-glucanosyltransferase (EC 2.4.1.-); beta-transglycosidase (EC 2.4.1.-); beta-glycosidase (EC 3.2.1.-); endo-beta-1,3-galactanase (EC 3.2.1.181) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY -GH116 GH116 beta-glucosidase (EC 3.2.1.21); beta-xylosidase (EC 3.2.1.37); acid beta-glucosidase/beta-glucosylceramidase (EC 3.2.1.45); beta-N-acetylglucosaminidase (EC 3.2.1.52) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY -GH6 GH6 endoglucanase (EC 3.2.1.4); cellobiohydrolase (EC 3.2.1.91) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY -GH7 GH7 endo-beta-1,4-glucanase (EC 3.2.1.4); reducing end-acting cellobiohydrolase (EC 3.2.1.176); chitosanase (EC 3.2.1.132); endo-beta-1,3-1,4-glucanase (EC 3.2.1.73) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY -GH8 GH8 chitosanase (EC 3.2.1.132); cellulase (EC 3.2.1.4); licheninase (EC 3.2.1.73); endo-1,4-beta-xylanase (EC 3.2.1.8); reducing-end-xylose releasing exo-oligoxylanase (EC 3.2.1.156) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY -GH10 GH10 endo-1,4-beta-xylanase (EC 3.2.1.8); endo-1,3-beta-xylanase (EC 3.2.1.32); tomatinase (EC 3.2.1.-); xylan endotransglycosylase (EC 2.4.2.-); endo-beta-1,4-glucanase (EC 3.2.1.4) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY -GH124 GH124 endoglucanase (EC 3.2.1.4) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY -GH12 GH12 endoglucanase (EC 3.2.1.4); xyloglucan hydrolase (EC 3.2.1.151); beta-1,3-1,4-glucanase (EC 3.2.1.73); xyloglucan endotransglycosylase (EC 2.4.1.207) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY -GH44 GH44 endoglucanase (EC 3.2.1.4); xyloglucanase (EC 3.2.1.151) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY -GH45 GH45 endoglucanase (EC 3.2.1.4); xyloglucan-specific endo-beta-1,4-glucanase / endo-xyloglucanase (EC 3.2.1.151); endo-beta-1,4-mannanase (EC 3.2.1.78) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY -GH48 GH48 reducing end-acting cellobiohydrolase (EC 3.2.1.176); endo-beta-1,4-glucanase (EC 3.2.1.4); chitinase (EC 3.2.1.14) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY -AA10 AA10 (formerly CBM33) proteins are copper-dependent lytic polysaccharide monooxygenases (LPMOs); some proteins have been shown to act on chitin, others on cellulose; lytic cellulose monooxygenase (C1-hydroxylating) (EC 1.14.99.54); lytic cellulose monooxygenase (C4-dehydrogenating)(EC 1.14.99.56); lytic chitin monooxygenase (EC 1.14.99.53) Auxiliary Activities ag Carbon Processing Cellulose degradation CAZY -AA15 AA15 lytic cellulose monooxygenase (C1-hydroxylating) (EC 1.14.99.54); lytic chitin monooxygenase (EC 1.14.99.53) Auxiliary Activities ag Carbon Processing Cellulose degradation CAZY -AA16 AA16 Lytic cellulose monooxygenase (C1-hydroxylating) (EC 1.14.99.54) Auxiliary Activities ag Carbon Processing Cellulose degradation CAZY -AA9 AA9 (formerly GH61) proteins are copper-dependent lytic polysaccharide monooxygenases (LPMOs); cleavage of cellulose chains with oxidation of carbons C1 and/or C4 and C-6); lytic cellulose monooxygenase (C1-hydroxylating) (EC 1.14.99.54); lytic cellulose monooxygenase (C4-dehydrogenating) (EC 1.14.99.56) Auxiliary Activities ag Carbon Processing Cellulose degradation CAZY -AA11 AA11 proteins are copper-dependent lytic polysaccharide monooxygenases (LPMOs); cleavage of chitin chains with oxidation of C-1 has been demonstrated for a AA11 LPMO from Aspergillus oryzae; Auxiliary Activities ag Carbon Processing Cellulose degradation CAZY -AA13 AA13 proteins are copper-dependent lytic polysaccharide monooxygenases (LPMOs); cleavage of starch with oxidation of C-1 at the site of cleavage has been demonstrated for the LPMO encoded by gene NCU08746 from Neurospora crassa; Auxiliary Activities ag Carbon Processing Cellulose degradation CAZY -AA13 AA13 proteins are copper-dependent lytic polysaccharide monooxygenases (LPMOs); cleavage of starch with oxidation of C-1 at the site of cleavage has been demonstrated for the LPMO encoded by gene NCU08746 from Neurospora crassa; Auxiliary Activities ag Carbon Processing Starch degradation CAZY -GH13 GH13 alpha-amylase (EC 3.2.1.1); pullulanase (EC 3.2.1.41); cyclomaltodextrin glucanotransferase (EC 2.4.1.19); cyclomaltodextrinase (EC 3.2.1.54); trehalose-6-phosphate hydrolase (EC 3.2.1.93); oligo-alpha-glucosidase (EC 3.2.1.10); maltogenic amylase (EC 3.2.1.133); neopullulanase (EC 3.2.1.135); alpha-glucosidase (EC 3.2.1.20); maltotetraose-forming alpha-amylase (EC 3.2.1.60); isoamylase (EC 3.2.1.68); glucodextranase (EC 3.2.1.70); maltohexaose-forming alpha-amylase (EC 3.2.1.98); maltotriose-forming alpha-amylase (EC 3.2.1.116); branching enzyme (EC 2.4.1.18); trehalose synthase (EC 5.4.99.16); 4-alpha-glucanotransferase (EC 2.4.1.25); maltopentaose-forming alpha-amylase (EC 3.2.1.-) ; amylosucrase (EC 2.4.1.4) ; sucrose phosphorylase (EC 2.4.1.7); malto-oligosyltrehalose trehalohydrolase (EC 3.2.1.141); isomaltulose synthase (EC 5.4.99.11); malto-oligosyltrehalose synthase (EC 5.4.99.15); amylo-alpha-1,6-glucosidase (EC 3.2.1.33); alpha-1,4-glucan: phosphate alpha-maltosyltransferase (EC 2.4.99.16); 6'-P-sucrose phosphorylase (EC 2.4.1.-); amino acid transporter Glycoside Hydrolases ag Carbon Processing Starch degradation CAZY -GH14 GH14 beta-amylase (EC 3.2.1.2) Glycoside Hydrolases ag Carbon Processing Starch degradation CAZY -GH57 GH57 alpha-amylase (EC 3.2.1.1); alpha-galactosidase (EC 3.2.1.22); amylopullulanase (EC 3.2.1.41); cyclomaltodextrinase (EC 3.2.1.54); branching enzyme (EC 2.4.1.18); 4-alpha-glucanotransferase (EC 2.4.1.25) Glycoside Hydrolases ag Carbon Processing Starch degradation CAZY -GH119 GH119 alpha-amylase (EC 3.2.1.1) Glycoside Hydrolases ag Carbon Processing Starch degradation CAZY -GH126 GH126 alpha-amylase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Starch degradation CAZY -GH133 GH133 amylo-alpha-1,6-glucosidase (EC 3.2.1.33); Glycoside Hydrolases ag Carbon Processing Starch degradation CAZY -GH15 GH15 glucoamylase (EC 3.2.1.3); glucodextranase (EC 3.2.1.70); alpha,alpha-trehalase (EC 3.2.1.28); dextran dextrinase (EC 2.4.1.2) Glycoside Hydrolases ag Carbon Processing Starch degradation CAZY -GH97 GH97 glucoamylase (EC 3.2.1.3); alpha-glucosidase (EC 3.2.1.20); alpha-galactosidase (EC 3.2.1.22) Glycoside Hydrolases ag Carbon Processing Starch degradation CAZY -GH28 GH28 polygalacturonase (EC 3.2.1.15); alpha-L-rhamnosidase (EC 3.2.1.40); exo-polygalacturonase (EC 3.2.1.67); exo-polygalacturonosidase (EC 3.2.1.82); rhamnogalacturonase (EC 3.2.1.171); rhamnogalacturonan alpha-1,2-galacturonohydrolase (EC 3.2.1.173); endo-xylogalacturonan hydrolase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Pectin degradation CAZY -PL1 PL1 pectate lyase (EC 4.2.2.2); exo-pectate lyase (EC 4.2.2.9); pectin lyase (EC 4.2.2.10). Polysaccharide Lyases ag Carbon Processing Pectin degradation CAZY -PL2 PL2 pectate lyase (EC 4.2.2.2); exo-polygalacturonate lyase (EC 4.2.2.9). Polysaccharide Lyases ag Carbon Processing Pectin degradation CAZY -PL9 PL9 pectate lyase (EC 4.2.2.2); exopolygalacturonate lyase (EC 4.2.2.9); thiopeptidoglycan lyase (EC 4.2.2.-). Polysaccharide Lyases ag Carbon Processing Pectin degradation CAZY -PL10 PL10 pectate lyase (EC 4.2.2.2) Polysaccharide Lyases ag Carbon Processing Pectin degradation CAZY -PL11 PL11 rhamnogalacturonan endolyase (EC 4.2.2.23); rhamnogalacturonan exolyase (EC 4.2.2.24) Polysaccharide Lyases ag Carbon Processing Pectin degradation CAZY -PL22 PL22 oligogalacturonate lyase / oligogalacturonide lyase (EC 4.2.2.6) Polysaccharide Lyases ag Carbon Processing Pectin degradation CAZY -PL26 PL26 rhamnogalacturonan exolyase (EC 4.2.2.24). Polysaccharide Lyases ag Carbon Processing Pectin degradation CAZY -PL3 PL3 pectate lyase (EC 4.2.2.2). Polysaccharide Lyases ag Carbon Processing Pectin degradation CAZY -PL4 PL4 rhamnogalacturonan endolyase (EC 4.2.2.23). Polysaccharide Lyases ag Carbon Processing Pectin degradation CAZY -GH78 GH78 alpha-L-rhamnosidase (EC 3.2.1.40); rhamnogalacturonan alpha-L-rhamnohydrolase (EC 3.2.1.174); L-Rhap-alpha-1,3-D-Apif -specific alpha-1,3-L-rhamnosidase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Pectin degradation CAZY -GH106 GH106 alpha-L-rhamnosidase (EC 3.2.1.40); rhamnogalacturonan alpha-L-rhamnohydrolase (EC 3.2.1.174) Glycoside Hydrolases ag Carbon Processing Pectin degradation CAZY -GH138 GH138 alpha-galacturonidase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Pectin degradation CAZY -GH139 GH139 alpha-2-O-Me-L-fucosidase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Pectin degradation CAZY -GH143 GH143 2-keto-3-deoxy-D-lyxo-heptulosaric acid hydrolase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Pectin degradation CAZY -CE8 CE8 pectin methylesterase (EC 3.1.1.11). Carbohydrate Esterases ag Carbon Processing Pectin degradation CAZY -GH105 GH105 unsaturated rhamnogalacturonyl hydrolase (EC 3.2.1.172); d-4,5-unsaturated beta-glucuronyl hydrolase (EC 3.2.1.-); d-4,5-unsaturated alpha-galacturonidase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Pectin degradation CAZY -GH4 GH4 maltose-6-phosphate glucosidase (EC 3.2.1.122); alpha-glucosidase (EC 3.2.1.20); alpha-galactosidase (EC 3.2.1.22); 6-phospho-beta-glucosidase (EC 3.2.1.86); alpha-glucuronidase (EC 3.2.1.139); alpha-galacturonase (EC 3.2.1.67); palatinase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Pectin degradation CAZY -CE12 CE12 pectin acetylesterase (EC 3.1.1.-); rhamnogalacturonan acetylesterase (EC 3.1.1.-); acetyl xylan esterase (EC 3.1.1.72) Carbohydrate Esterases ag Carbon Processing Pectin degradation CAZY -GH2 GH2 beta-galactosidase (EC 3.2.1.23) ; beta-mannosidase (EC 3.2.1.25); beta-glucuronidase (EC 3.2.1.31); alpha-L-arabinofuranosidase (EC 3.2.1.55); mannosylglycoprotein endo-beta-mannosidase (EC 3.2.1.152); exo-beta-glucosaminidase (EC 3.2.1.165); alpha-L-arabinopyranosidase (EC 3.2.1.-); beta-galacturonidase (EC 3.2.1.-); beta-xylosidase (EC 3.2.1.37); beta-D-galactofuranosidase (EC 3.2.1.146); Glycoside Hydrolases ag Carbon Processing Pectin degradation CAZY -GH113 GH113 beta-mannanase (EC 3.2.1.78) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Beta-mannan Backbone Cleavage (Hemicellulose), Beta-mannan Oligo Cleavage (Hemicellulose) -GH134 GH134 endo-beta-1,4-mannanase (EC 3.2.1.78); Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Beta-mannan Backbone Cleavage (Hemicellulose) -GH26 GH26 beta-mannanase (EC 3.2.1.78); exo-beta-1,4-mannobiohydrolase (EC 3.2.1.100); beta-1,3-xylanase (EC 3.2.1.32); lichenase / endo-beta-1,3-1,4-glucanase (EC 3.2.1.73); mannobiose-producing exo-beta-mannanase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Xylan Backbone Cleavage (Hemicellulose), Beta-mannan Backbone Cleavage (Hemicellulose), Beta-mannan Oligo Cleavage (Hemicellulose) -GH130 GH130 beta-1,4-mannosylglucose phosphorylase (EC 2.4.1.281); beta-1,4-mannooligosaccharide phosphorylase (EC 2.4.1.319); beta-1,4-mannosyl-N-acetyl-glucosamine phosphorylase (EC 2.4.1.320); beta-1,2-mannobiose phosphorylase (EC 2.4.1.-); beta-1,2-oligomannan phosphorylase (EC 2.4.1.-); beta-1,2-mannosidase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Alpha-mannan Oligo Cleavage (Hemicellulose), Beta-mannan Oligo Cleavage (Hemicellulose) -CE2 CE2 acetyl xylan esterase (EC 3.1.1.72). Carbohydrate Esterases ag Carbon Processing Hemicellulose degradation Beta-mannan Oligo Cleavage (Hemicellulose) -CE17 acetyl mannan esterase [EC:3.1.1.-] Carbohydrate Esterases ag Carbon Processing Hemicellulose degradation Beta-mannan deacetylation support (Hemicellulose) -GH99 GH99 glycoprotein endo-alpha-1,2-mannosidase (EC 3.2.1.130); mannan endo-1,2-alpha-mannanase (3.2.1.-) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Alpha-mannan Backbone Cleavage (Hemicellulose) -GH76 GH76 alpha-1,6-mannanase (EC 3.2.1.101); alpha-glucosidase (EC 3.2.1.20) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Alpha-mannan Backbone Cleavage (Hemicellulose), Alpha-mannan Oligo Cleavage (Hemicellulose) -GH92 GH92 mannosyl-oligosaccharide alpha-1,2-mannosidase (EC 3.2.1.113); mannosyl-oligosaccharide alpha-1,3-mannosidase (EC 3.2.1.-); mannosyl-oligosaccharide alpha-1,6-mannosidase (EC 3.2.1.-); alpha-mannosidase (EC 3.2.1.24); alpha-1,2-mannosidase (EC 3.2.1.-); alpha-1,3-mannosidase (EC 3.2.1.-); alpha-1,4-mannosidase (EC 3.2.1.-); mannosyl-1-phosphodiester alpha-1,P-mannosidase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Alpha-mannan Oligo Cleavage (Hemicellulose) -GH38 GH38 alpha-mannosidase (EC 3.2.1.24); mannosyl-oligosaccharide alpha-1,2-mannosidase (EC 3.2.1.113); mannosyl-oligosaccharide alpha-1,3-1,6-mannosidase (EC 3.2.1.114); alpha-2-O-mannosylglycerate hydrolase (EC 3.2.1.170); mannosyl-oligosaccharide alpha-1,3-mannosidase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Alpha-mannan Oligo Cleavage (Hemicellulose) -GH63 GH63 processing alpha-glucosidase (EC 3.2.1.106); alpha-1,3-glucosidase (EC 3.2.1.84); alpha-glucosidase (EC 3.2.1.20); mannosylglycerate alpha-mannosidase / mannosylglycerate hydrolase (EC 3.2.1.170); glucosylglycerate hydrolase (EC 3.2.1.208) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Alpha-mannan Oligo Cleavage (Hemicellulose) -GH47 GH47 alpha-mannosidase (EC 3.2.1.113) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Alpha-mannan Oligo Cleavage (Hemicellulose) -GH125 GH125 exo-alpha-1,6-mannosidase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Alpha-mannan Oligo Cleavage (Hemicellulose) -GH5 GH5 endo-beta-1,4-glucanase / cellulase (EC 3.2.1.4); endo-beta-1,4-xylanase (EC 3.2.1.8); beta-glucosidase (EC 3.2.1.21); beta-mannosidase (EC 3.2.1.25); beta-glucosylceramidase (EC 3.2.1.45); glucan beta-1,3-glucosidase (EC 3.2.1.58); licheninase (EC 3.2.1.73); exo-beta-1,4-glucanase / cellodextrinase (EC 3.2.1.74); glucan endo-1,6-beta-glucosidase (EC 3.2.1.75); mannan endo-beta-1,4-mannosidase (EC 3.2.1.78); cellulose beta-1,4-cellobiosidase (EC 3.2.1.91); steryl beta-glucosidase (EC 3.2.1.104); endoglycoceramidase (EC 3.2.1.123); chitosanase (EC 3.2.1.132); beta-primeverosidase (EC 3.2.1.149); xyloglucan-specific endo-beta-1,4-glucanase (EC 3.2.1.151); endo-beta-1,6-galactanase (EC 3.2.1.164); hesperidin 6-O-alpha-L-rhamnosyl-beta-glucosidase (EC 3.2.1.168); beta-1,3-mannanase (EC 3.2.1.-); arabinoxylan-specific endo-beta-1,4-xylanase (EC 3.2.1.-); mannan transglycosylase (EC 2.4.1.-); lichenase / endo-beta-1,3-1,4-glucanase (EC 3.2.1.73); beta-glycosidase (EC 3.2.1.-); endo-beta-1,3-glucanase / laminarinase (EC 3.2.1.39); beta-N-acetylhexosaminidase (EC 3.2.1.52); chitosanase (EC 3.2.1.132); beta-D-galactofuranosidase (EC 3.2.1.146); Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Amorphous Cellulose Backbone Cleavage, Amorphous Cellulose Oligo Cleavage, Xyloglucan Backbone Cleavage (Hemicellulose), Xylan Backbone Cleavage (Hemicellulose), Beta-mannan Backbone Cleavage (Hemicellulose), Mixed-Linkage glucans Backbone Cleavage (Hemicellulose), Chitin Oligo Cleavage -GH9 GH9 endoglucanase (EC 3.2.1.4); endo-beta-1,3(4)-glucanase / lichenase-laminarinase (EC 3.2.1.6); beta-glucosidase (EC 3.2.1.21); lichenase / endo-beta-1,3-1,4-glucanase (EC 3.2.1.73); exo-beta-1,4-glucanase / cellodextrinase (EC 3.2.1.74); cellobiohydrolase (EC 3.2.1.91); xyloglucan-specific endo-beta-1,4-glucanase / endo-xyloglucanase (EC 3.2.1.151); exo-beta-glucosaminidase (EC 3.2.1.165) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Amorphous Cellulose Backbone Cleavage, Amorphous Cellulose Oligo Cleavage, Xyloglucan Backbone Cleavage (Hemicellulose), Mixed-Linkage glucans Backbone Cleavage (Hemicellulose) -GH12 GH12 endoglucanase (EC 3.2.1.4); xyloglucan hydrolase (EC 3.2.1.151); beta-1,3-1,4-glucanase (EC 3.2.1.73); xyloglucan endotransglycosylase (EC 2.4.1.207) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Amorphous Cellulose Backbone Cleavage, Xyloglucan Backbone Cleavage (Hemicellulose) -GH16 GH16 xyloglucan:xyloglucosyltransferase (EC 2.4.1.207); keratan-sulfate endo-1,4-beta-galactosidase (EC 3.2.1.103); endo-1,3-beta-glucanase / laminarinase (EC 3.2.1.39); endo-1,3(4)-beta-glucanase (EC 3.2.1.6); licheninase (EC 3.2.1.73); beta-agarase (EC 3.2.1.81); kappa;-carrageenase (EC 3.2.1.83); xyloglucanase (EC 3.2.1.151); endo-beta-1,3-galactanase (EC 3.2.1.181); [retaining] beta-porphyranase (EC 3.2.1.178); hyaluronidase (EC 3.2.1.35); endo-beta-1,4-galactosidase (EC 3.2.1.-); chitin beta-1,6-glucanosyltransferase (EC 2.4.1.-); beta-transglycosidase (EC 2.4.1.-); beta-glycosidase (EC 3.2.1.-); endo-beta-1,3-galactanase (EC 3.2.1.181) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Amorphous Cellulose Oligo Cleavage, Xyloglucan Backbone Cleavage (Hemicellulose), Mixed-Linkage glucans Backbone Cleavage (Hemicellulose), Mixed-Linkage glucans Oligo Cleavage (Hemicellulose), Sulf-Polysachharides Backbone Cleavage -GH44 GH44 endoglucanase (EC 3.2.1.4); xyloglucanase (EC 3.2.1.151) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Amorphous Cellulose Backbone Cleavage, Xyloglucan Backbone Cleavage (Hemicellulose) -GH45 GH45 endoglucanase (EC 3.2.1.4); xyloglucan-specific endo-beta-1,4-glucanase / endo-xyloglucanase (EC 3.2.1.151); endo-beta-1,4-mannanase (EC 3.2.1.78) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Amorphous Cellulose Backbone Cleavage, Xyloglucan Backbone Cleavage (Hemicellulose) -GH48 GH48 reducing end-acting cellobiohydrolase (EC 3.2.1.176); endo-beta-1,4-glucanase (EC 3.2.1.4); chitinase (EC 3.2.1.14) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Crystalline Cellulose Backbone Cleavage, Xyloglucan Backbone Cleavage (Hemicellulose) -GH74 GH74 endoglucanase (EC 3.2.1.4); oligoxyloglucan reducing end-specific cellobiohydrolase (EC 3.2.1.150); xyloglucanase (EC 3.2.1.151) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Xyloglucan Backbone Cleavage (Hemicellulose) -GH31 GH31 alpha-glucosidase (EC 3.2.1.20); alpha-galactosidase (EC 3.2.1.22); alpha-mannosidase (EC 3.2.1.24); alpha-1,3-glucosidase (EC 3.2.1.84); sucrase-isomaltase (EC 3.2.1.48) (EC 3.2.1.10); alpha-xylosidase (EC 3.2.1.177); alpha-glucan lyase (EC 4.2.2.13); isomaltosyltransferase (EC 2.4.1.-); oligosaccharide alpha-1,4-glucosyltransferase (EC 2.4.1.161); sulfoquinovosidase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Xyloglucan Oligo Cleavage (Hemicellulose), Xylan Oligo Cleavage (Hemicellulose), Alpha-galactans Oligo Cleavage, Alpha-galactans Oligo Cleavage, Mucin Oligo Cleavage -GH10 GH10 endo-1,4-beta-xylanase (EC 3.2.1.8); endo-1,3-beta-xylanase (EC 3.2.1.32); tomatinase (EC 3.2.1.-); xylan endotransglycosylase (EC 2.4.2.-); endo-beta-1,4-glucanase (EC 3.2.1.4) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Amorphous Cellulose Backbone Cleavage, Xyloglucan Oligo Cleavage (Hemicellulose), Xylan Backbone Cleavage (Hemicellulose) -GH2 GH2 beta-galactosidase (EC 3.2.1.23) ; beta-mannosidase (EC 3.2.1.25); beta-glucuronidase (EC 3.2.1.31); alpha-L-arabinofuranosidase (EC 3.2.1.55); mannosylglycoprotein endo-beta-mannosidase (EC 3.2.1.152); exo-beta-glucosaminidase (EC 3.2.1.165); alpha-L-arabinopyranosidase (EC 3.2.1.-); beta-galacturonidase (EC 3.2.1.-); beta-xylosidase (EC 3.2.1.37); beta-D-galactofuranosidase (EC 3.2.1.146); Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Amorphous Cellulose Oligo Cleavage, Xyloglucan Oligo Cleavage (Hemicellulose), Beta-mannan Oligo Cleavage (Hemicellulose), Pectin Oligo Cleavage, Beta-galactan (pectic galactan) Oligo Cleavage, Arabinose Oligo cleavage -GH11 GH11 endo-beta-1,4-xylanase (EC 3.2.1.8); endo-beta-1,3-xylanase (EC 3.2.1.32) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Xylan Backbone Cleavage (Hemicellulose) -GH43 GH43 beta-xylosidase (EC 3.2.1.37); alpha-L-arabinofuranosidase (EC 3.2.1.55); xylanase (EC 3.2.1.8); alpha-1,2-L-arabinofuranosidase (EC 3.2.1.-); exo-alpha-1,5-L-arabinofuranosidase (EC 3.2.1.-); [inverting] exo-alpha-1,5-L-arabinanase (EC 3.2.1.-); beta-1,3-xylosidase (EC 3.2.1.-); [inverting] exo-alpha-1,5-L-arabinanase (EC 3.2.1.-); [inverting] endo-alpha-1,5-L-arabinanase (EC 3.2.1.99); exo-beta-1,3-galactanase (EC 3.2.1.145); beta-D-galactofuranosidase (EC 3.2.1.146) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Xyloglucan Oligo Cleavage (Hemicellulose), Arabinan Backbone Cleavage, Arabinan Oligo Cleavage -GH51 GH51 endoglucanase (EC 3.2.1.4); endo-beta-1,4-xylanase (EC 3.2.1.8); beta-xylosidase (EC 3.2.1.37); alpha-L-arabinofuranosidase (EC 3.2.1.55); lichenase / endo-beta-1,3-1,4-glucanase (EC 3.2.1.73) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Arabinan Oligo Cleavage -CE1 CE1 acetyl xylan esterase (EC 3.1.1.72); cinnamoyl esterase (EC 3.1.1.-); feruloyl esterase (EC 3.1.1.73); carboxylesterase (EC 3.1.1.1); S-formylglutathione hydrolase (EC 3.1.2.12); diacylglycerol O-acyltransferase (EC 2.3.1.20); trehalose 6-O-mycolyltransferase (EC 2.3.1.122) Carbohydrate Esterases ag Carbon Processing Hemicellulose degradation Xylan deacetylation support -CE4 CE4 acetyl xylan esterase (EC 3.1.1.72); chitin deacetylase (EC 3.5.1.41); chitooligosaccharide deacetylase (EC 3.5.1.-); peptidoglycan GlcNAc deacetylase (EC 3.5.1.-); peptidoglycan N-acetylmuramic acid deacetylase (EC 3.5.1.-). Carbohydrate Esterases ag Carbon Processing Hemicellulose degradation Chitin Oligo Cleavage -AA9 AA9 (formerly GH61) proteins are copper-dependent lytic polysaccharide monooxygenases (LPMOs); cleavage of cellulose chains with oxidation of carbons C1 and/or C4 and C-6); lytic cellulose monooxygenase (C1-hydroxylating) (EC 1.14.99.54); lytic cellulose monooxygenase (C4-dehydrogenating) (EC 1.14.99.56) Auxiliary Activities ag Carbon Processing Hemicellulose degradation Crystalline Cellulose Backbone Cleavage, Xyloglucan Backbone Cleavage (Hemicellulose) -AA1 laccase / multicopper oxidase [EC:1.10.3.2] Lignin degradation (oxidative depolymerization) ag Carbon Processing Lignin degradation Oxidative polymer attack -mco multicopper oxidase (bacterial laccase) [EC:1.10.3.2] Lignin degradation (oxidative depolymerization) ag Carbon Processing Lignin degradation Oxidative polymer attack -AA2 class II peroxidase (lignin/manganese/versatile peroxidases) [EC:1.11.1.-] Lignin degradation (oxidative depolymerization) ag Carbon Processing Lignin degradation Oxidative polymer attack -dyp DyP-type peroxidase (dye-decolorizing peroxidase) [EC:1.11.1.-] Lignin degradation (oxidative depolymerization) ag Carbon Processing Lignin degradation Oxidative polymer attack -AA3_2 aryl-alcohol oxidase (GMC oxidoreductase) [EC:1.1.3.7] Lignin degradation (oxidative depolymerization) ag Carbon Processing Lignin degradation Redox support -AA5_1 glyoxal oxidase [EC:1.2.3.15] Lignin degradation (oxidative depolymerization) ag Carbon Processing Lignin degradation Redox support -AA8 cellobiose dehydrogenase, cytochrome domain [EC:1.1.99.-] Lignin degradation (oxidative depolymerization) ag Carbon Processing Lignin degradation Redox support -AA3_1 cellobiose dehydrogenase, dehydrogenase domain [EC:1.1.99.-] Lignin degradation (oxidative depolymerization) ag Carbon Processing Lignin degradation Redox support -K18851 glucose-6-phosphate isomerase [EC:5.3.1.9] Glycolysis / gluconeogenesis ag Carbon Processing Sugar utilization Glucose -K00844 hexokinase [EC:2.7.1.1] Glycolysis (hexokinase reaction) ag Carbon Processing Sugar utilization Glucose -K12407 glucokinase [EC:2.7.1.2] Glycolysis (glucokinase reaction) ag Carbon Processing Sugar utilization Glucose -K00845 glucose-6-phosphate dehydrogenase [EC:1.1.1.49] Pentose phosphate pathway (glucose-6-phosphate dehydrogenase) ag Carbon Processing Sugar utilization Glucose -K25026 phosphoglucose isomerase [EC:5.3.1.9] Glycolysis / pentose phosphate interconversion ag Carbon Processing Sugar utilization Glucose -K01182 sucrase-isomaltase [EC:3.2.1.48] Sucrose and starch metabolism (sucrase–isomaltase complex) ag Carbon Processing Sugar utilization Sucrose -K01203 β-fructofuranosidase [EC:3.2.1.26] Fructose and mannose metabolism (β-fructofuranosidase) ag Carbon Processing Sugar utilization Sucrose -K12047 sucrose phosphorylase [EC:2.4.1.7] Sucrose metabolism (sucrose phosphorylase) ag Carbon Processing Sugar utilization Sucrose -K01187 sucrase [EC:3.2.1.48] Sucrose metabolism (sucrase) ag Carbon Processing Sugar utilization Sucrose -K12316 glucosyltransferase [EC:2.4.1.4] Sucrose and starch metabolism (α-glucosyltransferase) ag Carbon Processing Sugar utilization Sucrose -K12317 sucrose-6F-phosphate phosphohydrolase [EC:3.1.3.24] Sucrose-6F-phosphate metabolism (phosphohydrolase) ag Carbon Processing Sugar utilization Sucrose -K00695 α-glucosidase [EC:3.2.1.20] Carbohydrate metabolism (α-glucosidase) ag Carbon Processing Sugar utilization Sucrose -K00690 maltase-glucoamylase [EC:3.2.1.20] Starch and sucrose metabolism (maltase–glucoamylase) ag Carbon Processing Sugar utilization Sucrose -K05341 glucanotransferase [EC:2.4.1.25] Glycosyltransferase (oligosaccharide interconversion) ag Carbon Processing Sugar utilization Sucrose -K00689 oligo-1,6-glucosidase [EC:3.2.1.10] Carbohydrate metabolism (oligo-1,6-glucosidase) ag Carbon Processing Sugar utilization Sucrose -K00692 isomaltase [EC:3.2.1.10] Starch and sucrose metabolism (isomaltase) ag Carbon Processing Sugar utilization Sucrose -K01809 mannose-6-phosphate isomerase [EC:5.3.1.8] Mannose metabolism (mannose-6-phosphate isomerase) ag Carbon Processing Sugar utilization Mannose -K02793 mannose PTS system IIA component [EC:2.7.1.191] PTS system, mannose-specific II component ag Carbon Processing Sugar utilization Mannose -K02794 mannose PTS system IIB component [EC:2.7.1.191] PTS system, mannose-specific II component ag Carbon Processing Sugar utilization Mannose -K02795 mannose PTS system IIC component [EC:2.7.1.191] PTS system, mannose-specific II component ag Carbon Processing Sugar utilization Mannose -K00849 galactokinase [EC:2.7.1.6] Galactose metabolism (galactokinase; Leloir pathway) ag Carbon Processing Sugar utilization Galactose -K00965 galactose-1-phosphate uridylyltransferase [EC:2.7.7.12] Galactose metabolism (galactose-1-phosphate uridylyltransferase; Leloir pathway) ag Carbon Processing Sugar utilization Galactose -K01784 UDP-galactose 4-epimerase [EC:5.1.3.2] Galactose metabolism (UDP-galactose 4-epimerase; Leloir pathway) ag Carbon Processing Sugar utilization Galactose -K01785 galactose mutarotase [EC:5.1.3.3] Galactose metabolism (galactose mutarotase; Leloir pathway) ag Carbon Processing Sugar utilization Galactose -K00879 L-fucokinase [EC:2.7.1.52] Fucose metabolism (L-fucokinase) ag Carbon Processing Sugar utilization Fucose -K01628 L-fuculose-phosphate aldolase [EC:4.1.2.17] Fucose metabolism (L-fuculose-phosphate aldolase) ag Carbon Processing Sugar utilization Fucose -K01818 L-fucose isomerase [EC:5.3.1.25] Fucose metabolism (L-fucose isomerase) ag Carbon Processing Sugar utilization Fucose -K00854 xylose kinase [EC:2.7.1.17] Xylose metabolism (xylose kinase) ag Carbon Processing Sugar utilization Xylose -K01805 xylose isomerase [EC:5.3.1.5] Xylose metabolism (xylose isomerase) ag Carbon Processing Sugar utilization Xylose -K00008 xylitol dehydrogenase [EC:1.1.1.9] Xylose metabolism (xylitol dehydrogenase) ag Carbon Processing Sugar utilization Xylose -K00011 L-arabitol dehydrogenase [EC:1.1.1.12] Xylose / arabinose metabolism (arabitol dehydrogenase) ag Carbon Processing Sugar utilization Xylose -K05351 xylulokinase [EC:2.7.1.17] Xylose metabolism (xylulokinase) ag Carbon Processing Sugar utilization Xylose -K17743 xylitol oxidase [EC:1.1.3.41] Xylose metabolism (xylitol oxidase) ag Carbon Processing Sugar utilization Xylose -K14273 xylulose reductase [EC:1.1.1.9] Xylose metabolism (xylulose reductase) ag Carbon Processing Sugar utilization Xylose -K14274 D-xylonate dehydratase [EC:4.2.1.82] Xylose metabolism (xylonate dehydratase) ag Carbon Processing Sugar utilization Xylose -K14275 xylonolactonase [EC:3.1.1.68] Xylose metabolism (xylonolactonase) ag Carbon Processing Sugar utilization Xylose -K01804 L-arabinose isomerase [EC:5.3.1.4] Arabinose metabolism (L-arabinose isomerase) ag Carbon Processing Sugar utilization Arabinose -K00011 L-arabitol dehydrogenase [EC:1.1.1.12] Xylose / arabinose metabolism (arabitol dehydrogenase) ag Carbon Processing Sugar utilization Arabinose -K26066 arabinose 1-dehydrogenase [EC:1.1.1.46] Arabinose metabolism (arabinose 1-dehydrogenase) ag Carbon Processing Sugar utilization Arabinose -K13873 arabinolactonase [EC:3.1.1.110] Arabinose metabolism (arabinolactonase) ag Carbon Processing Sugar utilization Arabinose -K19660 arabinonate dehydratase [EC:4.2.1.37] Arabinose metabolism (arabinonate dehydratase) ag Carbon Processing Sugar utilization Arabinose -K12446 L-arabonate dehydratase [EC:4.2.1.37] Arabinose metabolism (L-arabonate dehydratase) ag Carbon Processing Sugar utilization Arabinose -K19243 glucose-6-phosphate 1-dehydrogenase [EC:1.1.1.49 1.1.1.363 1.1.1.388] [RN:R02736 R10907] ag Carbon Processing Sugar utilization Glucose -K01807 ribose 5-phosphate isomerase [EC:5.3.1.6] [RN:R01056] ag Carbon Processing Sugar utilization Ribose -K01808 ribose 5-phosphate isomerase [EC:5.3.1.6] [RN:R01056] ag Carbon Processing Sugar utilization Ribose -K01810 glucose-6-phosphate isomerase [EC:5.3.1.9] [RN:R02740 R02739] ag Carbon Processing Sugar utilization Glucose -K06859 glucose-6-phosphate isomerase [EC:5.3.1.9] [RN:R02740 R02739] ag Carbon Processing Sugar utilization Glucose -K13810 glucose-6-phosphate isomerase [EC:5.3.1.9] [RN:R02740 R02739] ag Carbon Processing Sugar utilization Glucose -K15916 glucose-6-phosphate isomerase [EC:5.3.1.9] [RN:R02740 R02739] ag Carbon Processing Sugar utilization Glucose -K00948 ribose-phosphate pyrophosphokinase [EC:2.7.6.1] [RN:R01049] ag Carbon Processing Sugar utilization Ribose -K13937 hexose-6-phosphate dehydrogenase [EC:1.1.1.47 3.1.1.31] [RN:R02736 R02035] ag Carbon Processing Sugar utilization Glucose -K01057 6-phosphogluconolactonase [EC:3.1.1.31] [RN:R02035] ag Carbon Processing Sugar utilization Glucose -K07404 6-phosphogluconolactonase [EC:3.1.1.31] [RN:R02035] ag Carbon Processing Sugar utilization Glucose -K00033 6-phosphogluconate dehydrogenase [EC:1.1.1.44 1.1.1.343] [RN:R01528 R10221] ag Carbon Processing Sugar utilization Glucose -K00615 transketolase [EC:2.2.1.1] [RN:R01830 R01641] ag Carbon Processing Sugar utilization Ribose -K00616 transaldolase [EC:2.2.1.2] [RN:R01827] ag Carbon Processing Sugar utilization Ribose -K01783 ribulose-phosphate 3-epimerase [EC:5.1.3.1] [RN:R01529] ag Carbon Processing Sugar utilization Ribose -K08094 6-phospho-3-hexuloisomerase [EC:5.3.1.27] [RN:R09780] ag Carbon Processing Sugar utilization Ribose -K08093 3-hexulose-6-phosphate synthase [EC:4.1.2.43] [RN:R05338] ag Carbon Processing Sugar utilization Ribose -K13812 3-hexulose-6-phosphate synthase [EC:4.1.2.43] [RN:R05338] ag Carbon Processing Sugar utilization Ribose -K13831 6-phospho-3-hexuloisomerase [EC:5.3.1.27] [RN:R09780] ag Carbon Processing Sugar utilization Ribose -K00844 hexokinase [EC:2.7.1.1] [RN:R01786] ag Carbon Processing Sugar utilization Glucose -K01835 phosphoglucomutase [EC:5.4.2.2] [RN:R00959] ag Carbon Processing Sugar utilization Glucose -K00963 UTP--glucose-1-phosphate uridylyltransferase [EC:2.7.7.9] [RN:R00289] ag Carbon Processing Sugar utilization Glucose -K00849 galactokinase [EC:2.7.1.6] [RN:R01092] ag Carbon Processing Sugar utilization Galactose -K00918 ADP-dependent phosphofructokinase [EC:2.7.1.146] [RN:R09084] ag Carbon Processing Sugar utilization Glucose -K00850 6-phosphofructokinase [EC:2.7.1.11] [RN:R04779] ag Carbon Processing Sugar utilization Glucose -K16370 6-phosphofructokinase [EC:2.7.1.11] [RN:R04779] ag Carbon Processing Sugar utilization Glucose -K01623 fructose-bisphosphate aldolase [EC:4.1.2.13] [RN:R01070] ag Carbon Processing Sugar utilization Fructose -K01624 fructose-bisphosphate aldolase [EC:4.1.2.13] [RN:R01070] ag Carbon Processing Sugar utilization Fructose -K11645 fructose-bisphosphate aldolase [EC:4.1.2.13] [RN:R01070] ag Carbon Processing Sugar utilization Fructose -K16305 fructose-bisphosphate aldolase [EC:4.1.2.13] [RN:R01070] ag Carbon Processing Sugar utilization Fructose -K16306 fructose-bisphosphate aldolase [EC:4.1.2.13] [RN:R01070] ag Carbon Processing Sugar utilization Fructose -K01803 triosephosphate isomerase [EC:5.3.1.1] [RN:R01015] ag Carbon Processing Sugar utilization Glucose -K00134 glyceraldehyde 3-phosphate dehydrogenase [EC:1.2.1.12 1.2.1.59] [RN:R01061 R01063] ag Carbon Processing Sugar utilization Glucose -K00150 glyceraldehyde 3-phosphate dehydrogenase [EC:1.2.1.12 1.2.1.59] [RN:R01061 R01063] ag Carbon Processing Sugar utilization Glucose -K00927 phosphoglycerate kinase [EC:2.7.2.3] [RN:R01512] ag Carbon Processing Sugar utilization Glucose -K11389 glyceraldehyde-3-phosphate dehydrogenase (ferredoxin) [EC:1.2.7.6] [RN:R07159] ag Carbon Processing Sugar utilization Glucose -K01834 phosphoglycerate mutase [EC:5.4.2.11 5.4.2.12] [RN:R01518] ag Carbon Processing Sugar utilization Glucose -K15633 phosphoglycerate mutase [EC:5.4.2.11 5.4.2.12] [RN:R01518] ag Carbon Processing Sugar utilization Glucose -K15634 phosphoglycerate mutase [EC:5.4.2.11 5.4.2.12] [RN:R01518] ag Carbon Processing Sugar utilization Glucose -K15635 phosphoglycerate mutase [EC:5.4.2.11 5.4.2.12] [RN:R01518] ag Carbon Processing Sugar utilization Glucose -K01689 enolase [EC:4.2.1.11] [RN:R00658] ag Carbon Processing Sugar utilization Glucose -K00873 pyruvate kinase [EC:2.7.1.40] [RN:R00200] ag Carbon Processing Sugar utilization Glucose -K12406 pyruvate kinase [EC:2.7.1.40] [RN:R00200] ag Carbon Processing Sugar utilization Glucose -K01596 phosphoenolpyruvate carboxykinase [EC:4.1.1.32 4.1.1.49] [RN:R00431 R00726 R00341] ag Carbon Processing Sugar utilization Fructose -K01610 phosphoenolpyruvate carboxykinase [EC:4.1.1.32 4.1.1.49] [RN:R00431 R00726 R00341] ag Carbon Processing Sugar utilization Fructose -K03841 fructose-1,6-bisphosphatase [EC:3.1.3.11] [RN:R04780] ag Carbon Processing Sugar utilization Fructose -K02446 fructose-1,6-bisphosphatase [EC:3.1.3.11] [RN:R04780] ag Carbon Processing Sugar utilization Fructose -K11532 fructose-1,6-bisphosphatase [EC:3.1.3.11] [RN:R04780] ag Carbon Processing Sugar utilization Fructose -K01086 fructose-1,6-bisphosphatase [EC:3.1.3.11] [RN:R04780] ag Carbon Processing Sugar utilization Fructose -K04041 fructose-1,6-bisphosphatase [EC:3.1.3.11] [RN:R04780] ag Carbon Processing Sugar utilization Fructose -K01622 fructose 1,6-bisphosphate aldolase/phosphatase [EC:4.1.2.13 3.1.3.11] [RN:R01070 R04780] ag Carbon Processing Sugar utilization Fructose -K01690 phosphogluconate dehydratase [EC:4.2.1.12] [RN:R02036] ag Carbon Processing Sugar utilization Glucose -K01625 2-dehydro-3-deoxyphosphogluconate aldolase [EC:4.1.2.14] [RN:R05605] ag Carbon Processing Sugar utilization Glucose -K01785 aldose 1-epimerase [EC:5.1.3.3] [RN:R10619] ag Carbon Processing Sugar utilization Glucose -K00012 UDPglucose 6-dehydrogenase [EC:1.1.1.22] [RN:R00286] ag Carbon Processing Sugar utilization Glucose -AA3 AA3 cellobiose dehydrogenase (EC 1.1.99.18); glucose 1-oxidase (EC 1.1.3.4); aryl alcohol oxidase (EC 1.1.3.7); alcohol oxidase (EC 1.1.3.13); pyranose oxidase (EC 1.1.3.10) ag Carbon Processing Sugar utilization Glucose -AA5 AA5 Oxidase with oxygen as acceptor (EC 1.1.3.-); galactose oxidase (EC 1.1.3.9); glyoxal oxidase (EC 1.2.3.15); alcohol oxidase (EC 1.1.3.13) ag Carbon Processing Sugar utilization Galactose -CBM13 CBM13 Modules of approx. 150 residues which always appear as a threefold internal repeat. The only apparent exception to this, xylanase II of Actinomadura sp. FC7 (GenBank U08894), is in fact not completely sequenced. These modules were first identified in several plant lectins such as ricin or agglutinin of Ricinus communis which bind galactose residues. The three-dimensional structure of a plant lectin has been determined and displays a pseudo-threefold symmetry in accord with the observed sequence threefold repeat. These modules have since been found in a number of other proteins of various functions including glycoside hydrolases and glycosyltransferases. While in the plant lectins this module binds mannose, binding to xylan has been demonstrated in the Streptomyces lividans xylanase A and arabinofuranosidase B. Binding to GalNAc has been shown for the corresponding module of GalNAc transferase 4. For the other proteins, the binding specificity of these modules has not been established. The pseudo three-fold symmetry of the CBM13 module has now been confirmed in the 3-D structure of the intact, two-domain, xylanase of Streptomyces olivaceoviridis. ag Carbon Processing Sugar utilization Xylanase -CBM31 CBM31 Binding to beta-1,3-xylan has been demonstrated for the C-terminal module of the beta-1,3-xylanase of Alcaligenes sp. XY234. ag Carbon Processing Sugar utilization Xylanase -CBM32 CBM32 Binding to galactose and lactose has been demonstrated for the module of Micromonospora viridifaciens sialidase (PMID: 16239725). Binding to polygalacturonic acid has been shown for a Yersinia member (PMID: 17292916). Binding to LacNAc (beta-D-galactosyl-1,4-beta-D-N-acetylglucosamine) has been shown for an N-acetylglucosaminidase from Clostridium perfingens (PMID: 16990278). ag Carbon Processing Sugar utilization Galacturonic Acid -CBM36 CBM36 Modules of approx. 120-130 residues displaying structural similarities to CBM6 modules. The only CBM36 currently characterised, that from Paenbacillus polymyxa xylanase 43A, shows calcium-dependent binding of xylans and xylooligosaccharides. X-ray crystallography shows that there is a direct interaction between calcium and ligand. ag Carbon Processing Sugar utilization Xylanase -CBM51 CBM51 Modules of approx. 150 residues found attached to various enzymes from families GH2, GH27, GH31, GH95, GH98 and GH101 . Binding to galactose and to blood group A/B-antigens demonstrated in the case of C. perfringens GH95CBM51 and GH98CBM51 respectively [Gregg KJ et al. (2008) J. Biol. Chem. 283:12604-13 PMID: 18292090]. ag Carbon Processing Sugar utilization Galactose -CBM59 CBM59 Binding to mannan, xylan, and cellulose demonstrated for the CBM59 of ManF-X10 xylanase from an environmental genomic DNA library (Li et al. (2009) World Journal of Microbiology and Biotechnology 25:2071-2078; doi:10.1007/s11274-009-0111-6) ag Carbon Processing Sugar utilization Xylanase -CBM60 CBM60 Modules of approx 120 residues usually found appended to xylanases. The xylan-binding function and the relatedness (circular permutation) to family CBM36 has been demonstrated [PMID: 20659893]. ag Carbon Processing Sugar utilization Xylanase -CBM62 CBM62 The CBM62 module of Clostridium thermocellum Cthe_2193 protein binds galactose moieties found on xyloglucan, arabinogalactan and galactomannan. ag Carbon Processing Sugar utilization Galactose -CBM67 CBM67 Fujimoto et al. [PMID : 23486481] disclosed the L-rhamnose binding activity and 3-D structure of the CBM67 of Streptomyces avermitilis alpha-L-rhamnosidase (SaRha78A); ag Carbon Processing Sugar utilization Rhamnose -CBM71 CBM71 The two CBM71s of S. pneumoniae BgaA bind lactose and LacNAc. ag Carbon Processing Sugar utilization Lactose -CBM9 CBM9 Modules of approx. 170 residues found so far only in xylanases. The cellulose-binding function has been demonstrated in one case. ag Carbon Processing Sugar utilization Xylanase -CE1 CE1 acetyl xylan esterase (EC 3.1.1.72); cinnamoyl esterase (EC 3.1.1.-); feruloyl esterase (EC 3.1.1.73); carboxylesterase (EC 3.1.1.1); S-formylglutathione hydrolase (EC 3.1.2.12); diacylglycerol O-acyltransferase (EC 2.3.1.20); trehalose 6-O-mycolyltransferase (EC 2.3.1.122) ag Carbon Processing Sugar utilization Trehalose -GH11 GH11 endo-beta-1,4-xylanase (EC 3.2.1.8); endo-beta-1,3-xylanase (EC 3.2.1.32) ag Carbon Processing Sugar utilization Glycoside Hydrolase -GH130 GH130 beta-1,4-mannosylglucose phosphorylase (EC 2.4.1.281); beta-1,4-mannooligosaccharide phosphorylase (EC 2.4.1.319); beta-1,4-mannosyl-N-acetyl-glucosamine phosphorylase (EC 2.4.1.320); beta-1,2-mannobiose phosphorylase (EC 2.4.1.-); beta-1,2-oligomannan phosphorylase (EC 2.4.1.-); beta-1,2-mannosidase (EC 3.2.1.-) ag Carbon Processing Sugar utilization Glycoside Hydrolase -GH18 GH18 chitinase (EC 3.2.1.14); lysozyme (EC 3.2.1.17); endo-beta-N-acetylglucosaminidase (EC 3.2.1.96); peptidoglycan hydrolase with endo-beta-N-acetylglucosaminidase specificity (EC 3.2.1.-); Nod factor hydrolase (EC 3.2.1.-); xylanase inhibitor; concanavalin B; narbonin ag Carbon Processing Sugar utilization Glycoside Hydrolase -GH26 GH26 beta-mannanase (EC 3.2.1.78); exo-beta-1,4-mannobiohydrolase (EC 3.2.1.100); beta-1,3-xylanase (EC 3.2.1.32); lichenase / endo-beta-1,3-1,4-glucanase (EC 3.2.1.73); mannobiose-producing exo-beta-mannanase (EC 3.2.1.-) ag Carbon Processing Sugar utilization Glycoside Hydrolase -GH32 GH32 invertase (EC 3.2.1.26); endo-inulinase (EC 3.2.1.7); beta-2,6-fructan 6-levanbiohydrolase (EC 3.2.1.64); endo-levanase (EC 3.2.1.65); exo-inulinase (EC 3.2.1.80); fructan beta-(2,1)-fructosidase/1-exohydrolase (EC 3.2.1.153); fructan beta-(2,6)-fructosidase/6-exohydrolase (EC 3.2.1.154); sucrose:sucrose 1-fructosyltransferase (EC 2.4.1.99); fructan:fructan 1-fructosyltransferase (EC 2.4.1.100); sucrose:fructan 6-fructosyltransferase (EC 2.4.1.10); fructan:fructan 6G-fructosyltransferase (EC 2.4.1.243); levan fructosyltransferase (EC 2.4.1.-); [retaining] sucrose:sucrose 6-fructosyltransferase (6-SST) (EC 2.4.1.-); cycloinulo-oligosaccharide fructanotransferase (EC 2.4.1.-) ag Carbon Processing Sugar utilization Glycoside Hydrolase -GH43 GH43 beta-xylosidase (EC 3.2.1.37); alpha-L-arabinofuranosidase (EC 3.2.1.55); xylanase (EC 3.2.1.8); alpha-1,2-L-arabinofuranosidase (EC 3.2.1.-); exo-alpha-1,5-L-arabinofuranosidase (EC 3.2.1.-); [inverting] exo-alpha-1,5-L-arabinanase (EC 3.2.1.-); beta-1,3-xylosidase (EC 3.2.1.-); [inverting] exo-alpha-1,5-L-arabinanase (EC 3.2.1.-); [inverting] endo-alpha-1,5-L-arabinanase (EC 3.2.1.99); exo-beta-1,3-galactanase (EC 3.2.1.145); beta-D-galactofuranosidase (EC 3.2.1.146) ag Carbon Processing Sugar utilization Glycoside Hydrolase -GH8 GH8 chitosanase (EC 3.2.1.132); cellulase (EC 3.2.1.4); licheninase (EC 3.2.1.73); endo-1,4-beta-xylanase (EC 3.2.1.8); reducing-end-xylose releasing exo-oligoxylanase (EC 3.2.1.156) ag Carbon Processing Sugar utilization Glycoside Hydrolase -GT106 GT106 UDP-beta-L-rhamnose:rhamnogalacturonan I 4-alpha-rhamnosyltransferase (EC 2.4.1.351) ag Carbon Processing Sugar utilization Glycosyl Transferase -GT1 GT1 UDP-glucuronosyltransferase (EC 2.4.1.17); zeatin O-beta-xylosyltransferase (EC 2.4.2.40); 2-hydroxyacylsphingosine 1-beta-galactosyltransferase (EC 2.4.1.45); N-acylsphingosine galactosyltransferase (EC 2.4.1.47); flavonol 3-O-glucosyltransferase (EC 2.4.1.91); anthocyanidin 3-O-glucosyltransferase (EC 2.4.1.115); sinapate 1-glucosyltransferase (EC 2.4.1.120); indole-3-acetate beta-glucosyltransferase (EC 2.4.1.121); flavonol L-rhamnosyltransferase (EC 2.4.1.159); sterol glucosyltransferase (EC 2.4.1.173); UDP-Glc: 4-hydroxybenzoate 4-O-beta-glucosyltransferase (EC 2.4.1.194); zeatin O-beta-glucosyltransferase (EC 2.4.1.203); limonoid glucosyltransferase (EC 2.4.1.210); UDP-GlcA: baicalein 7-O-beta-glucuronosyltransferase (EC 2.4.1.253); UDP-Glc: chalcone 4‚Äö√Ñ√∂‚àö‚Ć‚àö‚àǬ¨¬®¬¨¬¢‚Äö√Ñ√∂‚àö√ë‚àö‚àÇ‚Äö√†√∂‚àö¬∞¬¨¬®¬¨√ܬ¨¬®¬¨¬Æ‚Äö√Ñ√∂‚àö¬¢¬¨√ü-O-beta-glucosyltransferase (EC 2.4.1.286); ecdysteroid UDP-glucosyltransferase (EC 2.4.1.-); salicylic acid beta-glucosyltransferase (EC 2.4.1.-); anthocyanin 3-O-galactosyltransferase (EC 2.4.1.-); anthocyanin 5-O-glucosyltransferase (EC 2.4.1.-); dTDP-beta-2-deoxy-L-fucose: alpha-L-2-deoxyfucosyltransferase (EC 2.4.1.-); UDP-beta-L-rhamnose: alpha-L-rhamnosyltransferase (EC 2.4.1.-); zeaxanthin glucosyltransferase (EC 2.4.1.-); flavone 8-C-glycosyltransferase ag Carbon Processing Sugar utilization Glycosyl Transferase -GT20 GT20 alpha,alpha-trehalose-phosphate synthase [UDP-forming] (EC 2.4.1.15); Glucosylglycerol-phosphate synthase (EC 2.4.1.213); trehalose-6-P phosphatase (EC 3.1.3.12); [retaining] GDP-valeniol: validamine 7-phosphate valeniolyltransferase (EC 2.-.-.-) ag Carbon Processing Sugar utilization Glycosyl Transferase -GT31 GT31 N-acetyllactosaminide beta-1,3-N-acetylglucosaminyltransferase (EC 2.4.1.149); Glycoprotein-N-acetylgalactosamine 3-beta-galactosyltransferase (EC 2.4.1.122); fucose-specific beta-1,3-N-acetylglucosaminyltransferase (EC 2.4.1.-); globotriosylceramide beta-1,3-GalNAc transferase (EC 2.4.1.79); chondroitin synthase (beta-1,3-GlcUA and beta-1,4-GalNAc transferase (EC 2.4.1.175); chondroitin beta-1,3-glucuronyltransferase (EC 2.4.1.226); chondroitin beta-1,4-N-acetylgalactosaminyltransferase (EC 2.4.1.-); UDP-Gal: beta-galactosylxylosylprotein beta-1,3-galactosyltransferase (EC 2.4.1.134); UDP-GlcNAc: O-fucosylpeptide beta-1,3-N-acetylglucosaminyltransferase (EC 2.4.1.222) ag Carbon Processing Sugar utilization Glycosyl Transferase -GT32 GT32 alpha-1,6-mannosyltransferase (EC 2.4.1.-); alpha-1,4-N-acetylglucosaminyltransferase (EC 2.4.1.-); alpha-1,4-N-acetylgalactosaminyltransferase (EC 2.4.1.-); GDP-Man: inositol-phosphorylceramide transferase (EC 2.4.1.-); UDP-Gal: beta-galactoside alpha-1,4-galactosyltransferase (EC 2.4.1.-); UDP-Gal: lactose/N-acetyl-lactosamine alpha-1,4-galactosyltransferase (EC 2.4.1.-); UDP-Glc: protein alpha-glucosyltransferase (EC 2.4.1.-) ag Carbon Processing Sugar utilization Glycosyl Transferase -GT4 GT4 sucrose synthase (EC 2.4.1.13); sucrose-phosphate synthase (EC 2.4.1.14); alpha-glucosyltransferase (EC 2.4.1.52); lipopolysaccharide N-acetylglucosaminyltransferase (EC 2.4.1.56); phosphatidylinositol alpha-mannosyltransferase (EC 2.4.1.57); GDP-Man: Man1GlcNAc2-PP-dolichol alpha-1,3-mannosyltransferase (EC 2.4.1.132); GDP-Man: Man3GlcNAc2-PP-dolichol/Man4GlcNAc2-PP-dolichol alpha-1,2-mannosyltransferase (EC 2.4.1.131); digalactosyldiacylglycerol synthase (EC 2.4.1.141); 1,2-diacylglycerol 3-glucosyltransferase (EC 2.4.1.157); diglucosyl diacylglycerol synthase (EC 2.4.1.208); trehalose phosphorylase (EC 2.4.1.231); NDP-Glc: alpha-glucose alpha-glucosyltransferase / alpha,alpha-trehalose synthase (EC 2.4.1.245); GDP-Man: Man2GlcNAc2-PP-dolichol alpha-1,6-mannosyltransferase (EC 2.4.1.257); UDP-GlcNAc: 2-deoxystreptamine alpha-N-acetylglucosaminyltransferase (EC 2.4.1.283); UDP-GlcNAc: ribostamycin alpha-N-acetylglucosaminyltransferase (EC 2.4.1.285); UDP-Gal alpha-galactosyltransferase (EC 2.4.1.-); UDP-Xyl alpha-xylosyltransferase (EC 2.4.2.-); UDP-GlcA alpha-glucuronyltransferase (EC 2.4.1.-); UDP-Glc alpha-glucosyltransferase (EC 2.4.1.-); UDP-GalNAc: GalNAc-PP-Und alpha-1,3-N-acetylgalactosaminyltransferase (EC 2.4.1.306); UDP-GalNAc: N,N'-diacetylbacillosaminyl-PP-Und alpha-1,3-N-acetylgalactosaminyltransferase (EC 2.4.1.290); ADP-dependent alpha-maltose-1-phosphate synthase (2.4.1.342) ag Carbon Processing Sugar utilization Glycosyl Transferase -GT7 GT7 lactose synthase (EC 2.4.1.22); beta-N-acetylglucosaminyl-glycopeptide beta-1,4-galactosyltransferase (EC 2.4.1.38); N-acetyllactosamine synthase (EC 2.4.1.90); xylosylprotein beta-4-galactosyltransferase (EC 2.4.1.133); UDP-Gal: neolactotriaosylceramide beta-1,4-galactosyltransferase (EC 2.4.1.275); beta-1,4-N-acetylglucosaminyltransferase (EC 2.4.1.-) ag Carbon Processing Sugar utilization Glycosyl Transferase -GT83 GT83 undecaprenyl phosphate-alpha-L-Ara4N: 4-amino-4-deoxy-beta-L-arabinosyltransferase (EC 2.4.2.43); dodecaprenyl phosphate-beta-galacturonic acid: lipopolysaccharide core alpha-galacturonosyl transferase (EC 2.4.1.-) ag Carbon Processing Sugar utilization Glycosyl Transferase -PL27 PL27 L-rhamnose-alpha-1,4-D-glucuronate lyase (EC 4.2.2.-) ag Carbon Processing Sugar utilization Rhamnose -K10108 malE; maltose/maltodextrin transport system substrate-binding protein ag Carbon Processing Sugar utilization Maltose -K10109 malF; maltose/maltodextrin transport system permease protein ag Carbon Processing Sugar utilization Maltose -K10110 malG; maltose/maltodextrin transport system permease protein ag Carbon Processing Sugar utilization Maltose -K10111 malK; maltose/maltodextrin transport system ATP-binding protein [EC:3.6.3.19] ag Carbon Processing Sugar utilization Maltose -K10112 msmX; maltose/maltodextrin transport system ATP-binding protein ag Carbon Processing Sugar utilization Maltose -K10188 lacE; lactose/L-arabinose transport system substrate-binding protein ag Carbon Processing Sugar utilization Lactose -K10189 lacF; lactose/L-arabinose transport system permease protein ag Carbon Processing Sugar utilization Lactose -K10190 lacG; lactose/L-arabinose transport system permease protein ag Carbon Processing Sugar utilization Lactose -K10191 lacK; lactose/L-arabinose transport system ATP-binding protein ag Carbon Processing Sugar utilization Lactose -K10196 ABC.GLC.S; glucose/arabinose transport system substrate-binding protein ag Carbon Processing Sugar utilization Glucose -K10197 ABC.GLC.P; glucose/arabinose transport system permease protein ag Carbon Processing Sugar utilization Glucose -K10198 ABC.GLC.P1; glucose/arabinose transport system permease protein ag Carbon Processing Sugar utilization Glucose -K10199 ABC.GLC.A; glucose/arabinose transport system ATP-binding protein ag Carbon Processing Sugar utilization Glucose -K10236 thuE; trehalose/maltose transport system substrate-binding protein ag Carbon Processing Sugar utilization Trehalose -K10237 thuF; trehalose/maltose transport system permease protein ag Carbon Processing Sugar utilization Trehalose -K10238 thuG; trehalose/maltose transport system permease protein ag Carbon Processing Sugar utilization Trehalose -K10439 rbsB; ribose transport system substrate-binding protein ag Carbon Processing Sugar utilization Ribose -K10440 rbsC; ribose transport system permease protein ag Carbon Processing Sugar utilization Ribose -K10441 rbsA; ribose transport system ATP-binding protein [EC:3.6.3.17] ag Carbon Processing Sugar utilization Ribose -K10543 xylF; D-xylose transport system substrate-binding protein ag Carbon Processing Sugar utilization Xylose -K10544 xylH; D-xylose transport system permease protein ag Carbon Processing Sugar utilization Xylose -K10545 xylG; D-xylose transport system ATP-binding protein [EC:3.6.3.17] ag Carbon Processing Sugar utilization Xylose -K10552 frcB; fructose transport system substrate-binding protein ag Carbon Processing Sugar utilization Fructose -K10553 frcC; fructose transport system permease protein ag Carbon Processing Sugar utilization Fructose -K10554 frcA; fructose transport system ATP-binding protein ag Carbon Processing Sugar utilization Fructose -K10559 rhaS1; rhamnose transport system substrate-binding protein ag Carbon Processing Sugar utilization Rhamnose -K10560 rhaP; rhamnose transport system permease protein ag Carbon Processing Sugar utilization Rhamnose -K10561 rhaQ; rhamnose transport system permease protein ag Carbon Processing Sugar utilization Rhamnose -K10562 rhaT; rhamnose transport system ATP-binding protein [EC:3.6.3.17] ag Carbon Processing Sugar utilization Rhamnose -K02777 PTS-Glc-EIIA; PTS system, glucose-specific IIA component ag Carbon Processing Sugar utilization Glucose -K02778 PTS-Glc-EIIB; PTS system, glucose-specific IIB component ag Carbon Processing Sugar utilization Glucose -K02779 PTS-Glc-EIIC; PTS system, glucose-specific IIC component ag Carbon Processing Sugar utilization Glucose -K02790 PTS-MalGlc-EIIB; PTS system, maltose/glucose-specific IIB component ag Carbon Processing Sugar utilization Maltose -K02791 PTS-MalGlc-EIIC; PTS system, maltose/glucose-specific IIC component ag Carbon Processing Sugar utilization Maltose -K02808 PTS-Scr-EIIA; PTS system, sucrose-specific IIA component ag Carbon Processing Sugar utilization Sucrose -K02809 PTS-Scr-EIIB; PTS system, sucrose-specific IIB component ag Carbon Processing Sugar utilization Sucrose -K02810 PTS-Scr-EIIC; PTS system, sucrose-specific IIC component ag Carbon Processing Sugar utilization Sucrose -K02817 PTS-Tre-EIIA; PTS system, trehalose-specific IIA component ag Carbon Processing Sugar utilization Trehalose -K02818 PTS-Tre-EIIB; PTS system, trehalose-specific IIB component ag Carbon Processing Sugar utilization Trehalose -K02819 PTS-Tre-EIIC; PTS system, trehalose-specific IIC component ag Carbon Processing Sugar utilization Trehalose -K02768 PTS-Fru-EIIA; PTS system, fructose-specific IIA component ag Carbon Processing Sugar utilization Fructose -K02769 PTS-Fru-EIIB; PTS system, fructose-specific IIB component ag Carbon Processing Sugar utilization Fructose -K02770 PTS-Fru-EIIC; PTS system, fructose-specific IIC component ag Carbon Processing Sugar utilization Fructose -K02793 PTS-Man-EIIA; PTS system, mannose-specific IIA component ag Carbon Processing Sugar utilization Mannose -K02786 PTS-Lac-EIIA; PTS system, lactose-specific IIA component ag Carbon Processing Sugar utilization Lactose -K02787 PTS-Lac-EIIB; PTS system, lactose-specific IIB component ag Carbon Processing Sugar utilization Lactose -K02788 PTS-Lac-EIIC; PTS system, lactose-specific IIC component ag Carbon Processing Sugar utilization Lactose -K11194 PTS-Fru1-EIIA; PTS system, fructose-specific IIA component ag Carbon Processing Sugar utilization Fructose -K11195 PTS-Fru1-EIIB; PTS system, fructose-specific IIB component ag Carbon Processing Sugar utilization Fructose -K11196 PTS-Fru1-EIIC; PTS system, fructose-specific IIC component ag Carbon Processing Sugar utilization Fructose -K02771 PTS-Fru1-EIID; PTS system, fructose-specific IID component ag Carbon Processing Sugar utilization Fructose -K11201 PTS-Fru2-EIIA; PTS system, fructose-specific IIA-like component ag Carbon Processing Sugar utilization Fructose -K11202 PTS-Fru2-EIIB; PTS system, fructose-specific IIB-like component ag Carbon Processing Sugar utilization Fructose -K11203 PTS-Fru2-EIIC; PTS system, fructose-specific IIC-like component ag Carbon Processing Sugar utilization Fructose -K17311 K17311; trehalose transport system substrate-binding protein ag Carbon Processing Sugar utilization Trehalose -K17312 K17312; trehalose transport system permease protein ag Carbon Processing Sugar utilization Trehalose -K17313 treU; trehalose transport system permease protein ag Carbon Processing Sugar utilization Trehalose -K17314 treV; trehalose transport system ATP-binding protein ag Carbon Processing Sugar utilization Trehalose -K17315 gtsA; glucose/mannose transport system substrate-binding protein ag Carbon Processing Sugar utilization Glucose -K17316 gtsB; glucose/mannose transport system permease protein ag Carbon Processing Sugar utilization Glucose -K17317 gtsC; glucose/mannose transport system permease protein ag Carbon Processing Sugar utilization Glucose -K19506 PTS-Gfr-EIIA; PTS system, fructoselysine/glucoselysine-specific IIA component ag Carbon Processing Sugar utilization Fructose -K19507 PTS-Gfr-EIIB; PTS system, fructoselysine/glucoselysine-specific IIB component ag Carbon Processing Sugar utilization Fructose -K19508 PTS-Gfr-EIIC; PTS system, fructoselysine/glucoselysine-specific IIC component ag Carbon Processing Sugar utilization Fructose -K19509 PTS-Gfr-EIID; PTS system, fructoselysine/glucoselysine-specific IID component ag Carbon Processing Sugar utilization Fructose -K20107 PTS-Mal-EIIB; PTS system, maltose-specific IIB component ag Carbon Processing Sugar utilization Maltose -K20108 PTS-Mal-EIIC; PTS system, maltose-specific IIC component ag Carbon Processing Sugar utilization Maltose -K20112 PTS-Gal-EIIA; PTS system, galactose-specific IIA component ag Carbon Processing Sugar utilization Galactose -K20113 PTS-Gal-EIIB; PTS system, galactose-specific IIB component ag Carbon Processing Sugar utilization Galactose -K20114 PTS-Gal-EIIC; PTS system, galactose-specific IIC component ag Carbon Processing Sugar utilization Galactose -K20116 PTS-Glc1-EIIA; PTS system, glucose-specific IIA component ag Carbon Processing Sugar utilization Glucose -K20117 PTS-Glc1-EIIB; PTS system, glucose-specific IIB component ag Carbon Processing Sugar utilization Glucose -K20118 PTS-Glc1-EIIC; PTS system, glucose-specific IIC component ag Carbon Processing Sugar utilization Glucose -K01812 glucuronate isomerase ag Carbon Processing Sugar utilization Galacturonic Acid -K00041 tagaturonate reductase ag Carbon Processing Sugar utilization Galacturonic Acid -K01685 altronate hydrolase ag Carbon Processing Sugar utilization Galacturonic Acid -K16849 altronate dehydratase small subunit ag Carbon Processing Sugar utilization Galacturonic Acid -K16850 altronate dehydratase large subunit ag Carbon Processing Sugar utilization Galacturonic Acid -K00874 2-dehydro-3-deoxygluconokinase ag Carbon Processing Sugar utilization Galacturonic Acid -K01190 beta-galactosidase ag Carbon Processing Sugar utilization Lactose -K12111 evolved beta-galactosidase subunit alpha ag Carbon Processing Sugar utilization Lactose -K12112 evolved beta-galactosidase subunit beta ag Carbon Processing Sugar utilization Lactose -K12309 beta-galactosidase ag Carbon Processing Sugar utilization Lactose -K01203 sucrase-isomaltase ag Carbon Processing Sugar utilization Sucrose -K12047 maltase-glucoamylase ag Carbon Processing Sugar utilization Sucrose -K00690 sucrose phosphorylase ag Carbon Processing Sugar utilization Sucrose -K01809 mannose-6-phosphate isomerase ag Carbon Processing Sugar utilization Mannose -K14273 D-xylose 1-dehydrogenase (NADP+) ag Carbon Processing Sugar utilization Xylose -GH172 difructose-anhydride-I synthase (EC 4.2.1.179 (old 3.2.1.134)); alpha-D-Arabinofuranosidase (EC 3.2.1.-); alpha-D-Fructofuranosidase (EC 3.2.1.-) ag Carbon Processing Sugar utilization Fructose -PL42 L-rhamnose-_-1,4-D-glucuronate lyase (EC 4.2.2.-); L-Rh_-_-1,4-GlcA _-L-rhamnohydrolase (EC 3.2.1.-) ag Carbon Processing Sugar utilization Rhamnose -CBM88 Binding to terminal galactose in galactoxyloglucan and galactomannan ag Carbon Processing Sugar utilization Galactose -K01188 beta-glucosidase [EC:3.2.1.21] Hydrolysis of terminal β-D-glucosyl residues (from cellulose) ag Enzyme Assay Analogs Hydrolytic Enzymes -K05349 beta-glucosidase [EC:3.2.1.21] Hydrolysis of terminal β-D-glucosyl residues (from cellulose) ag Enzyme Assay Analogs Hydrolytic Enzymes -K05350 beta-glucosidase [EC:3.2.1.21] Hydrolysis of terminal β-D-glucosyl residues (from cellulose) ag Enzyme Assay Analogs Hydrolytic Enzymes -K01198 xylan 1,4-beta-xylosidase [EC:3.2.1.37] Hydrolysis of β-D-xylose residues ag Enzyme Assay Analogs Hydrolytic Enzymes -K15920 xylan 1,4-beta-xylosidase [EC:3.2.1.37] Hydrolysis of β-D-xylose residues ag Enzyme Assay Analogs Hydrolytic Enzymes -K22268 xylan 1,4-beta-xylosidase [EC:3.2.1.37] Hydrolysis of β-D-xylose residues ag Enzyme Assay Analogs Hydrolytic Enzymes -K01130 arylsulfatase [EC:3.1.6.1] Hydrolysis of aromatic sulfate esters ag Enzyme Assay Analogs Hydrolytic Enzymes -K01227 mannosyl-glycoprotein endo-beta-N-acetylglucosaminidase [EC:3.2.1.96] Hydrolysis of chitin N-acetyl-β-D-glucosaminide ag Enzyme Assay Analogs Hydrolytic Enzymes -K13714 bifunctional autolysin [EC:3.2.1.96] Hydrolysis of chitin N-acetyl-β-D-glucosaminide ag Enzyme Assay Analogs Hydrolytic Enzymes -K23989 mannosyl-glycoprotein endo-beta-N-acetylglucosaminidase [EC:3.2.1.96] Hydrolysis of chitin N-acetyl-β-D-glucosaminide ag Enzyme Assay Analogs Hydrolytic Enzymes -K01078 acid phosphatase [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes -K01093 4-phytase / acid phosphatase [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes -K03788 acid phosphatase (class B) [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes -K09474 acid phosphatase (class A) [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes -K14379 tartrate-resistant acid phosphatase type 5 [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes -K14394 low molecular weight phosphotyrosine protein phosphatase [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes -K14395 lysophosphatidic acid phosphatase type 6 [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes -K14410 lysosomal acid phosphatase [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes -K19283 prostatic acid phosphatase [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes -K19284 testicular acid phosphatase [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes -K23458 repressible acid phosphatase [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes -K01255 leucyl aminopeptidase [EC:3.4.11.1] Breakdown of leucine residues at the N-terminus of peptides ag Enzyme Assay Analogs Hydrolytic Enzymes -K11142 cytosol aminopeptidase [EC:3.4.11.1] Breakdown of leucine residues at the N-terminus of peptides ag Enzyme Assay Analogs Hydrolytic Enzymes -K01225 cellulose 1,4-beta-cellobiosidase [EC:3.2.1.91] Hydrolysis of β-D-glucosyl linkages (from cellulose) ag Enzyme Assay Analogs Hydrolytic Enzymes -K19668 cellulose 1,4-beta-cellobiosidase [EC:3.2.1.91] Hydrolysis of β-D-glucosyl linkages (from cellulose) ag Enzyme Assay Analogs Hydrolytic Enzymes -K01187 alpha-glucosidase [EC:3.2.1.20] Hydrolysis of α-D-glucosyl linkages (starch, maltose, sucrose) ag Enzyme Assay Analogs Hydrolytic Enzymes -K12047 maltase-glucoamylase [EC:3.2.1.20] Hydrolysis of α-D-glucosyl linkages (starch, maltose, sucrose) ag Enzyme Assay Analogs Hydrolytic Enzymes -K12316 lysosomal alpha-glucosidase [EC:3.2.1.20] Hydrolysis of α-D-glucosyl linkages (starch, maltose, sucrose) ag Enzyme Assay Analogs Hydrolytic Enzymes -K12317 neutral alpha-glucosidase C [EC:3.2.1.20] Hydrolysis of α-D-glucosyl linkages (starch, maltose, sucrose) ag Enzyme Assay Analogs Hydrolytic Enzymes -K05910 NADH peroxidase [EC:1.11.1.-] Use of peroxide as electron acceptor to depolymerize lignin ag Enzyme Assay Analogs Oxidative Enzymes -K00421 laccase [EC:1.10.3.2] Oxidation of aromatic rings in phenolics ag Enzyme Assay Analogs Oxidative Enzymes -K05909 laccase [EC:1.10.3.2] Oxidation of aromatic rings in phenolics ag Enzyme Assay Analogs Oxidative Enzymes \ No newline at end of file +K04103 ipdC [EC:4.1.1.74] Indole-3-pyruvate → IAA ag Rhizosphere Transformations Auxin (IAA) +K00466 iaaM [EC:1.13.12.3] Tryptophan → IAM → IAA ag Rhizosphere Transformations Auxin (IAA) +K21801  iaaH [EC:3.5.1.4] Tryptophan → IAM → IAA ag Rhizosphere Transformations Auxin (IAA) +K01426 amiE [EC:3.5.1.4] IAM → IAA ag Rhizosphere Transformations Auxin (IAA) +K03397 iaaL [EC:6.3.2.20] Conjugates IAA → IAA-Lys (inactivation) ag Rhizosphere Transformations Auxin (IAA) +K10760 ipt [EC:2.5.1.112] Isopentenyl-AMP → cytokinins ag Rhizosphere Transformations Cytokinins +K00279 ckx [EC:1.5.99.12] Cytokinin degradation ag Rhizosphere Transformations Cytokinins +K04121 ks [EC:4.2.3.19] ent-kaurene synthase (ent-copalyl diphosphate → ent-kaurene; early GA biosynthesis) ag Rhizosphere Transformations Gibberellins +K20657  cps/ks [EC:5.5.1.13] ent-copalyl diphosphate / ent-kaurene synthase (bifunctional) ag Rhizosphere Transformations Gibberellins +K27636 cps/ks [EC:4.2.3.19] ent-copalyl diphosphate / ent-kaurene / ent-beyerene synthase ag Rhizosphere Transformations Gibberellins +K21719  cyp701A [EC:1.14.14.86] ent-Kaurene → GA intermediates ag Rhizosphere Transformations Gibberellins +K04123    cyp88A [EC:1.14.13.79] ent-Kaurenoic acid → GA12 ag Rhizosphere Transformations Gibberellins +K01505 acdS [EC:3.5.99.7] ACC → α-ketobutyrate + NH3 ag Rhizosphere Transformations ACC Deaminase +K21815  efe [EC:1.13.12.19] L-arginine → ethylene ag Rhizosphere Transformations AA Derivatives +K09840 abaA-like [EC:1.13.11.51] Mevalonate pathway → ABA ag Rhizosphere Transformations AA Derivatives +K09843 cyp707A-like [EC:1.14.13.93] ABA → phaseic acid ag Rhizosphere Transformations AA Derivatives +K01851 pchA [EC:5.4.4.2] Chorismate → salicylic acid ag Rhizosphere Transformations Phenolics +K04781 pchB [EC:4.2.99.21] Chorismate → salicylic acid ag Rhizosphere Transformations Phenolics +K00480 nahG [EC:1.14.13.1] Salicylic acid → catechol ag Rhizosphere Transformations Phenolics +K00454 lox [EC:1.13.11.12] Linolenic acid → hydroperoxides ag Rhizosphere Transformations AA Derivatives +K01723  aos [EC:4.2.1.92] Hydroperoxides → OPDA ag Rhizosphere Transformations AA Derivatives +K09591 det2-like [EC:1.3.1.-] Steroid metabolism → brassinolide-like compounds ag Rhizosphere Transformations AA Derivatives +K09587  dwrf [EC:1.14.-.-] Steroid metabolism → brassinolide-like compounds ag Rhizosphere Transformations AA Derivatives +K22944   cyaA [EC:4.6.1.1] ATP → cAMP (adenylate cyclase) ag Rhizosphere Transformations Nucleotides/Sides +K01769 gya [EC:4.6.1.2] GTP → cGMP (guanylate cyclase ag Rhizosphere Transformations Nucleotides/Sides +K00108 betA; choline dehydrogenase (EC 1.1.99.1) Glycine betaine biosynthesis from choline ag Stressors Methyl-related Compatible Solutes +K00130 betB; betaine-aldehyde dehydrogenase (EC 1.2.1.8) Glycine betaine biosynthesis from betaine-aldehyde ag Stressors Methyl-related Compatible Solutes +K02000 proV; glycine-betaine/proline transport system ATP-binding protein Glycine betaine/proline transport ag Stressors Methyl-related Compatible Solutes +K02001 proW; glycine-betaine/proline transport system permease protein Glycine betaine/proline transport ag Stressors Methyl-related Compatible Solutes +K02002 proX; glycine-betaine/proline transport system substrate-binding protein Glycine betaine/proline transport ag Stressors Methyl-related Compatible Solutes +K02168 betP; choline/glycine/proline betaine transport protein Glycine betaine/choline/proline transport ag Stressors Methyl-related Compatible Solutes +K03451 betT/BCCT; choline/carnitine/betaine/glycine transporter Choline/betaine transport (BCCT family) ag Stressors Methyl-related Compatible Solutes +K03607 proQ; ProP effector (proline/betaine regulation) Regulation of proline/betaine transport (ProP system) ag Stressors Methyl-related Compatible Solutes +K03762 proP; MFS transporter for proline/betaine Proline/betaine transport (ProP system) ag Stressors Methyl-related Compatible Solutes +K05020 opuD; glycine-betaine transporter Glycine betaine uptake ag Stressors Methyl-related Compatible Solutes +K05245 caiT; L-carnitine/gamma-butyrobetaine antiporter L-carnitine transport (osmoprotectant role) ag Stressors Methyl-related Compatible Solutes +K05845 opuC; osmoprotectant transport system substrate-binding protein Osmoprotectant transport (OpuC system) ag Stressors Methyl-related Compatible Solutes +K05846 opuBD; osmoprotectant transport system permease protein Osmoprotectant transport (OpuC system) ag Stressors Methyl-related Compatible Solutes +K05847 opuA; osmoprotectant transport system ATP-binding protein Osmoprotectant transport (OpuC system) ag Stressors Methyl-related Compatible Solutes +K10036 glnH; glutamine transport system substrate-binding protein Glutamine transport (osmotic adjustment role) ag Stressors Methyl-related Compatible Solutes +K10037 glnP; glutamine transport system permease protein Glutamine transport (osmotic adjustment role) ag Stressors Methyl-related Compatible Solutes +K10038 glnQ; glutamine transport system ATP-binding protein Glutamine transport (osmotic adjustment role) ag Stressors Methyl-related Compatible Solutes +K11440 betA; choline dehydrogenase (alternate) Glycine betaine biosynthesis from choline ag Stressors Methyl-related Compatible Solutes +K18896 gsmT; glycine/sarcosine N-methyltransferase Glycine → sarcosine → dimethylglycine synthesis ag Stressors Methyl-related Compatible Solutes +K18897 dmt; sarcosine/dimethylglycine N-methyltransferase Dimethylglycine → betaine synthesis ag Stressors Methyl-related Compatible Solutes +K00697 otsA (EC 2.4.1.15) Trehalose biosynthesis ag Stressors Sugar Compatible Solutes (Trehalose) +K01087 otsB (EC 3.1.3.12) Trehalose biosynthesis ag Stressors Sugar Compatible Solutes (Trehalose) +K01236 treZ (EC 3.2.1.141) Trehalose biosynthesis ag Stressors Sugar Compatible Solutes (Trehalose) +K06044 treY (EC 5.4.99.15) Trehalose biosynthesis ag Stressors Sugar Compatible Solutes (Trehalose) +K05342 treP (EC 2.4.1.64) Trehalose metabolism ag Stressors Sugar Compatible Solutes (Trehalose) +K05343 treS (EC 5.4.99.16) Trehalose metabolism ag Stressors Sugar Compatible Solutes (Trehalose) +K00009 mtlD (EC 1.1.1.17) Mannitol biosynthesis ag Stressors Sugar Compatible Solutes (Mannitol) +K02798 mtlA Mannitol transport ag Stressors Sugar Compatible Solutes (Mannitol) +K05947 mpgS (EC 2.4.1.217) Mannosyl-3-phosphoglycerate biosynthesis ag Stressors Sugar Compatible Solutes (Mannosyl glycerate) +K17314 treV Trehalose transport ag Stressors Sugar Compatible Solutes (Trehalose) +K02781 srlA; sorbitol transporter subunit II A Sorbitol transport ag Stressors Sugar Compatible Solutes (Sorbitol) +K02782 srlB; sorbitol transporter subunit II B Sorbitol transport ag Stressors Sugar Compatible Solutes (Sorbitol) +K02783 srlE; sorbitol transporter subunit II E Sorbitol transport ag Stressors Sugar Compatible Solutes (Sorbitol) +K10109 malF; maltose transport system permease protein Maltose transport ag Stressors Sugar Compatible Solutes (Maltose) +K10110 malG; maltose transport system permease protein Maltose transport ag Stressors Sugar Compatible Solutes (Maltose) +K10111 malK; maltose/maltodextrin transport system ATP-binding protein Maltose transport ag Stressors Sugar Compatible Solutes (Maltose) +K10227 smoE; sorbitol/mannitol transport system substrate-binding protein Sorbitol/mannitol transport ag Stressors Sugar Compatible Solutes (Sorbitol / Mannitol) +K10228 smoF; sorbitol/mannitol transport system permease protein Sorbitol/mannitol transport ag Stressors Sugar Compatible Solutes (Sorbitol / Mannitol) +K10229 sorbitol/mannitol transport system permease protein Sorbitol/mannitol transport ag Stressors Sugar Compatible Solutes (Sorbitol / Mannitol) +K10230 sorbitol/mannitol transport system ATP-binding protein Sorbitol/mannitol transport ag Stressors Sugar Compatible Solutes (Sorbitol / Mannitol) +K03782 katG [EC:1.11.1.21] Catalase–peroxidase ag Stressors +K04564 sodA [EC:1.15.1.1] Superoxide dismutase (Mn-dependent) ag Stressors +K04565 sodB [EC:1.15.1.1] Superoxide dismutase (Fe-dependent) ag Stressors +K01920 gshA [EC:6.3.2.2] Glutamate–cysteine ligase (first step in glutathione biosynthesis) ag Stressors +K01921 gshB [EC:6.3.2.3] Glutathione synthase (second step in glutathione biosynthesis) ag Stressors +K05909 mco [EC:1.10.3.2] Multicopper oxidase (laccase; oxidizes phenolics, triazines, and aromatics) ag Stressors +K00421 lcc [EC:1.10.3.2] Laccase (multicopper oxidase; lignin and aromatic oxidation) ag Stressors +K05910 npr [EC:1.11.1.1] NADH peroxidase (reduces hydrogen peroxide via NADH) ag Stressors +K00431 lip [EC:1.11.1.14] Lignin peroxidase (oxidizes lignin and aromatic compounds via H₂O₂) ag Stressors +K00799 gst [EC:2.5.1.18] Glutathione S-transferase (conjugates glutathione to xenobiotics for detoxification) ag Stressors +K00697 otsA [EC:2.4.1.15] Trehalose-6-phosphate synthase (trehalose biosynthesis) ag Stressors +K01087 otsB [EC:3.1.3.12] Trehalose-6-phosphate phosphatase (trehalose biosynthesis) ag Stressors +K00147 proA [EC:1.2.1.41] γ-Glutamyl phosphate reductase (proline biosynthesis) ag Stressors +K00931 proB [EC:2.7.2.11] Glutamate 5-kinase (proline biosynthesis) ag Stressors +K00286 proC [EC:1.5.1.2] Pyrroline-5-carboxylate reductase (proline biosynthesis) ag Stressors +K00006 gpd1 [EC:1.1.1.8] Glycerol-3-phosphate dehydrogenase (NAD⁺-dependent) ag Stressors +K00111 gpd2 [EC:1.1.5.3] Glycerol-3-phosphate dehydrogenase (quinone-dependent) ag Stressors +K00108 betA [EC:1.1.99.1] Choline dehydrogenase (glycine betaine biosynthesis) ag Stressors +K00130 betB [EC:1.2.1.8] Betaine aldehyde dehydrogenase (glycine betaine biosynthesis) ag Stressors +K16566 exoY Exopolysaccharide production protein ExoY (succinoglycan) ag Stressors Exopolysaccharide Production +K16557 exoA Succinoglycan biosynthesis glycosyltransferase ag Stressors Exopolysaccharide Production +K16556 exoM Succinoglycan biosynthesis mannosyltransferase ag Stressors Exopolysaccharide Production +K16555 exoO Succinoglycan biosynthesis protein ag Stressors Exopolysaccharide Production +K19290 alg8 Mannuronan synthase (alginate biosynthesis) ag Stressors Exopolysaccharide Production +K19291 alg44 Mannuronan polymer co-polymerase (alginate biosynthesis) ag Stressors Exopolysaccharide Production +K19293 algX Alginate biosynthesis protein ag Stressors Exopolysaccharide Production +K19295 algJ Alginate O-acetyltransferase complex protein ag Stressors Exopolysaccharide Production +K20997 pslA Psl polysaccharide biosynthesis protein ag Stressors Exopolysaccharide Production +K21001 pslH Psl polysaccharide biosynthesis protein ag Stressors Exopolysaccharide Production +K21154 pssM Exopolysaccharide glucosyl ketal-pyruvate-transferase ag Stressors Exopolysaccharide Production +K25902 pssA Acidic exopolysaccharide biosynthesis protein ag Stressors Exopolysaccharide Production +K25904 pssE Exopolysaccharide biosynthesis glucuronosyltransferase ag Stressors Exopolysaccharide Production +K25906 pssS Exopolysaccharide biosynthesis glucosyltransferase ag Stressors Exopolysaccharide Production +K19290 alg8 Mannuronan synthase (alginate biosynthesis) ag Stressors Biofilm Formation +K19291 alg44 Mannuronan co-polymerase (alginate biosynthesis) ag Stressors Biofilm Formation +K19293 algX Alginate biosynthesis protein AlgX ag Stressors Biofilm Formation +K19294 algI Alginate O-acetyltransferase complex protein AlgI ag Stressors Biofilm Formation +K19295 algJ Alginate O-acetyltransferase complex protein AlgJ ag Stressors Biofilm Formation +K19296 algF Alginate O-acetyltransferase complex protein AlgF ag Stressors Biofilm Formation +K11936 pgaC / icaA Poly-β-1,6-N-acetyl-D-glucosamine synthase (PGA/ICA matrix) ag Stressors Biofilm Formation +K11937 pgaD Biofilm PGA synthesis protein ag Stressors Biofilm Formation +K21001 pslH Psl polysaccharide biosynthesis protein ag Stressors Biofilm Formation +K20997 pslA Psl polysaccharide biosynthesis protein ag Stressors Biofilm Formation +K25205 pslC Psl polysaccharide biosynthesis protein ag Stressors Biofilm Formation +K21461 icaD Poly-β-1,6-N-acetyl-D-glucosamine synthesis protein ag Stressors Biofilm Formation +K01045 opd/mpd/pah/ophC2 [EC:3.1.8.1] Carbamates ag Stressors Pesticides +K14449 mcd [EC:3.1.1.88] Carbamates ag Stressors Pesticides +K25604 cehA [EC:3.5.1.137] Triazines ag Stressors Pesticides +K05394  atzA [EC:3.8.1.8] Triazines ag Stressors Pesticides +K03382 atzB [EC:3.5.99.3] Triazines ag Stressors Pesticides +K08710 atzC [EC:3.5.99.4] Triazines ag Stressors Pesticides +K05394 trzN [EC:3.8.1.8] Organochlorines ag Stressors Pesticides +K15236  linA [EC:4.5.1.-] Organochlorines ag Stressors Pesticides +K01563 linB [EC:3.8.1.5] Organochlorines ag Stressors Pesticides +K15237 "linC [EC:1.3.1.-] " Phenoxy herbicides ag Stressors Pesticides +K06912 tfdA [EC:1.14.11.-] Phenoxy herbicides ag Stressors Pesticides +K08719 tfdB [EC:1.14.13.2] Pyrethroids ag Stressors Pesticides +K08722 tfdF [EC:5.5.1.5] Pyrethroids ag Stressors Pesticides +K20992 pytH [EC:3.1.1.-] Pyrethroids ag Stressors Pesticides +K20993 estP [EC:3.1.1.88] Glyphosate ag Stressors Pesticides +K17842 gox [EC:1.13.11.59] Glyphosate ag Stressors Pesticides +K23996 phnY [EC:1.14.11.71] Methylphosphonate hydroxylase (oxidizes methylphosphonate to phosphate intermediates) ag Stressors Pesticides +K06164 phnI [EC:2.7.8.37] Alpha-D-ribose-1-methylphosphonate-5-triphosphate synthase subunit (C–P lyase complex) ag Stressors Pesticides +K06165 phnH [EC:2.7.8.37] Alpha-D-ribose-1-methylphosphonate-5-triphosphate synthase subunit (C–P lyase complex) ag Stressors Pesticides +K06166 phnG [EC:2.7.8.37] Alpha-D-ribose-1-methylphosphonate-5-triphosphate synthase subunit (C–P lyase complex) ag Stressors Pesticides +K05780 phnL [EC:2.7.8.37] Alpha-D-ribose-1-methylphosphonate-5-triphosphate synthase subunit (C–P lyase complex) ag Stressors Pesticides +K06162 phnM [EC:3.6.1.63] Alpha-D-ribose-1-methylphosphonate-5-triphosphate diphosphatase (hydrolyzes phosphonate intermediates) ag Stressors Pesticides +K06163 phnJ [EC:4.7.1.1] C–P lyase catalytic subunit (cleaves C–P bond in phosphonates including glyphosate) ag Stressors Pesticides +K06167 phnP [EC:3.1.4.55] Phosphoribosyl-1,2-cyclic phosphate phosphodiesterase (final phosphonate degradation step) ag Stressors Pesticides +K01560  Haloacid dehalogenases [EC:3.8.1.2] Broad (various pesticides) ag Stressors Pesticides +K03930 estA [EC:3.1.1.1] Carboxylesterase (broad-spectrum hydrolase acting on xenobiotic organoesters and pesticides) ag Stressors Pesticides +K00163 pyruvate dehydrogenase E1 component [EC:1.2.4.1] pyruvate → acetyl-CoA v1 ag Carbon Processing SCFA and alcohol conversions +K00174 2-oxoglutarate/2-oxoacid ferredoxin oxidoreductase subunit alpha [EC:1.2.7.3, 1.2.7.11] pyruvate → acetyl-CoA v2 ag Carbon Processing SCFA and alcohol conversions +K00656 formate C-acetyltransferase [EC:2.3.1.54] pyruvate → acetyl-CoA + formate v3 ag Carbon Processing SCFA and alcohol conversions +K00625 phosphate acetyltransferase [EC:2.3.1.8] [RN:R00230] acetate, pt 1 ag Carbon Processing SCFA and alcohol conversions +K00925 acetate kinase [EC:2.7.2.1] [RN:R00315] acetate, pt 1 ag Carbon Processing SCFA and alcohol conversions +K01905 acetate-CoA ligase (ADP-forming) subunit alpha acetate, pt 2 ag Carbon Processing SCFA and alcohol conversions +K01067 acetyl-CoA hydrolase [EC:3.1.2.1] acetate, pt 3 ag Carbon Processing SCFA and alcohol conversions +K00016 L-lactate dehydrogenase [EC:1.1.1.27] lactate (L) ag Carbon Processing SCFA and alcohol conversions +K00101 L-lactate dehydrogenase (cytochrome) [EC:1.1.2.3] lactate (L) ag Carbon Processing SCFA and alcohol conversions +K03778 D-lactate dehydrogenase [EC:1.1.1.28] lactate (D) ag Carbon Processing SCFA and alcohol conversions +K03777 D-lactate dehydrogenase (quinone/cytochrome variants) [EC:1.1.5.12, EC:1.1.2.4] lactate (D) ag Carbon Processing SCFA and alcohol conversions +K00634 phosphate butyryltransferase [EC:2.3.1.19] butyrate, pt 1 ag Carbon Processing SCFA and alcohol conversions +K00929 butyrate kinase [EC:2.7.2.7] butyrate, pt 2 ag Carbon Processing SCFA and alcohol conversions +K01896 medium-chain acyl-CoA synthetase [EC:6.2.1.2] butyrate, pt 2 ag Carbon Processing SCFA and alcohol conversions +K19697 propionate kinase [EC:2.7.2.15] propionate, pt 1 ag Carbon Processing SCFA and alcohol conversions +K01026 propionate CoA-transferase [EC:2.8.3.1] propionate, pt 2 ag Carbon Processing SCFA and alcohol conversions +K00001 alcohol dehydrogenase [EC:1.1.1.1] alcohol production ag Carbon Processing SCFA and alcohol conversions +K00121 alcohol dehydrogenase [EC:1.1.1.1] alcohol production ag Carbon Processing SCFA and alcohol conversions +K04072 alcohol dehydrogenase [EC:1.1.1.1] alcohol production ag Carbon Processing SCFA and alcohol conversions +K13951 alcohol dehydrogenase [EC:1.1.1.1] alcohol production ag Carbon Processing SCFA and alcohol conversions +K13952 alcohol dehydrogenase [EC:1.1.1.1] alcohol production ag Carbon Processing SCFA and alcohol conversions +K13953 alcohol dehydrogenase [EC:1.1.1.1] alcohol production ag Carbon Processing SCFA and alcohol conversions +K13954 alcohol dehydrogenase [EC:1.1.1.1] alcohol production ag Carbon Processing SCFA and alcohol conversions +K13980 alcohol dehydrogenase [EC:1.1.1.1] alcohol production ag Carbon Processing SCFA and alcohol conversions +K18857 alcohol dehydrogenase [EC:1.1.1.1] alcohol production ag Carbon Processing SCFA and alcohol conversions +K00192 cdhA; anaerobic carbon-monoxide dehydrogenase, CODH/ACS complex subunit alpha [EC:1.2.7.4] [RN:R07157] Acetyl-CoA pathway, CO2 => acetyl-CoA ag Carbon Processing CO2 Fixation +K00195 cdhB; anaerobic carbon-monoxide dehydrogenase, CODH/ACS complex subunit epsilon [RN:R07157] Acetyl-CoA pathway, CO2 => acetyl-CoA ag Carbon Processing CO2 Fixation +K00193 cdhC; acetyl-CoA decarbonylase/synthase, CODH/ACS complex subunit beta [EC:2.3.1.169] [RN:R09096 R10219] Acetyl-CoA pathway, CO2 => acetyl-CoA ag Carbon Processing CO2 Fixation +K00197 cdhE; acetyl-CoA decarbonylase/synthase, CODH/ACS complex subunit gamma [EC:2.1.1.245] [RN:R09096 R10219] Acetyl-CoA pathway, CO2 => acetyl-CoA ag Carbon Processing CO2 Fixation +K00194 cdhD; acetyl-CoA decarbonylase/synthase, CODH/ACS complex subunit delta [EC:2.1.1.245] [RN:R09096 R10219] Acetyl-CoA pathway, CO2 => acetyl-CoA ag Carbon Processing CO2 Fixation +K10944 particulate methane monooxygenase subunit A (pmoA) [EC:1.14.18.3] Methane oxidation = methane => methanol ag Carbon Processing CH4 oxidation +K10945 particulate methane monooxygenase subunit B (pmoB) [EC:1.14.18.3] Methane oxidation = methane => methanol ag Carbon Processing CH4 oxidation +K10946 particulate methane monooxygenase subunit C (pmoC) [EC:1.14.18.3] Methane oxidation = methane => methanol ag Carbon Processing CH4 oxidation +K16157 soluble methane monooxygenase hydroxylase alpha subunit (mmoX) [EC:1.14.13.25] Methane oxidation = methane => methanol ag Carbon Processing CH4 oxidation +K16158 soluble methane monooxygenase hydroxylase beta subunit (mmoY) [EC:1.14.13.25] Methane oxidation = methane => methanol ag Carbon Processing CH4 oxidation +K16159 soluble methane monooxygenase hydroxylase gamma subunit (mmoZ) [EC:1.14.13.25] Methane oxidation = methane => methanol ag Carbon Processing CH4 oxidation +K16160 soluble methane monooxygenase component B (mmoB) [EC:1.14.13.25] Methane oxidation = methane => methanol ag Carbon Processing CH4 oxidation +K16161 soluble methane monooxygenase reductase component (mmoC) [EC:1.14.13.25] Methane oxidation = methane => methanol ag Carbon Processing CH4 oxidation +K16162 soluble methane monooxygenase regulatory protein (mmoD) [EC:1.14.13.25] Methane oxidation = methane => methanol ag Carbon Processing CH4 oxidation +GH94 GH94 cellobiose phosphorylase (EC 2.4.1.20); laminaribiose phosphorylase (EC 2.4.1.31); cellodextrin phosphorylase (EC 2.4.1.49); chitobiose phosphorylase (EC 2.4.1.-); cyclic beta-1,2-glucan synthase (EC 2.4.1.-); cellobionic acid phosphorylase (EC 2.4.1.321); beta-1,2-oligoglucan phosphorylase (EC 2.4.1.-) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY +GH1 GH1 beta-glucosidase (EC 3.2.1.21); beta-galactosidase (EC 3.2.1.23); beta-mannosidase (EC 3.2.1.25); beta-glucuronidase (EC 3.2.1.31); beta-xylosidase (EC 3.2.1.37); beta-D-fucosidase (EC 3.2.1.38); phlorizin hydrolase (EC 3.2.1.62); exo-beta-1,4-glucanase (EC 3.2.1.74); 6-phospho-beta-galactosidase (EC 3.2.1.85); 6-phospho-beta-glucosidase (EC 3.2.1.86); strictosidine beta-glucosidase (EC 3.2.1.105); lactase (EC 3.2.1.108); amygdalin beta-glucosidase (EC 3.2.1.117); prunasin beta-glucosidase (EC 3.2.1.118); vicianin hydrolase (EC 3.2.1.119); raucaffricine beta-glucosidase (EC 3.2.1.125); thioglucosidase (EC 3.2.1.147); beta-primeverosidase (EC 3.2.1.149); isoflavonoid 7-O-beta-apiosyl-beta-glucosidase (EC 3.2.1.161); ABA-specific beta-glucosidase (EC 3.2.1.175); DIMBOA beta-glucosidase (EC 3.2.1.182); beta-glycosidase (EC 3.2.1.-); hydroxyisourate hydrolase (EC 3.-.-.-) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY +GH2 GH2 beta-galactosidase (EC 3.2.1.23) ; beta-mannosidase (EC 3.2.1.25); beta-glucuronidase (EC 3.2.1.31); alpha-L-arabinofuranosidase (EC 3.2.1.55); mannosylglycoprotein endo-beta-mannosidase (EC 3.2.1.152); exo-beta-glucosaminidase (EC 3.2.1.165); alpha-L-arabinopyranosidase (EC 3.2.1.-); beta-galacturonidase (EC 3.2.1.-); beta-xylosidase (EC 3.2.1.37); beta-D-galactofuranosidase (EC 3.2.1.146); Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY +GH3 GH3 beta-glucosidase (EC 3.2.1.21); xylan 1,4-beta-xylosidase (EC 3.2.1.37); beta-glucosylceramidase (EC 3.2.1.45); beta-N-acetylhexosaminidase (EC 3.2.1.52); alpha-L-arabinofuranosidase (EC 3.2.1.55); glucan 1,3-beta-glucosidase (EC 3.2.1.58); glucan 1,4-beta-glucosidase (EC 3.2.1.74); isoprimeverose-producing oligoxyloglucan hydrolase (EC 3.2.1.120); coniferin beta-glucosidase (EC 3.2.1.126); exo-1,3-1,4-glucanase (EC 3.2.1.-); beta-N-acetylglucosaminide phosphorylases (EC 2.4.1.-) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY +GH5 GH5 endo-beta-1,4-glucanase / cellulase (EC 3.2.1.4); endo-beta-1,4-xylanase (EC 3.2.1.8); beta-glucosidase (EC 3.2.1.21); beta-mannosidase (EC 3.2.1.25); beta-glucosylceramidase (EC 3.2.1.45); glucan beta-1,3-glucosidase (EC 3.2.1.58); licheninase (EC 3.2.1.73); exo-beta-1,4-glucanase / cellodextrinase (EC 3.2.1.74); glucan endo-1,6-beta-glucosidase (EC 3.2.1.75); mannan endo-beta-1,4-mannosidase (EC 3.2.1.78); cellulose beta-1,4-cellobiosidase (EC 3.2.1.91); steryl beta-glucosidase (EC 3.2.1.104); endoglycoceramidase (EC 3.2.1.123); chitosanase (EC 3.2.1.132); beta-primeverosidase (EC 3.2.1.149); xyloglucan-specific endo-beta-1,4-glucanase (EC 3.2.1.151); endo-beta-1,6-galactanase (EC 3.2.1.164); hesperidin 6-O-alpha-L-rhamnosyl-beta-glucosidase (EC 3.2.1.168); beta-1,3-mannanase (EC 3.2.1.-); arabinoxylan-specific endo-beta-1,4-xylanase (EC 3.2.1.-); mannan transglycosylase (EC 2.4.1.-); lichenase / endo-beta-1,3-1,4-glucanase (EC 3.2.1.73); beta-glycosidase (EC 3.2.1.-); endo-beta-1,3-glucanase / laminarinase (EC 3.2.1.39); beta-N-acetylhexosaminidase (EC 3.2.1.52); chitosanase (EC 3.2.1.132); beta-D-galactofuranosidase (EC 3.2.1.146); Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY +GH9 GH9 endoglucanase (EC 3.2.1.4); endo-beta-1,3(4)-glucanase / lichenase-laminarinase (EC 3.2.1.6); beta-glucosidase (EC 3.2.1.21); lichenase / endo-beta-1,3-1,4-glucanase (EC 3.2.1.73); exo-beta-1,4-glucanase / cellodextrinase (EC 3.2.1.74); cellobiohydrolase (EC 3.2.1.91); xyloglucan-specific endo-beta-1,4-glucanase / endo-xyloglucanase (EC 3.2.1.151); exo-beta-glucosaminidase (EC 3.2.1.165) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY +GH16 GH16 xyloglucan:xyloglucosyltransferase (EC 2.4.1.207); keratan-sulfate endo-1,4-beta-galactosidase (EC 3.2.1.103); endo-1,3-beta-glucanase / laminarinase (EC 3.2.1.39); endo-1,3(4)-beta-glucanase (EC 3.2.1.6); licheninase (EC 3.2.1.73); beta-agarase (EC 3.2.1.81); kappa;-carrageenase (EC 3.2.1.83); xyloglucanase (EC 3.2.1.151); endo-beta-1,3-galactanase (EC 3.2.1.181); [retaining] beta-porphyranase (EC 3.2.1.178); hyaluronidase (EC 3.2.1.35); endo-beta-1,4-galactosidase (EC 3.2.1.-); chitin beta-1,6-glucanosyltransferase (EC 2.4.1.-); beta-transglycosidase (EC 2.4.1.-); beta-glycosidase (EC 3.2.1.-); endo-beta-1,3-galactanase (EC 3.2.1.181) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY +GH116 GH116 beta-glucosidase (EC 3.2.1.21); beta-xylosidase (EC 3.2.1.37); acid beta-glucosidase/beta-glucosylceramidase (EC 3.2.1.45); beta-N-acetylglucosaminidase (EC 3.2.1.52) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY +GH6 GH6 endoglucanase (EC 3.2.1.4); cellobiohydrolase (EC 3.2.1.91) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY +GH7 GH7 endo-beta-1,4-glucanase (EC 3.2.1.4); reducing end-acting cellobiohydrolase (EC 3.2.1.176); chitosanase (EC 3.2.1.132); endo-beta-1,3-1,4-glucanase (EC 3.2.1.73) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY +GH8 GH8 chitosanase (EC 3.2.1.132); cellulase (EC 3.2.1.4); licheninase (EC 3.2.1.73); endo-1,4-beta-xylanase (EC 3.2.1.8); reducing-end-xylose releasing exo-oligoxylanase (EC 3.2.1.156) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY +GH10 GH10 endo-1,4-beta-xylanase (EC 3.2.1.8); endo-1,3-beta-xylanase (EC 3.2.1.32); tomatinase (EC 3.2.1.-); xylan endotransglycosylase (EC 2.4.2.-); endo-beta-1,4-glucanase (EC 3.2.1.4) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY +GH124 GH124 endoglucanase (EC 3.2.1.4) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY +GH12 GH12 endoglucanase (EC 3.2.1.4); xyloglucan hydrolase (EC 3.2.1.151); beta-1,3-1,4-glucanase (EC 3.2.1.73); xyloglucan endotransglycosylase (EC 2.4.1.207) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY +GH44 GH44 endoglucanase (EC 3.2.1.4); xyloglucanase (EC 3.2.1.151) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY +GH45 GH45 endoglucanase (EC 3.2.1.4); xyloglucan-specific endo-beta-1,4-glucanase / endo-xyloglucanase (EC 3.2.1.151); endo-beta-1,4-mannanase (EC 3.2.1.78) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY +GH48 GH48 reducing end-acting cellobiohydrolase (EC 3.2.1.176); endo-beta-1,4-glucanase (EC 3.2.1.4); chitinase (EC 3.2.1.14) Glycoside Hydrolases ag Carbon Processing Cellulose degradation CAZY +AA10 AA10 (formerly CBM33) proteins are copper-dependent lytic polysaccharide monooxygenases (LPMOs); some proteins have been shown to act on chitin, others on cellulose; lytic cellulose monooxygenase (C1-hydroxylating) (EC 1.14.99.54); lytic cellulose monooxygenase (C4-dehydrogenating)(EC 1.14.99.56); lytic chitin monooxygenase (EC 1.14.99.53) Auxiliary Activities ag Carbon Processing Cellulose degradation CAZY +AA15 AA15 lytic cellulose monooxygenase (C1-hydroxylating) (EC 1.14.99.54); lytic chitin monooxygenase (EC 1.14.99.53) Auxiliary Activities ag Carbon Processing Cellulose degradation CAZY +AA16 AA16 Lytic cellulose monooxygenase (C1-hydroxylating) (EC 1.14.99.54) Auxiliary Activities ag Carbon Processing Cellulose degradation CAZY +AA9 AA9 (formerly GH61) proteins are copper-dependent lytic polysaccharide monooxygenases (LPMOs); cleavage of cellulose chains with oxidation of carbons C1 and/or C4 and C-6); lytic cellulose monooxygenase (C1-hydroxylating) (EC 1.14.99.54); lytic cellulose monooxygenase (C4-dehydrogenating) (EC 1.14.99.56) Auxiliary Activities ag Carbon Processing Cellulose degradation CAZY +AA11 AA11 proteins are copper-dependent lytic polysaccharide monooxygenases (LPMOs); cleavage of chitin chains with oxidation of C-1 has been demonstrated for a AA11 LPMO from Aspergillus oryzae; Auxiliary Activities ag Carbon Processing Cellulose degradation CAZY +AA13 AA13 proteins are copper-dependent lytic polysaccharide monooxygenases (LPMOs); cleavage of starch with oxidation of C-1 at the site of cleavage has been demonstrated for the LPMO encoded by gene NCU08746 from Neurospora crassa; Auxiliary Activities ag Carbon Processing Cellulose degradation CAZY +AA13 AA13 proteins are copper-dependent lytic polysaccharide monooxygenases (LPMOs); cleavage of starch with oxidation of C-1 at the site of cleavage has been demonstrated for the LPMO encoded by gene NCU08746 from Neurospora crassa; Auxiliary Activities ag Carbon Processing Starch degradation CAZY +GH13 GH13 alpha-amylase (EC 3.2.1.1); pullulanase (EC 3.2.1.41); cyclomaltodextrin glucanotransferase (EC 2.4.1.19); cyclomaltodextrinase (EC 3.2.1.54); trehalose-6-phosphate hydrolase (EC 3.2.1.93); oligo-alpha-glucosidase (EC 3.2.1.10); maltogenic amylase (EC 3.2.1.133); neopullulanase (EC 3.2.1.135); alpha-glucosidase (EC 3.2.1.20); maltotetraose-forming alpha-amylase (EC 3.2.1.60); isoamylase (EC 3.2.1.68); glucodextranase (EC 3.2.1.70); maltohexaose-forming alpha-amylase (EC 3.2.1.98); maltotriose-forming alpha-amylase (EC 3.2.1.116); branching enzyme (EC 2.4.1.18); trehalose synthase (EC 5.4.99.16); 4-alpha-glucanotransferase (EC 2.4.1.25); maltopentaose-forming alpha-amylase (EC 3.2.1.-) ; amylosucrase (EC 2.4.1.4) ; sucrose phosphorylase (EC 2.4.1.7); malto-oligosyltrehalose trehalohydrolase (EC 3.2.1.141); isomaltulose synthase (EC 5.4.99.11); malto-oligosyltrehalose synthase (EC 5.4.99.15); amylo-alpha-1,6-glucosidase (EC 3.2.1.33); alpha-1,4-glucan: phosphate alpha-maltosyltransferase (EC 2.4.99.16); 6'-P-sucrose phosphorylase (EC 2.4.1.-); amino acid transporter Glycoside Hydrolases ag Carbon Processing Starch degradation CAZY +GH14 GH14 beta-amylase (EC 3.2.1.2) Glycoside Hydrolases ag Carbon Processing Starch degradation CAZY +GH57 GH57 alpha-amylase (EC 3.2.1.1); alpha-galactosidase (EC 3.2.1.22); amylopullulanase (EC 3.2.1.41); cyclomaltodextrinase (EC 3.2.1.54); branching enzyme (EC 2.4.1.18); 4-alpha-glucanotransferase (EC 2.4.1.25) Glycoside Hydrolases ag Carbon Processing Starch degradation CAZY +GH119 GH119 alpha-amylase (EC 3.2.1.1) Glycoside Hydrolases ag Carbon Processing Starch degradation CAZY +GH126 GH126 alpha-amylase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Starch degradation CAZY +GH133 GH133 amylo-alpha-1,6-glucosidase (EC 3.2.1.33); Glycoside Hydrolases ag Carbon Processing Starch degradation CAZY +GH15 GH15 glucoamylase (EC 3.2.1.3); glucodextranase (EC 3.2.1.70); alpha,alpha-trehalase (EC 3.2.1.28); dextran dextrinase (EC 2.4.1.2) Glycoside Hydrolases ag Carbon Processing Starch degradation CAZY +GH97 GH97 glucoamylase (EC 3.2.1.3); alpha-glucosidase (EC 3.2.1.20); alpha-galactosidase (EC 3.2.1.22) Glycoside Hydrolases ag Carbon Processing Starch degradation CAZY +GH28 GH28 polygalacturonase (EC 3.2.1.15); alpha-L-rhamnosidase (EC 3.2.1.40); exo-polygalacturonase (EC 3.2.1.67); exo-polygalacturonosidase (EC 3.2.1.82); rhamnogalacturonase (EC 3.2.1.171); rhamnogalacturonan alpha-1,2-galacturonohydrolase (EC 3.2.1.173); endo-xylogalacturonan hydrolase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Pectin degradation CAZY +PL1 PL1 pectate lyase (EC 4.2.2.2); exo-pectate lyase (EC 4.2.2.9); pectin lyase (EC 4.2.2.10). Polysaccharide Lyases ag Carbon Processing Pectin degradation CAZY +PL2 PL2 pectate lyase (EC 4.2.2.2); exo-polygalacturonate lyase (EC 4.2.2.9). Polysaccharide Lyases ag Carbon Processing Pectin degradation CAZY +PL9 PL9 pectate lyase (EC 4.2.2.2); exopolygalacturonate lyase (EC 4.2.2.9); thiopeptidoglycan lyase (EC 4.2.2.-). Polysaccharide Lyases ag Carbon Processing Pectin degradation CAZY +PL10 PL10 pectate lyase (EC 4.2.2.2) Polysaccharide Lyases ag Carbon Processing Pectin degradation CAZY +PL11 PL11 rhamnogalacturonan endolyase (EC 4.2.2.23); rhamnogalacturonan exolyase (EC 4.2.2.24) Polysaccharide Lyases ag Carbon Processing Pectin degradation CAZY +PL22 PL22 oligogalacturonate lyase / oligogalacturonide lyase (EC 4.2.2.6) Polysaccharide Lyases ag Carbon Processing Pectin degradation CAZY +PL26 PL26 rhamnogalacturonan exolyase (EC 4.2.2.24). Polysaccharide Lyases ag Carbon Processing Pectin degradation CAZY +PL3 PL3 pectate lyase (EC 4.2.2.2). Polysaccharide Lyases ag Carbon Processing Pectin degradation CAZY +PL4 PL4 rhamnogalacturonan endolyase (EC 4.2.2.23). Polysaccharide Lyases ag Carbon Processing Pectin degradation CAZY +GH78 GH78 alpha-L-rhamnosidase (EC 3.2.1.40); rhamnogalacturonan alpha-L-rhamnohydrolase (EC 3.2.1.174); L-Rhap-alpha-1,3-D-Apif -specific alpha-1,3-L-rhamnosidase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Pectin degradation CAZY +GH106 GH106 alpha-L-rhamnosidase (EC 3.2.1.40); rhamnogalacturonan alpha-L-rhamnohydrolase (EC 3.2.1.174) Glycoside Hydrolases ag Carbon Processing Pectin degradation CAZY +GH138 GH138 alpha-galacturonidase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Pectin degradation CAZY +GH139 GH139 alpha-2-O-Me-L-fucosidase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Pectin degradation CAZY +GH143 GH143 2-keto-3-deoxy-D-lyxo-heptulosaric acid hydrolase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Pectin degradation CAZY +CE8 CE8 pectin methylesterase (EC 3.1.1.11). Carbohydrate Esterases ag Carbon Processing Pectin degradation CAZY +GH105 GH105 unsaturated rhamnogalacturonyl hydrolase (EC 3.2.1.172); d-4,5-unsaturated beta-glucuronyl hydrolase (EC 3.2.1.-); d-4,5-unsaturated alpha-galacturonidase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Pectin degradation CAZY +GH4 GH4 maltose-6-phosphate glucosidase (EC 3.2.1.122); alpha-glucosidase (EC 3.2.1.20); alpha-galactosidase (EC 3.2.1.22); 6-phospho-beta-glucosidase (EC 3.2.1.86); alpha-glucuronidase (EC 3.2.1.139); alpha-galacturonase (EC 3.2.1.67); palatinase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Pectin degradation CAZY +CE12 CE12 pectin acetylesterase (EC 3.1.1.-); rhamnogalacturonan acetylesterase (EC 3.1.1.-); acetyl xylan esterase (EC 3.1.1.72) Carbohydrate Esterases ag Carbon Processing Pectin degradation CAZY +GH2 GH2 beta-galactosidase (EC 3.2.1.23) ; beta-mannosidase (EC 3.2.1.25); beta-glucuronidase (EC 3.2.1.31); alpha-L-arabinofuranosidase (EC 3.2.1.55); mannosylglycoprotein endo-beta-mannosidase (EC 3.2.1.152); exo-beta-glucosaminidase (EC 3.2.1.165); alpha-L-arabinopyranosidase (EC 3.2.1.-); beta-galacturonidase (EC 3.2.1.-); beta-xylosidase (EC 3.2.1.37); beta-D-galactofuranosidase (EC 3.2.1.146); Glycoside Hydrolases ag Carbon Processing Pectin degradation CAZY +GH113 GH113 beta-mannanase (EC 3.2.1.78) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Beta-mannan Backbone Cleavage (Hemicellulose), Beta-mannan Oligo Cleavage (Hemicellulose) +GH134 GH134 endo-beta-1,4-mannanase (EC 3.2.1.78); Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Beta-mannan Backbone Cleavage (Hemicellulose) +GH26 GH26 beta-mannanase (EC 3.2.1.78); exo-beta-1,4-mannobiohydrolase (EC 3.2.1.100); beta-1,3-xylanase (EC 3.2.1.32); lichenase / endo-beta-1,3-1,4-glucanase (EC 3.2.1.73); mannobiose-producing exo-beta-mannanase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Xylan Backbone Cleavage (Hemicellulose), Beta-mannan Backbone Cleavage (Hemicellulose), Beta-mannan Oligo Cleavage (Hemicellulose) +GH130 GH130 beta-1,4-mannosylglucose phosphorylase (EC 2.4.1.281); beta-1,4-mannooligosaccharide phosphorylase (EC 2.4.1.319); beta-1,4-mannosyl-N-acetyl-glucosamine phosphorylase (EC 2.4.1.320); beta-1,2-mannobiose phosphorylase (EC 2.4.1.-); beta-1,2-oligomannan phosphorylase (EC 2.4.1.-); beta-1,2-mannosidase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Alpha-mannan Oligo Cleavage (Hemicellulose), Beta-mannan Oligo Cleavage (Hemicellulose) +CE2 CE2 acetyl xylan esterase (EC 3.1.1.72). Carbohydrate Esterases ag Carbon Processing Hemicellulose degradation Beta-mannan Oligo Cleavage (Hemicellulose) +CE17 acetyl mannan esterase [EC:3.1.1.-] Carbohydrate Esterases ag Carbon Processing Hemicellulose degradation Beta-mannan deacetylation support (Hemicellulose) +GH99 GH99 glycoprotein endo-alpha-1,2-mannosidase (EC 3.2.1.130); mannan endo-1,2-alpha-mannanase (3.2.1.-) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Alpha-mannan Backbone Cleavage (Hemicellulose) +GH76 GH76 alpha-1,6-mannanase (EC 3.2.1.101); alpha-glucosidase (EC 3.2.1.20) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Alpha-mannan Backbone Cleavage (Hemicellulose), Alpha-mannan Oligo Cleavage (Hemicellulose) +GH92 GH92 mannosyl-oligosaccharide alpha-1,2-mannosidase (EC 3.2.1.113); mannosyl-oligosaccharide alpha-1,3-mannosidase (EC 3.2.1.-); mannosyl-oligosaccharide alpha-1,6-mannosidase (EC 3.2.1.-); alpha-mannosidase (EC 3.2.1.24); alpha-1,2-mannosidase (EC 3.2.1.-); alpha-1,3-mannosidase (EC 3.2.1.-); alpha-1,4-mannosidase (EC 3.2.1.-); mannosyl-1-phosphodiester alpha-1,P-mannosidase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Alpha-mannan Oligo Cleavage (Hemicellulose) +GH38 GH38 alpha-mannosidase (EC 3.2.1.24); mannosyl-oligosaccharide alpha-1,2-mannosidase (EC 3.2.1.113); mannosyl-oligosaccharide alpha-1,3-1,6-mannosidase (EC 3.2.1.114); alpha-2-O-mannosylglycerate hydrolase (EC 3.2.1.170); mannosyl-oligosaccharide alpha-1,3-mannosidase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Alpha-mannan Oligo Cleavage (Hemicellulose) +GH63 GH63 processing alpha-glucosidase (EC 3.2.1.106); alpha-1,3-glucosidase (EC 3.2.1.84); alpha-glucosidase (EC 3.2.1.20); mannosylglycerate alpha-mannosidase / mannosylglycerate hydrolase (EC 3.2.1.170); glucosylglycerate hydrolase (EC 3.2.1.208) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Alpha-mannan Oligo Cleavage (Hemicellulose) +GH47 GH47 alpha-mannosidase (EC 3.2.1.113) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Alpha-mannan Oligo Cleavage (Hemicellulose) +GH125 GH125 exo-alpha-1,6-mannosidase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Alpha-mannan Oligo Cleavage (Hemicellulose) +GH5 GH5 endo-beta-1,4-glucanase / cellulase (EC 3.2.1.4); endo-beta-1,4-xylanase (EC 3.2.1.8); beta-glucosidase (EC 3.2.1.21); beta-mannosidase (EC 3.2.1.25); beta-glucosylceramidase (EC 3.2.1.45); glucan beta-1,3-glucosidase (EC 3.2.1.58); licheninase (EC 3.2.1.73); exo-beta-1,4-glucanase / cellodextrinase (EC 3.2.1.74); glucan endo-1,6-beta-glucosidase (EC 3.2.1.75); mannan endo-beta-1,4-mannosidase (EC 3.2.1.78); cellulose beta-1,4-cellobiosidase (EC 3.2.1.91); steryl beta-glucosidase (EC 3.2.1.104); endoglycoceramidase (EC 3.2.1.123); chitosanase (EC 3.2.1.132); beta-primeverosidase (EC 3.2.1.149); xyloglucan-specific endo-beta-1,4-glucanase (EC 3.2.1.151); endo-beta-1,6-galactanase (EC 3.2.1.164); hesperidin 6-O-alpha-L-rhamnosyl-beta-glucosidase (EC 3.2.1.168); beta-1,3-mannanase (EC 3.2.1.-); arabinoxylan-specific endo-beta-1,4-xylanase (EC 3.2.1.-); mannan transglycosylase (EC 2.4.1.-); lichenase / endo-beta-1,3-1,4-glucanase (EC 3.2.1.73); beta-glycosidase (EC 3.2.1.-); endo-beta-1,3-glucanase / laminarinase (EC 3.2.1.39); beta-N-acetylhexosaminidase (EC 3.2.1.52); chitosanase (EC 3.2.1.132); beta-D-galactofuranosidase (EC 3.2.1.146); Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Amorphous Cellulose Backbone Cleavage, Amorphous Cellulose Oligo Cleavage, Xyloglucan Backbone Cleavage (Hemicellulose), Xylan Backbone Cleavage (Hemicellulose), Beta-mannan Backbone Cleavage (Hemicellulose), Mixed-Linkage glucans Backbone Cleavage (Hemicellulose), Chitin Oligo Cleavage +GH9 GH9 endoglucanase (EC 3.2.1.4); endo-beta-1,3(4)-glucanase / lichenase-laminarinase (EC 3.2.1.6); beta-glucosidase (EC 3.2.1.21); lichenase / endo-beta-1,3-1,4-glucanase (EC 3.2.1.73); exo-beta-1,4-glucanase / cellodextrinase (EC 3.2.1.74); cellobiohydrolase (EC 3.2.1.91); xyloglucan-specific endo-beta-1,4-glucanase / endo-xyloglucanase (EC 3.2.1.151); exo-beta-glucosaminidase (EC 3.2.1.165) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Amorphous Cellulose Backbone Cleavage, Amorphous Cellulose Oligo Cleavage, Xyloglucan Backbone Cleavage (Hemicellulose), Mixed-Linkage glucans Backbone Cleavage (Hemicellulose) +GH12 GH12 endoglucanase (EC 3.2.1.4); xyloglucan hydrolase (EC 3.2.1.151); beta-1,3-1,4-glucanase (EC 3.2.1.73); xyloglucan endotransglycosylase (EC 2.4.1.207) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Amorphous Cellulose Backbone Cleavage, Xyloglucan Backbone Cleavage (Hemicellulose) +GH16 GH16 xyloglucan:xyloglucosyltransferase (EC 2.4.1.207); keratan-sulfate endo-1,4-beta-galactosidase (EC 3.2.1.103); endo-1,3-beta-glucanase / laminarinase (EC 3.2.1.39); endo-1,3(4)-beta-glucanase (EC 3.2.1.6); licheninase (EC 3.2.1.73); beta-agarase (EC 3.2.1.81); kappa;-carrageenase (EC 3.2.1.83); xyloglucanase (EC 3.2.1.151); endo-beta-1,3-galactanase (EC 3.2.1.181); [retaining] beta-porphyranase (EC 3.2.1.178); hyaluronidase (EC 3.2.1.35); endo-beta-1,4-galactosidase (EC 3.2.1.-); chitin beta-1,6-glucanosyltransferase (EC 2.4.1.-); beta-transglycosidase (EC 2.4.1.-); beta-glycosidase (EC 3.2.1.-); endo-beta-1,3-galactanase (EC 3.2.1.181) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Amorphous Cellulose Oligo Cleavage, Xyloglucan Backbone Cleavage (Hemicellulose), Mixed-Linkage glucans Backbone Cleavage (Hemicellulose), Mixed-Linkage glucans Oligo Cleavage (Hemicellulose), Sulf-Polysachharides Backbone Cleavage +GH44 GH44 endoglucanase (EC 3.2.1.4); xyloglucanase (EC 3.2.1.151) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Amorphous Cellulose Backbone Cleavage, Xyloglucan Backbone Cleavage (Hemicellulose) +GH45 GH45 endoglucanase (EC 3.2.1.4); xyloglucan-specific endo-beta-1,4-glucanase / endo-xyloglucanase (EC 3.2.1.151); endo-beta-1,4-mannanase (EC 3.2.1.78) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Amorphous Cellulose Backbone Cleavage, Xyloglucan Backbone Cleavage (Hemicellulose) +GH48 GH48 reducing end-acting cellobiohydrolase (EC 3.2.1.176); endo-beta-1,4-glucanase (EC 3.2.1.4); chitinase (EC 3.2.1.14) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Crystalline Cellulose Backbone Cleavage, Xyloglucan Backbone Cleavage (Hemicellulose) +GH74 GH74 endoglucanase (EC 3.2.1.4); oligoxyloglucan reducing end-specific cellobiohydrolase (EC 3.2.1.150); xyloglucanase (EC 3.2.1.151) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Xyloglucan Backbone Cleavage (Hemicellulose) +GH31 GH31 alpha-glucosidase (EC 3.2.1.20); alpha-galactosidase (EC 3.2.1.22); alpha-mannosidase (EC 3.2.1.24); alpha-1,3-glucosidase (EC 3.2.1.84); sucrase-isomaltase (EC 3.2.1.48) (EC 3.2.1.10); alpha-xylosidase (EC 3.2.1.177); alpha-glucan lyase (EC 4.2.2.13); isomaltosyltransferase (EC 2.4.1.-); oligosaccharide alpha-1,4-glucosyltransferase (EC 2.4.1.161); sulfoquinovosidase (EC 3.2.1.-) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Xyloglucan Oligo Cleavage (Hemicellulose), Xylan Oligo Cleavage (Hemicellulose), Alpha-galactans Oligo Cleavage, Alpha-galactans Oligo Cleavage, Mucin Oligo Cleavage +GH10 GH10 endo-1,4-beta-xylanase (EC 3.2.1.8); endo-1,3-beta-xylanase (EC 3.2.1.32); tomatinase (EC 3.2.1.-); xylan endotransglycosylase (EC 2.4.2.-); endo-beta-1,4-glucanase (EC 3.2.1.4) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Amorphous Cellulose Backbone Cleavage, Xyloglucan Oligo Cleavage (Hemicellulose), Xylan Backbone Cleavage (Hemicellulose) +GH2 GH2 beta-galactosidase (EC 3.2.1.23) ; beta-mannosidase (EC 3.2.1.25); beta-glucuronidase (EC 3.2.1.31); alpha-L-arabinofuranosidase (EC 3.2.1.55); mannosylglycoprotein endo-beta-mannosidase (EC 3.2.1.152); exo-beta-glucosaminidase (EC 3.2.1.165); alpha-L-arabinopyranosidase (EC 3.2.1.-); beta-galacturonidase (EC 3.2.1.-); beta-xylosidase (EC 3.2.1.37); beta-D-galactofuranosidase (EC 3.2.1.146); Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Amorphous Cellulose Oligo Cleavage, Xyloglucan Oligo Cleavage (Hemicellulose), Beta-mannan Oligo Cleavage (Hemicellulose), Pectin Oligo Cleavage, Beta-galactan (pectic galactan) Oligo Cleavage, Arabinose Oligo cleavage +GH11 GH11 endo-beta-1,4-xylanase (EC 3.2.1.8); endo-beta-1,3-xylanase (EC 3.2.1.32) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Xylan Backbone Cleavage (Hemicellulose) +GH43 GH43 beta-xylosidase (EC 3.2.1.37); alpha-L-arabinofuranosidase (EC 3.2.1.55); xylanase (EC 3.2.1.8); alpha-1,2-L-arabinofuranosidase (EC 3.2.1.-); exo-alpha-1,5-L-arabinofuranosidase (EC 3.2.1.-); [inverting] exo-alpha-1,5-L-arabinanase (EC 3.2.1.-); beta-1,3-xylosidase (EC 3.2.1.-); [inverting] exo-alpha-1,5-L-arabinanase (EC 3.2.1.-); [inverting] endo-alpha-1,5-L-arabinanase (EC 3.2.1.99); exo-beta-1,3-galactanase (EC 3.2.1.145); beta-D-galactofuranosidase (EC 3.2.1.146) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Xyloglucan Oligo Cleavage (Hemicellulose), Arabinan Backbone Cleavage, Arabinan Oligo Cleavage +GH51 GH51 endoglucanase (EC 3.2.1.4); endo-beta-1,4-xylanase (EC 3.2.1.8); beta-xylosidase (EC 3.2.1.37); alpha-L-arabinofuranosidase (EC 3.2.1.55); lichenase / endo-beta-1,3-1,4-glucanase (EC 3.2.1.73) Glycoside Hydrolases ag Carbon Processing Hemicellulose degradation Arabinan Oligo Cleavage +CE1 CE1 acetyl xylan esterase (EC 3.1.1.72); cinnamoyl esterase (EC 3.1.1.-); feruloyl esterase (EC 3.1.1.73); carboxylesterase (EC 3.1.1.1); S-formylglutathione hydrolase (EC 3.1.2.12); diacylglycerol O-acyltransferase (EC 2.3.1.20); trehalose 6-O-mycolyltransferase (EC 2.3.1.122) Carbohydrate Esterases ag Carbon Processing Hemicellulose degradation Xylan deacetylation support +CE4 CE4 acetyl xylan esterase (EC 3.1.1.72); chitin deacetylase (EC 3.5.1.41); chitooligosaccharide deacetylase (EC 3.5.1.-); peptidoglycan GlcNAc deacetylase (EC 3.5.1.-); peptidoglycan N-acetylmuramic acid deacetylase (EC 3.5.1.-). Carbohydrate Esterases ag Carbon Processing Hemicellulose degradation Chitin Oligo Cleavage +AA9 AA9 (formerly GH61) proteins are copper-dependent lytic polysaccharide monooxygenases (LPMOs); cleavage of cellulose chains with oxidation of carbons C1 and/or C4 and C-6); lytic cellulose monooxygenase (C1-hydroxylating) (EC 1.14.99.54); lytic cellulose monooxygenase (C4-dehydrogenating) (EC 1.14.99.56) Auxiliary Activities ag Carbon Processing Hemicellulose degradation Crystalline Cellulose Backbone Cleavage, Xyloglucan Backbone Cleavage (Hemicellulose) +AA1 laccase / multicopper oxidase [EC:1.10.3.2] Lignin degradation (oxidative depolymerization) ag Carbon Processing Lignin degradation Oxidative polymer attack +mco multicopper oxidase (bacterial laccase) [EC:1.10.3.2] Lignin degradation (oxidative depolymerization) ag Carbon Processing Lignin degradation Oxidative polymer attack +AA2 class II peroxidase (lignin/manganese/versatile peroxidases) [EC:1.11.1.-] Lignin degradation (oxidative depolymerization) ag Carbon Processing Lignin degradation Oxidative polymer attack +dyp DyP-type peroxidase (dye-decolorizing peroxidase) [EC:1.11.1.-] Lignin degradation (oxidative depolymerization) ag Carbon Processing Lignin degradation Oxidative polymer attack +AA3_2 aryl-alcohol oxidase (GMC oxidoreductase) [EC:1.1.3.7] Lignin degradation (oxidative depolymerization) ag Carbon Processing Lignin degradation Redox support +AA5_1 glyoxal oxidase [EC:1.2.3.15] Lignin degradation (oxidative depolymerization) ag Carbon Processing Lignin degradation Redox support +AA8 cellobiose dehydrogenase, cytochrome domain [EC:1.1.99.-] Lignin degradation (oxidative depolymerization) ag Carbon Processing Lignin degradation Redox support +AA3_1 cellobiose dehydrogenase, dehydrogenase domain [EC:1.1.99.-] Lignin degradation (oxidative depolymerization) ag Carbon Processing Lignin degradation Redox support +K18851 glucose-6-phosphate isomerase [EC:5.3.1.9] Glycolysis / gluconeogenesis ag Carbon Processing Sugar utilization Glucose +K00844 hexokinase [EC:2.7.1.1] Glycolysis (hexokinase reaction) ag Carbon Processing Sugar utilization Glucose +K12407 glucokinase [EC:2.7.1.2] Glycolysis (glucokinase reaction) ag Carbon Processing Sugar utilization Glucose +K00845 glucose-6-phosphate dehydrogenase [EC:1.1.1.49] Pentose phosphate pathway (glucose-6-phosphate dehydrogenase) ag Carbon Processing Sugar utilization Glucose +K25026 phosphoglucose isomerase [EC:5.3.1.9] Glycolysis / pentose phosphate interconversion ag Carbon Processing Sugar utilization Glucose +K01182 sucrase-isomaltase [EC:3.2.1.48] Sucrose and starch metabolism (sucrase–isomaltase complex) ag Carbon Processing Sugar utilization Sucrose +K01203 β-fructofuranosidase [EC:3.2.1.26] Fructose and mannose metabolism (β-fructofuranosidase) ag Carbon Processing Sugar utilization Sucrose +K12047 sucrose phosphorylase [EC:2.4.1.7] Sucrose metabolism (sucrose phosphorylase) ag Carbon Processing Sugar utilization Sucrose +K01187 sucrase [EC:3.2.1.48] Sucrose metabolism (sucrase) ag Carbon Processing Sugar utilization Sucrose +K12316 glucosyltransferase [EC:2.4.1.4] Sucrose and starch metabolism (α-glucosyltransferase) ag Carbon Processing Sugar utilization Sucrose +K12317 sucrose-6F-phosphate phosphohydrolase [EC:3.1.3.24] Sucrose-6F-phosphate metabolism (phosphohydrolase) ag Carbon Processing Sugar utilization Sucrose +K00695 α-glucosidase [EC:3.2.1.20] Carbohydrate metabolism (α-glucosidase) ag Carbon Processing Sugar utilization Sucrose +K00690 maltase-glucoamylase [EC:3.2.1.20] Starch and sucrose metabolism (maltase–glucoamylase) ag Carbon Processing Sugar utilization Sucrose +K05341 glucanotransferase [EC:2.4.1.25] Glycosyltransferase (oligosaccharide interconversion) ag Carbon Processing Sugar utilization Sucrose +K00689 oligo-1,6-glucosidase [EC:3.2.1.10] Carbohydrate metabolism (oligo-1,6-glucosidase) ag Carbon Processing Sugar utilization Sucrose +K00692 isomaltase [EC:3.2.1.10] Starch and sucrose metabolism (isomaltase) ag Carbon Processing Sugar utilization Sucrose +K01809 mannose-6-phosphate isomerase [EC:5.3.1.8] Mannose metabolism (mannose-6-phosphate isomerase) ag Carbon Processing Sugar utilization Mannose +K02793 mannose PTS system IIA component [EC:2.7.1.191] PTS system, mannose-specific II component ag Carbon Processing Sugar utilization Mannose +K02794 mannose PTS system IIB component [EC:2.7.1.191] PTS system, mannose-specific II component ag Carbon Processing Sugar utilization Mannose +K02795 mannose PTS system IIC component [EC:2.7.1.191] PTS system, mannose-specific II component ag Carbon Processing Sugar utilization Mannose +K00849 galactokinase [EC:2.7.1.6] Galactose metabolism (galactokinase; Leloir pathway) ag Carbon Processing Sugar utilization Galactose +K00965 galactose-1-phosphate uridylyltransferase [EC:2.7.7.12] Galactose metabolism (galactose-1-phosphate uridylyltransferase; Leloir pathway) ag Carbon Processing Sugar utilization Galactose +K01784 UDP-galactose 4-epimerase [EC:5.1.3.2] Galactose metabolism (UDP-galactose 4-epimerase; Leloir pathway) ag Carbon Processing Sugar utilization Galactose +K01785 galactose mutarotase [EC:5.1.3.3] Galactose metabolism (galactose mutarotase; Leloir pathway) ag Carbon Processing Sugar utilization Galactose +K00879 L-fucokinase [EC:2.7.1.52] Fucose metabolism (L-fucokinase) ag Carbon Processing Sugar utilization Fucose +K01628 L-fuculose-phosphate aldolase [EC:4.1.2.17] Fucose metabolism (L-fuculose-phosphate aldolase) ag Carbon Processing Sugar utilization Fucose +K01818 L-fucose isomerase [EC:5.3.1.25] Fucose metabolism (L-fucose isomerase) ag Carbon Processing Sugar utilization Fucose +K00854 xylose kinase [EC:2.7.1.17] Xylose metabolism (xylose kinase) ag Carbon Processing Sugar utilization Xylose +K01805 xylose isomerase [EC:5.3.1.5] Xylose metabolism (xylose isomerase) ag Carbon Processing Sugar utilization Xylose +K00008 xylitol dehydrogenase [EC:1.1.1.9] Xylose metabolism (xylitol dehydrogenase) ag Carbon Processing Sugar utilization Xylose +K00011 L-arabitol dehydrogenase [EC:1.1.1.12] Xylose / arabinose metabolism (arabitol dehydrogenase) ag Carbon Processing Sugar utilization Xylose +K05351 xylulokinase [EC:2.7.1.17] Xylose metabolism (xylulokinase) ag Carbon Processing Sugar utilization Xylose +K17743 xylitol oxidase [EC:1.1.3.41] Xylose metabolism (xylitol oxidase) ag Carbon Processing Sugar utilization Xylose +K14273 xylulose reductase [EC:1.1.1.9] Xylose metabolism (xylulose reductase) ag Carbon Processing Sugar utilization Xylose +K14274 D-xylonate dehydratase [EC:4.2.1.82] Xylose metabolism (xylonate dehydratase) ag Carbon Processing Sugar utilization Xylose +K14275 xylonolactonase [EC:3.1.1.68] Xylose metabolism (xylonolactonase) ag Carbon Processing Sugar utilization Xylose +K01804 L-arabinose isomerase [EC:5.3.1.4] Arabinose metabolism (L-arabinose isomerase) ag Carbon Processing Sugar utilization Arabinose +K00011 L-arabitol dehydrogenase [EC:1.1.1.12] Xylose / arabinose metabolism (arabitol dehydrogenase) ag Carbon Processing Sugar utilization Arabinose +K26066 arabinose 1-dehydrogenase [EC:1.1.1.46] Arabinose metabolism (arabinose 1-dehydrogenase) ag Carbon Processing Sugar utilization Arabinose +K13873 arabinolactonase [EC:3.1.1.110] Arabinose metabolism (arabinolactonase) ag Carbon Processing Sugar utilization Arabinose +K19660 arabinonate dehydratase [EC:4.2.1.37] Arabinose metabolism (arabinonate dehydratase) ag Carbon Processing Sugar utilization Arabinose +K12446 L-arabonate dehydratase [EC:4.2.1.37] Arabinose metabolism (L-arabonate dehydratase) ag Carbon Processing Sugar utilization Arabinose +K19243 glucose-6-phosphate 1-dehydrogenase [EC:1.1.1.49 1.1.1.363 1.1.1.388] [RN:R02736 R10907] ag Carbon Processing Sugar utilization Glucose +K01807 ribose 5-phosphate isomerase [EC:5.3.1.6] [RN:R01056] ag Carbon Processing Sugar utilization Ribose +K01808 ribose 5-phosphate isomerase [EC:5.3.1.6] [RN:R01056] ag Carbon Processing Sugar utilization Ribose +K01810 glucose-6-phosphate isomerase [EC:5.3.1.9] [RN:R02740 R02739] ag Carbon Processing Sugar utilization Glucose +K06859 glucose-6-phosphate isomerase [EC:5.3.1.9] [RN:R02740 R02739] ag Carbon Processing Sugar utilization Glucose +K13810 glucose-6-phosphate isomerase [EC:5.3.1.9] [RN:R02740 R02739] ag Carbon Processing Sugar utilization Glucose +K15916 glucose-6-phosphate isomerase [EC:5.3.1.9] [RN:R02740 R02739] ag Carbon Processing Sugar utilization Glucose +K00948 ribose-phosphate pyrophosphokinase [EC:2.7.6.1] [RN:R01049] ag Carbon Processing Sugar utilization Ribose +K13937 hexose-6-phosphate dehydrogenase [EC:1.1.1.47 3.1.1.31] [RN:R02736 R02035] ag Carbon Processing Sugar utilization Glucose +K01057 6-phosphogluconolactonase [EC:3.1.1.31] [RN:R02035] ag Carbon Processing Sugar utilization Glucose +K07404 6-phosphogluconolactonase [EC:3.1.1.31] [RN:R02035] ag Carbon Processing Sugar utilization Glucose +K00033 6-phosphogluconate dehydrogenase [EC:1.1.1.44 1.1.1.343] [RN:R01528 R10221] ag Carbon Processing Sugar utilization Glucose +K00615 transketolase [EC:2.2.1.1] [RN:R01830 R01641] ag Carbon Processing Sugar utilization Ribose +K00616 transaldolase [EC:2.2.1.2] [RN:R01827] ag Carbon Processing Sugar utilization Ribose +K01783 ribulose-phosphate 3-epimerase [EC:5.1.3.1] [RN:R01529] ag Carbon Processing Sugar utilization Ribose +K08094 6-phospho-3-hexuloisomerase [EC:5.3.1.27] [RN:R09780] ag Carbon Processing Sugar utilization Ribose +K08093 3-hexulose-6-phosphate synthase [EC:4.1.2.43] [RN:R05338] ag Carbon Processing Sugar utilization Ribose +K13812 3-hexulose-6-phosphate synthase [EC:4.1.2.43] [RN:R05338] ag Carbon Processing Sugar utilization Ribose +K13831 6-phospho-3-hexuloisomerase [EC:5.3.1.27] [RN:R09780] ag Carbon Processing Sugar utilization Ribose +K00844 hexokinase [EC:2.7.1.1] [RN:R01786] ag Carbon Processing Sugar utilization Glucose +K01835 phosphoglucomutase [EC:5.4.2.2] [RN:R00959] ag Carbon Processing Sugar utilization Glucose +K00963 UTP--glucose-1-phosphate uridylyltransferase [EC:2.7.7.9] [RN:R00289] ag Carbon Processing Sugar utilization Glucose +K00849 galactokinase [EC:2.7.1.6] [RN:R01092] ag Carbon Processing Sugar utilization Galactose +K00918 ADP-dependent phosphofructokinase [EC:2.7.1.146] [RN:R09084] ag Carbon Processing Sugar utilization Glucose +K00850 6-phosphofructokinase [EC:2.7.1.11] [RN:R04779] ag Carbon Processing Sugar utilization Glucose +K16370 6-phosphofructokinase [EC:2.7.1.11] [RN:R04779] ag Carbon Processing Sugar utilization Glucose +K01623 fructose-bisphosphate aldolase [EC:4.1.2.13] [RN:R01070] ag Carbon Processing Sugar utilization Fructose +K01624 fructose-bisphosphate aldolase [EC:4.1.2.13] [RN:R01070] ag Carbon Processing Sugar utilization Fructose +K11645 fructose-bisphosphate aldolase [EC:4.1.2.13] [RN:R01070] ag Carbon Processing Sugar utilization Fructose +K16305 fructose-bisphosphate aldolase [EC:4.1.2.13] [RN:R01070] ag Carbon Processing Sugar utilization Fructose +K16306 fructose-bisphosphate aldolase [EC:4.1.2.13] [RN:R01070] ag Carbon Processing Sugar utilization Fructose +K01803 triosephosphate isomerase [EC:5.3.1.1] [RN:R01015] ag Carbon Processing Sugar utilization Glucose +K00134 glyceraldehyde 3-phosphate dehydrogenase [EC:1.2.1.12 1.2.1.59] [RN:R01061 R01063] ag Carbon Processing Sugar utilization Glucose +K00150 glyceraldehyde 3-phosphate dehydrogenase [EC:1.2.1.12 1.2.1.59] [RN:R01061 R01063] ag Carbon Processing Sugar utilization Glucose +K00927 phosphoglycerate kinase [EC:2.7.2.3] [RN:R01512] ag Carbon Processing Sugar utilization Glucose +K11389 glyceraldehyde-3-phosphate dehydrogenase (ferredoxin) [EC:1.2.7.6] [RN:R07159] ag Carbon Processing Sugar utilization Glucose +K01834 phosphoglycerate mutase [EC:5.4.2.11 5.4.2.12] [RN:R01518] ag Carbon Processing Sugar utilization Glucose +K15633 phosphoglycerate mutase [EC:5.4.2.11 5.4.2.12] [RN:R01518] ag Carbon Processing Sugar utilization Glucose +K15634 phosphoglycerate mutase [EC:5.4.2.11 5.4.2.12] [RN:R01518] ag Carbon Processing Sugar utilization Glucose +K15635 phosphoglycerate mutase [EC:5.4.2.11 5.4.2.12] [RN:R01518] ag Carbon Processing Sugar utilization Glucose +K01689 enolase [EC:4.2.1.11] [RN:R00658] ag Carbon Processing Sugar utilization Glucose +K00873 pyruvate kinase [EC:2.7.1.40] [RN:R00200] ag Carbon Processing Sugar utilization Glucose +K12406 pyruvate kinase [EC:2.7.1.40] [RN:R00200] ag Carbon Processing Sugar utilization Glucose +K01596 phosphoenolpyruvate carboxykinase [EC:4.1.1.32 4.1.1.49] [RN:R00431 R00726 R00341] ag Carbon Processing Sugar utilization Fructose +K01610 phosphoenolpyruvate carboxykinase [EC:4.1.1.32 4.1.1.49] [RN:R00431 R00726 R00341] ag Carbon Processing Sugar utilization Fructose +K03841 fructose-1,6-bisphosphatase [EC:3.1.3.11] [RN:R04780] ag Carbon Processing Sugar utilization Fructose +K02446 fructose-1,6-bisphosphatase [EC:3.1.3.11] [RN:R04780] ag Carbon Processing Sugar utilization Fructose +K11532 fructose-1,6-bisphosphatase [EC:3.1.3.11] [RN:R04780] ag Carbon Processing Sugar utilization Fructose +K01086 fructose-1,6-bisphosphatase [EC:3.1.3.11] [RN:R04780] ag Carbon Processing Sugar utilization Fructose +K04041 fructose-1,6-bisphosphatase [EC:3.1.3.11] [RN:R04780] ag Carbon Processing Sugar utilization Fructose +K01622 fructose 1,6-bisphosphate aldolase/phosphatase [EC:4.1.2.13 3.1.3.11] [RN:R01070 R04780] ag Carbon Processing Sugar utilization Fructose +K01690 phosphogluconate dehydratase [EC:4.2.1.12] [RN:R02036] ag Carbon Processing Sugar utilization Glucose +K01625 2-dehydro-3-deoxyphosphogluconate aldolase [EC:4.1.2.14] [RN:R05605] ag Carbon Processing Sugar utilization Glucose +K01785 aldose 1-epimerase [EC:5.1.3.3] [RN:R10619] ag Carbon Processing Sugar utilization Glucose +K00012 UDPglucose 6-dehydrogenase [EC:1.1.1.22] [RN:R00286] ag Carbon Processing Sugar utilization Glucose +AA3 AA3 cellobiose dehydrogenase (EC 1.1.99.18); glucose 1-oxidase (EC 1.1.3.4); aryl alcohol oxidase (EC 1.1.3.7); alcohol oxidase (EC 1.1.3.13); pyranose oxidase (EC 1.1.3.10) ag Carbon Processing Sugar utilization Glucose +AA5 AA5 Oxidase with oxygen as acceptor (EC 1.1.3.-); galactose oxidase (EC 1.1.3.9); glyoxal oxidase (EC 1.2.3.15); alcohol oxidase (EC 1.1.3.13) ag Carbon Processing Sugar utilization Galactose +CBM13 CBM13 Modules of approx. 150 residues which always appear as a threefold internal repeat. The only apparent exception to this, xylanase II of Actinomadura sp. FC7 (GenBank U08894), is in fact not completely sequenced. These modules were first identified in several plant lectins such as ricin or agglutinin of Ricinus communis which bind galactose residues. The three-dimensional structure of a plant lectin has been determined and displays a pseudo-threefold symmetry in accord with the observed sequence threefold repeat. These modules have since been found in a number of other proteins of various functions including glycoside hydrolases and glycosyltransferases. While in the plant lectins this module binds mannose, binding to xylan has been demonstrated in the Streptomyces lividans xylanase A and arabinofuranosidase B. Binding to GalNAc has been shown for the corresponding module of GalNAc transferase 4. For the other proteins, the binding specificity of these modules has not been established. The pseudo three-fold symmetry of the CBM13 module has now been confirmed in the 3-D structure of the intact, two-domain, xylanase of Streptomyces olivaceoviridis. ag Carbon Processing Sugar utilization Xylanase +CBM31 CBM31 Binding to beta-1,3-xylan has been demonstrated for the C-terminal module of the beta-1,3-xylanase of Alcaligenes sp. XY234. ag Carbon Processing Sugar utilization Xylanase +CBM32 CBM32 Binding to galactose and lactose has been demonstrated for the module of Micromonospora viridifaciens sialidase (PMID: 16239725). Binding to polygalacturonic acid has been shown for a Yersinia member (PMID: 17292916). Binding to LacNAc (beta-D-galactosyl-1,4-beta-D-N-acetylglucosamine) has been shown for an N-acetylglucosaminidase from Clostridium perfingens (PMID: 16990278). ag Carbon Processing Sugar utilization Galacturonic Acid +CBM36 CBM36 Modules of approx. 120-130 residues displaying structural similarities to CBM6 modules. The only CBM36 currently characterised, that from Paenbacillus polymyxa xylanase 43A, shows calcium-dependent binding of xylans and xylooligosaccharides. X-ray crystallography shows that there is a direct interaction between calcium and ligand. ag Carbon Processing Sugar utilization Xylanase +CBM51 CBM51 Modules of approx. 150 residues found attached to various enzymes from families GH2, GH27, GH31, GH95, GH98 and GH101 . Binding to galactose and to blood group A/B-antigens demonstrated in the case of C. perfringens GH95CBM51 and GH98CBM51 respectively [Gregg KJ et al. (2008) J. Biol. Chem. 283:12604-13 PMID: 18292090]. ag Carbon Processing Sugar utilization Galactose +CBM59 CBM59 Binding to mannan, xylan, and cellulose demonstrated for the CBM59 of ManF-X10 xylanase from an environmental genomic DNA library (Li et al. (2009) World Journal of Microbiology and Biotechnology 25:2071-2078; doi:10.1007/s11274-009-0111-6) ag Carbon Processing Sugar utilization Xylanase +CBM60 CBM60 Modules of approx 120 residues usually found appended to xylanases. The xylan-binding function and the relatedness (circular permutation) to family CBM36 has been demonstrated [PMID: 20659893]. ag Carbon Processing Sugar utilization Xylanase +CBM62 CBM62 The CBM62 module of Clostridium thermocellum Cthe_2193 protein binds galactose moieties found on xyloglucan, arabinogalactan and galactomannan. ag Carbon Processing Sugar utilization Galactose +CBM67 CBM67 Fujimoto et al. [PMID : 23486481] disclosed the L-rhamnose binding activity and 3-D structure of the CBM67 of Streptomyces avermitilis alpha-L-rhamnosidase (SaRha78A); ag Carbon Processing Sugar utilization Rhamnose +CBM71 CBM71 The two CBM71s of S. pneumoniae BgaA bind lactose and LacNAc. ag Carbon Processing Sugar utilization Lactose +CBM9 CBM9 Modules of approx. 170 residues found so far only in xylanases. The cellulose-binding function has been demonstrated in one case. ag Carbon Processing Sugar utilization Xylanase +CE1 CE1 acetyl xylan esterase (EC 3.1.1.72); cinnamoyl esterase (EC 3.1.1.-); feruloyl esterase (EC 3.1.1.73); carboxylesterase (EC 3.1.1.1); S-formylglutathione hydrolase (EC 3.1.2.12); diacylglycerol O-acyltransferase (EC 2.3.1.20); trehalose 6-O-mycolyltransferase (EC 2.3.1.122) ag Carbon Processing Sugar utilization Trehalose +GH11 GH11 endo-beta-1,4-xylanase (EC 3.2.1.8); endo-beta-1,3-xylanase (EC 3.2.1.32) ag Carbon Processing Sugar utilization Glycoside Hydrolase +GH130 GH130 beta-1,4-mannosylglucose phosphorylase (EC 2.4.1.281); beta-1,4-mannooligosaccharide phosphorylase (EC 2.4.1.319); beta-1,4-mannosyl-N-acetyl-glucosamine phosphorylase (EC 2.4.1.320); beta-1,2-mannobiose phosphorylase (EC 2.4.1.-); beta-1,2-oligomannan phosphorylase (EC 2.4.1.-); beta-1,2-mannosidase (EC 3.2.1.-) ag Carbon Processing Sugar utilization Glycoside Hydrolase +GH18 GH18 chitinase (EC 3.2.1.14); lysozyme (EC 3.2.1.17); endo-beta-N-acetylglucosaminidase (EC 3.2.1.96); peptidoglycan hydrolase with endo-beta-N-acetylglucosaminidase specificity (EC 3.2.1.-); Nod factor hydrolase (EC 3.2.1.-); xylanase inhibitor; concanavalin B; narbonin ag Carbon Processing Sugar utilization Glycoside Hydrolase +GH26 GH26 beta-mannanase (EC 3.2.1.78); exo-beta-1,4-mannobiohydrolase (EC 3.2.1.100); beta-1,3-xylanase (EC 3.2.1.32); lichenase / endo-beta-1,3-1,4-glucanase (EC 3.2.1.73); mannobiose-producing exo-beta-mannanase (EC 3.2.1.-) ag Carbon Processing Sugar utilization Glycoside Hydrolase +GH32 GH32 invertase (EC 3.2.1.26); endo-inulinase (EC 3.2.1.7); beta-2,6-fructan 6-levanbiohydrolase (EC 3.2.1.64); endo-levanase (EC 3.2.1.65); exo-inulinase (EC 3.2.1.80); fructan beta-(2,1)-fructosidase/1-exohydrolase (EC 3.2.1.153); fructan beta-(2,6)-fructosidase/6-exohydrolase (EC 3.2.1.154); sucrose:sucrose 1-fructosyltransferase (EC 2.4.1.99); fructan:fructan 1-fructosyltransferase (EC 2.4.1.100); sucrose:fructan 6-fructosyltransferase (EC 2.4.1.10); fructan:fructan 6G-fructosyltransferase (EC 2.4.1.243); levan fructosyltransferase (EC 2.4.1.-); [retaining] sucrose:sucrose 6-fructosyltransferase (6-SST) (EC 2.4.1.-); cycloinulo-oligosaccharide fructanotransferase (EC 2.4.1.-) ag Carbon Processing Sugar utilization Glycoside Hydrolase +GH43 GH43 beta-xylosidase (EC 3.2.1.37); alpha-L-arabinofuranosidase (EC 3.2.1.55); xylanase (EC 3.2.1.8); alpha-1,2-L-arabinofuranosidase (EC 3.2.1.-); exo-alpha-1,5-L-arabinofuranosidase (EC 3.2.1.-); [inverting] exo-alpha-1,5-L-arabinanase (EC 3.2.1.-); beta-1,3-xylosidase (EC 3.2.1.-); [inverting] exo-alpha-1,5-L-arabinanase (EC 3.2.1.-); [inverting] endo-alpha-1,5-L-arabinanase (EC 3.2.1.99); exo-beta-1,3-galactanase (EC 3.2.1.145); beta-D-galactofuranosidase (EC 3.2.1.146) ag Carbon Processing Sugar utilization Glycoside Hydrolase +GH8 GH8 chitosanase (EC 3.2.1.132); cellulase (EC 3.2.1.4); licheninase (EC 3.2.1.73); endo-1,4-beta-xylanase (EC 3.2.1.8); reducing-end-xylose releasing exo-oligoxylanase (EC 3.2.1.156) ag Carbon Processing Sugar utilization Glycoside Hydrolase +GT106 GT106 UDP-beta-L-rhamnose:rhamnogalacturonan I 4-alpha-rhamnosyltransferase (EC 2.4.1.351) ag Carbon Processing Sugar utilization Glycosyl Transferase +GT1 GT1 UDP-glucuronosyltransferase (EC 2.4.1.17); zeatin O-beta-xylosyltransferase (EC 2.4.2.40); 2-hydroxyacylsphingosine 1-beta-galactosyltransferase (EC 2.4.1.45); N-acylsphingosine galactosyltransferase (EC 2.4.1.47); flavonol 3-O-glucosyltransferase (EC 2.4.1.91); anthocyanidin 3-O-glucosyltransferase (EC 2.4.1.115); sinapate 1-glucosyltransferase (EC 2.4.1.120); indole-3-acetate beta-glucosyltransferase (EC 2.4.1.121); flavonol L-rhamnosyltransferase (EC 2.4.1.159); sterol glucosyltransferase (EC 2.4.1.173); UDP-Glc: 4-hydroxybenzoate 4-O-beta-glucosyltransferase (EC 2.4.1.194); zeatin O-beta-glucosyltransferase (EC 2.4.1.203); limonoid glucosyltransferase (EC 2.4.1.210); UDP-GlcA: baicalein 7-O-beta-glucuronosyltransferase (EC 2.4.1.253); UDP-Glc: chalcone 4‚Äö√Ñ√∂‚àö‚Ć‚àö‚àǬ¨¬®¬¨¬¢‚Äö√Ñ√∂‚àö√ë‚àö‚àÇ‚Äö√†√∂‚àö¬∞¬¨¬®¬¨√ܬ¨¬®¬¨¬Æ‚Äö√Ñ√∂‚àö¬¢¬¨√ü-O-beta-glucosyltransferase (EC 2.4.1.286); ecdysteroid UDP-glucosyltransferase (EC 2.4.1.-); salicylic acid beta-glucosyltransferase (EC 2.4.1.-); anthocyanin 3-O-galactosyltransferase (EC 2.4.1.-); anthocyanin 5-O-glucosyltransferase (EC 2.4.1.-); dTDP-beta-2-deoxy-L-fucose: alpha-L-2-deoxyfucosyltransferase (EC 2.4.1.-); UDP-beta-L-rhamnose: alpha-L-rhamnosyltransferase (EC 2.4.1.-); zeaxanthin glucosyltransferase (EC 2.4.1.-); flavone 8-C-glycosyltransferase ag Carbon Processing Sugar utilization Glycosyl Transferase +GT20 GT20 alpha,alpha-trehalose-phosphate synthase [UDP-forming] (EC 2.4.1.15); Glucosylglycerol-phosphate synthase (EC 2.4.1.213); trehalose-6-P phosphatase (EC 3.1.3.12); [retaining] GDP-valeniol: validamine 7-phosphate valeniolyltransferase (EC 2.-.-.-) ag Carbon Processing Sugar utilization Glycosyl Transferase +GT31 GT31 N-acetyllactosaminide beta-1,3-N-acetylglucosaminyltransferase (EC 2.4.1.149); Glycoprotein-N-acetylgalactosamine 3-beta-galactosyltransferase (EC 2.4.1.122); fucose-specific beta-1,3-N-acetylglucosaminyltransferase (EC 2.4.1.-); globotriosylceramide beta-1,3-GalNAc transferase (EC 2.4.1.79); chondroitin synthase (beta-1,3-GlcUA and beta-1,4-GalNAc transferase (EC 2.4.1.175); chondroitin beta-1,3-glucuronyltransferase (EC 2.4.1.226); chondroitin beta-1,4-N-acetylgalactosaminyltransferase (EC 2.4.1.-); UDP-Gal: beta-galactosylxylosylprotein beta-1,3-galactosyltransferase (EC 2.4.1.134); UDP-GlcNAc: O-fucosylpeptide beta-1,3-N-acetylglucosaminyltransferase (EC 2.4.1.222) ag Carbon Processing Sugar utilization Glycosyl Transferase +GT32 GT32 alpha-1,6-mannosyltransferase (EC 2.4.1.-); alpha-1,4-N-acetylglucosaminyltransferase (EC 2.4.1.-); alpha-1,4-N-acetylgalactosaminyltransferase (EC 2.4.1.-); GDP-Man: inositol-phosphorylceramide transferase (EC 2.4.1.-); UDP-Gal: beta-galactoside alpha-1,4-galactosyltransferase (EC 2.4.1.-); UDP-Gal: lactose/N-acetyl-lactosamine alpha-1,4-galactosyltransferase (EC 2.4.1.-); UDP-Glc: protein alpha-glucosyltransferase (EC 2.4.1.-) ag Carbon Processing Sugar utilization Glycosyl Transferase +GT4 GT4 sucrose synthase (EC 2.4.1.13); sucrose-phosphate synthase (EC 2.4.1.14); alpha-glucosyltransferase (EC 2.4.1.52); lipopolysaccharide N-acetylglucosaminyltransferase (EC 2.4.1.56); phosphatidylinositol alpha-mannosyltransferase (EC 2.4.1.57); GDP-Man: Man1GlcNAc2-PP-dolichol alpha-1,3-mannosyltransferase (EC 2.4.1.132); GDP-Man: Man3GlcNAc2-PP-dolichol/Man4GlcNAc2-PP-dolichol alpha-1,2-mannosyltransferase (EC 2.4.1.131); digalactosyldiacylglycerol synthase (EC 2.4.1.141); 1,2-diacylglycerol 3-glucosyltransferase (EC 2.4.1.157); diglucosyl diacylglycerol synthase (EC 2.4.1.208); trehalose phosphorylase (EC 2.4.1.231); NDP-Glc: alpha-glucose alpha-glucosyltransferase / alpha,alpha-trehalose synthase (EC 2.4.1.245); GDP-Man: Man2GlcNAc2-PP-dolichol alpha-1,6-mannosyltransferase (EC 2.4.1.257); UDP-GlcNAc: 2-deoxystreptamine alpha-N-acetylglucosaminyltransferase (EC 2.4.1.283); UDP-GlcNAc: ribostamycin alpha-N-acetylglucosaminyltransferase (EC 2.4.1.285); UDP-Gal alpha-galactosyltransferase (EC 2.4.1.-); UDP-Xyl alpha-xylosyltransferase (EC 2.4.2.-); UDP-GlcA alpha-glucuronyltransferase (EC 2.4.1.-); UDP-Glc alpha-glucosyltransferase (EC 2.4.1.-); UDP-GalNAc: GalNAc-PP-Und alpha-1,3-N-acetylgalactosaminyltransferase (EC 2.4.1.306); UDP-GalNAc: N,N'-diacetylbacillosaminyl-PP-Und alpha-1,3-N-acetylgalactosaminyltransferase (EC 2.4.1.290); ADP-dependent alpha-maltose-1-phosphate synthase (2.4.1.342) ag Carbon Processing Sugar utilization Glycosyl Transferase +GT7 GT7 lactose synthase (EC 2.4.1.22); beta-N-acetylglucosaminyl-glycopeptide beta-1,4-galactosyltransferase (EC 2.4.1.38); N-acetyllactosamine synthase (EC 2.4.1.90); xylosylprotein beta-4-galactosyltransferase (EC 2.4.1.133); UDP-Gal: neolactotriaosylceramide beta-1,4-galactosyltransferase (EC 2.4.1.275); beta-1,4-N-acetylglucosaminyltransferase (EC 2.4.1.-) ag Carbon Processing Sugar utilization Glycosyl Transferase +GT83 GT83 undecaprenyl phosphate-alpha-L-Ara4N: 4-amino-4-deoxy-beta-L-arabinosyltransferase (EC 2.4.2.43); dodecaprenyl phosphate-beta-galacturonic acid: lipopolysaccharide core alpha-galacturonosyl transferase (EC 2.4.1.-) ag Carbon Processing Sugar utilization Glycosyl Transferase +PL27 PL27 L-rhamnose-alpha-1,4-D-glucuronate lyase (EC 4.2.2.-) ag Carbon Processing Sugar utilization Rhamnose +K10108 malE; maltose/maltodextrin transport system substrate-binding protein ag Carbon Processing Sugar utilization Maltose +K10109 malF; maltose/maltodextrin transport system permease protein ag Carbon Processing Sugar utilization Maltose +K10110 malG; maltose/maltodextrin transport system permease protein ag Carbon Processing Sugar utilization Maltose +K10111 malK; maltose/maltodextrin transport system ATP-binding protein [EC:3.6.3.19] ag Carbon Processing Sugar utilization Maltose +K10112 msmX; maltose/maltodextrin transport system ATP-binding protein ag Carbon Processing Sugar utilization Maltose +K10188 lacE; lactose/L-arabinose transport system substrate-binding protein ag Carbon Processing Sugar utilization Lactose +K10189 lacF; lactose/L-arabinose transport system permease protein ag Carbon Processing Sugar utilization Lactose +K10190 lacG; lactose/L-arabinose transport system permease protein ag Carbon Processing Sugar utilization Lactose +K10191 lacK; lactose/L-arabinose transport system ATP-binding protein ag Carbon Processing Sugar utilization Lactose +K10196 ABC.GLC.S; glucose/arabinose transport system substrate-binding protein ag Carbon Processing Sugar utilization Glucose +K10197 ABC.GLC.P; glucose/arabinose transport system permease protein ag Carbon Processing Sugar utilization Glucose +K10198 ABC.GLC.P1; glucose/arabinose transport system permease protein ag Carbon Processing Sugar utilization Glucose +K10199 ABC.GLC.A; glucose/arabinose transport system ATP-binding protein ag Carbon Processing Sugar utilization Glucose +K10236 thuE; trehalose/maltose transport system substrate-binding protein ag Carbon Processing Sugar utilization Trehalose +K10237 thuF; trehalose/maltose transport system permease protein ag Carbon Processing Sugar utilization Trehalose +K10238 thuG; trehalose/maltose transport system permease protein ag Carbon Processing Sugar utilization Trehalose +K10439 rbsB; ribose transport system substrate-binding protein ag Carbon Processing Sugar utilization Ribose +K10440 rbsC; ribose transport system permease protein ag Carbon Processing Sugar utilization Ribose +K10441 rbsA; ribose transport system ATP-binding protein [EC:3.6.3.17] ag Carbon Processing Sugar utilization Ribose +K10543 xylF; D-xylose transport system substrate-binding protein ag Carbon Processing Sugar utilization Xylose +K10544 xylH; D-xylose transport system permease protein ag Carbon Processing Sugar utilization Xylose +K10545 xylG; D-xylose transport system ATP-binding protein [EC:3.6.3.17] ag Carbon Processing Sugar utilization Xylose +K10552 frcB; fructose transport system substrate-binding protein ag Carbon Processing Sugar utilization Fructose +K10553 frcC; fructose transport system permease protein ag Carbon Processing Sugar utilization Fructose +K10554 frcA; fructose transport system ATP-binding protein ag Carbon Processing Sugar utilization Fructose +K10559 rhaS1; rhamnose transport system substrate-binding protein ag Carbon Processing Sugar utilization Rhamnose +K10560 rhaP; rhamnose transport system permease protein ag Carbon Processing Sugar utilization Rhamnose +K10561 rhaQ; rhamnose transport system permease protein ag Carbon Processing Sugar utilization Rhamnose +K10562 rhaT; rhamnose transport system ATP-binding protein [EC:3.6.3.17] ag Carbon Processing Sugar utilization Rhamnose +K02777 PTS-Glc-EIIA; PTS system, glucose-specific IIA component ag Carbon Processing Sugar utilization Glucose +K02778 PTS-Glc-EIIB; PTS system, glucose-specific IIB component ag Carbon Processing Sugar utilization Glucose +K02779 PTS-Glc-EIIC; PTS system, glucose-specific IIC component ag Carbon Processing Sugar utilization Glucose +K02790 PTS-MalGlc-EIIB; PTS system, maltose/glucose-specific IIB component ag Carbon Processing Sugar utilization Maltose +K02791 PTS-MalGlc-EIIC; PTS system, maltose/glucose-specific IIC component ag Carbon Processing Sugar utilization Maltose +K02808 PTS-Scr-EIIA; PTS system, sucrose-specific IIA component ag Carbon Processing Sugar utilization Sucrose +K02809 PTS-Scr-EIIB; PTS system, sucrose-specific IIB component ag Carbon Processing Sugar utilization Sucrose +K02810 PTS-Scr-EIIC; PTS system, sucrose-specific IIC component ag Carbon Processing Sugar utilization Sucrose +K02817 PTS-Tre-EIIA; PTS system, trehalose-specific IIA component ag Carbon Processing Sugar utilization Trehalose +K02818 PTS-Tre-EIIB; PTS system, trehalose-specific IIB component ag Carbon Processing Sugar utilization Trehalose +K02819 PTS-Tre-EIIC; PTS system, trehalose-specific IIC component ag Carbon Processing Sugar utilization Trehalose +K02768 PTS-Fru-EIIA; PTS system, fructose-specific IIA component ag Carbon Processing Sugar utilization Fructose +K02769 PTS-Fru-EIIB; PTS system, fructose-specific IIB component ag Carbon Processing Sugar utilization Fructose +K02770 PTS-Fru-EIIC; PTS system, fructose-specific IIC component ag Carbon Processing Sugar utilization Fructose +K02793 PTS-Man-EIIA; PTS system, mannose-specific IIA component ag Carbon Processing Sugar utilization Mannose +K02786 PTS-Lac-EIIA; PTS system, lactose-specific IIA component ag Carbon Processing Sugar utilization Lactose +K02787 PTS-Lac-EIIB; PTS system, lactose-specific IIB component ag Carbon Processing Sugar utilization Lactose +K02788 PTS-Lac-EIIC; PTS system, lactose-specific IIC component ag Carbon Processing Sugar utilization Lactose +K11194 PTS-Fru1-EIIA; PTS system, fructose-specific IIA component ag Carbon Processing Sugar utilization Fructose +K11195 PTS-Fru1-EIIB; PTS system, fructose-specific IIB component ag Carbon Processing Sugar utilization Fructose +K11196 PTS-Fru1-EIIC; PTS system, fructose-specific IIC component ag Carbon Processing Sugar utilization Fructose +K02771 PTS-Fru1-EIID; PTS system, fructose-specific IID component ag Carbon Processing Sugar utilization Fructose +K11201 PTS-Fru2-EIIA; PTS system, fructose-specific IIA-like component ag Carbon Processing Sugar utilization Fructose +K11202 PTS-Fru2-EIIB; PTS system, fructose-specific IIB-like component ag Carbon Processing Sugar utilization Fructose +K11203 PTS-Fru2-EIIC; PTS system, fructose-specific IIC-like component ag Carbon Processing Sugar utilization Fructose +K17311 K17311; trehalose transport system substrate-binding protein ag Carbon Processing Sugar utilization Trehalose +K17312 K17312; trehalose transport system permease protein ag Carbon Processing Sugar utilization Trehalose +K17313 treU; trehalose transport system permease protein ag Carbon Processing Sugar utilization Trehalose +K17314 treV; trehalose transport system ATP-binding protein ag Carbon Processing Sugar utilization Trehalose +K17315 gtsA; glucose/mannose transport system substrate-binding protein ag Carbon Processing Sugar utilization Glucose +K17316 gtsB; glucose/mannose transport system permease protein ag Carbon Processing Sugar utilization Glucose +K17317 gtsC; glucose/mannose transport system permease protein ag Carbon Processing Sugar utilization Glucose +K19506 PTS-Gfr-EIIA; PTS system, fructoselysine/glucoselysine-specific IIA component ag Carbon Processing Sugar utilization Fructose +K19507 PTS-Gfr-EIIB; PTS system, fructoselysine/glucoselysine-specific IIB component ag Carbon Processing Sugar utilization Fructose +K19508 PTS-Gfr-EIIC; PTS system, fructoselysine/glucoselysine-specific IIC component ag Carbon Processing Sugar utilization Fructose +K19509 PTS-Gfr-EIID; PTS system, fructoselysine/glucoselysine-specific IID component ag Carbon Processing Sugar utilization Fructose +K20107 PTS-Mal-EIIB; PTS system, maltose-specific IIB component ag Carbon Processing Sugar utilization Maltose +K20108 PTS-Mal-EIIC; PTS system, maltose-specific IIC component ag Carbon Processing Sugar utilization Maltose +K20112 PTS-Gal-EIIA; PTS system, galactose-specific IIA component ag Carbon Processing Sugar utilization Galactose +K20113 PTS-Gal-EIIB; PTS system, galactose-specific IIB component ag Carbon Processing Sugar utilization Galactose +K20114 PTS-Gal-EIIC; PTS system, galactose-specific IIC component ag Carbon Processing Sugar utilization Galactose +K20116 PTS-Glc1-EIIA; PTS system, glucose-specific IIA component ag Carbon Processing Sugar utilization Glucose +K20117 PTS-Glc1-EIIB; PTS system, glucose-specific IIB component ag Carbon Processing Sugar utilization Glucose +K20118 PTS-Glc1-EIIC; PTS system, glucose-specific IIC component ag Carbon Processing Sugar utilization Glucose +K01812 glucuronate isomerase ag Carbon Processing Sugar utilization Galacturonic Acid +K00041 tagaturonate reductase ag Carbon Processing Sugar utilization Galacturonic Acid +K01685 altronate hydrolase ag Carbon Processing Sugar utilization Galacturonic Acid +K16849 altronate dehydratase small subunit ag Carbon Processing Sugar utilization Galacturonic Acid +K16850 altronate dehydratase large subunit ag Carbon Processing Sugar utilization Galacturonic Acid +K00874 2-dehydro-3-deoxygluconokinase ag Carbon Processing Sugar utilization Galacturonic Acid +K01190 beta-galactosidase ag Carbon Processing Sugar utilization Lactose +K12111 evolved beta-galactosidase subunit alpha ag Carbon Processing Sugar utilization Lactose +K12112 evolved beta-galactosidase subunit beta ag Carbon Processing Sugar utilization Lactose +K12309 beta-galactosidase ag Carbon Processing Sugar utilization Lactose +K01203 sucrase-isomaltase ag Carbon Processing Sugar utilization Sucrose +K12047 maltase-glucoamylase ag Carbon Processing Sugar utilization Sucrose +K00690 sucrose phosphorylase ag Carbon Processing Sugar utilization Sucrose +K01809 mannose-6-phosphate isomerase ag Carbon Processing Sugar utilization Mannose +K14273 D-xylose 1-dehydrogenase (NADP+) ag Carbon Processing Sugar utilization Xylose +GH172 difructose-anhydride-I synthase (EC 4.2.1.179 (old 3.2.1.134)); alpha-D-Arabinofuranosidase (EC 3.2.1.-); alpha-D-Fructofuranosidase (EC 3.2.1.-) ag Carbon Processing Sugar utilization Fructose +PL42 L-rhamnose-_-1,4-D-glucuronate lyase (EC 4.2.2.-); L-Rh_-_-1,4-GlcA _-L-rhamnohydrolase (EC 3.2.1.-) ag Carbon Processing Sugar utilization Rhamnose +CBM88 Binding to terminal galactose in galactoxyloglucan and galactomannan ag Carbon Processing Sugar utilization Galactose +K01188 beta-glucosidase [EC:3.2.1.21] Hydrolysis of terminal β-D-glucosyl residues (from cellulose) ag Enzyme Assay Analogs Hydrolytic Enzymes +K05349 beta-glucosidase [EC:3.2.1.21] Hydrolysis of terminal β-D-glucosyl residues (from cellulose) ag Enzyme Assay Analogs Hydrolytic Enzymes +K05350 beta-glucosidase [EC:3.2.1.21] Hydrolysis of terminal β-D-glucosyl residues (from cellulose) ag Enzyme Assay Analogs Hydrolytic Enzymes +K01198 xylan 1,4-beta-xylosidase [EC:3.2.1.37] Hydrolysis of β-D-xylose residues ag Enzyme Assay Analogs Hydrolytic Enzymes +K15920 xylan 1,4-beta-xylosidase [EC:3.2.1.37] Hydrolysis of β-D-xylose residues ag Enzyme Assay Analogs Hydrolytic Enzymes +K22268 xylan 1,4-beta-xylosidase [EC:3.2.1.37] Hydrolysis of β-D-xylose residues ag Enzyme Assay Analogs Hydrolytic Enzymes +K01130 arylsulfatase [EC:3.1.6.1] Hydrolysis of aromatic sulfate esters ag Enzyme Assay Analogs Hydrolytic Enzymes +K01227 mannosyl-glycoprotein endo-beta-N-acetylglucosaminidase [EC:3.2.1.96] Hydrolysis of chitin N-acetyl-β-D-glucosaminide ag Enzyme Assay Analogs Hydrolytic Enzymes +K13714 bifunctional autolysin [EC:3.2.1.96] Hydrolysis of chitin N-acetyl-β-D-glucosaminide ag Enzyme Assay Analogs Hydrolytic Enzymes +K23989 mannosyl-glycoprotein endo-beta-N-acetylglucosaminidase [EC:3.2.1.96] Hydrolysis of chitin N-acetyl-β-D-glucosaminide ag Enzyme Assay Analogs Hydrolytic Enzymes +K01078 acid phosphatase [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes +K01093 4-phytase / acid phosphatase [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes +K03788 acid phosphatase (class B) [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes +K09474 acid phosphatase (class A) [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes +K14379 tartrate-resistant acid phosphatase type 5 [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes +K14394 low molecular weight phosphotyrosine protein phosphatase [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes +K14395 lysophosphatidic acid phosphatase type 6 [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes +K14410 lysosomal acid phosphatase [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes +K19283 prostatic acid phosphatase [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes +K19284 testicular acid phosphatase [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes +K23458 repressible acid phosphatase [EC:3.1.3.2] Hydrolysis of phosphate monoesters ag Enzyme Assay Analogs Hydrolytic Enzymes +K01255 leucyl aminopeptidase [EC:3.4.11.1] Breakdown of leucine residues at the N-terminus of peptides ag Enzyme Assay Analogs Hydrolytic Enzymes +K11142 cytosol aminopeptidase [EC:3.4.11.1] Breakdown of leucine residues at the N-terminus of peptides ag Enzyme Assay Analogs Hydrolytic Enzymes +K01225 cellulose 1,4-beta-cellobiosidase [EC:3.2.1.91] Hydrolysis of β-D-glucosyl linkages (from cellulose) ag Enzyme Assay Analogs Hydrolytic Enzymes +K19668 cellulose 1,4-beta-cellobiosidase [EC:3.2.1.91] Hydrolysis of β-D-glucosyl linkages (from cellulose) ag Enzyme Assay Analogs Hydrolytic Enzymes +K01187 alpha-glucosidase [EC:3.2.1.20] Hydrolysis of α-D-glucosyl linkages (starch, maltose, sucrose) ag Enzyme Assay Analogs Hydrolytic Enzymes +K12047 maltase-glucoamylase [EC:3.2.1.20] Hydrolysis of α-D-glucosyl linkages (starch, maltose, sucrose) ag Enzyme Assay Analogs Hydrolytic Enzymes +K12316 lysosomal alpha-glucosidase [EC:3.2.1.20] Hydrolysis of α-D-glucosyl linkages (starch, maltose, sucrose) ag Enzyme Assay Analogs Hydrolytic Enzymes +K12317 neutral alpha-glucosidase C [EC:3.2.1.20] Hydrolysis of α-D-glucosyl linkages (starch, maltose, sucrose) ag Enzyme Assay Analogs Hydrolytic Enzymes +K05910 NADH peroxidase [EC:1.11.1.-] Use of peroxide as electron acceptor to depolymerize lignin ag Enzyme Assay Analogs Oxidative Enzymes +K00421 laccase [EC:1.10.3.2] Oxidation of aromatic rings in phenolics ag Enzyme Assay Analogs Oxidative Enzymes +K05909 laccase [EC:1.10.3.2] Oxidation of aromatic rings in phenolics ag Enzyme Assay Analogs Oxidative Enzymes diff --git a/bin/assets/forms/distill_sheets/distill_camper.tsv b/bin/assets/forms/distill_sheets/distill_camper.tsv old mode 100755 new mode 100644 index ab2f0fad..d11c2420 --- a/bin/assets/forms/distill_sheets/distill_camper.tsv +++ b/bin/assets/forms/distill_sheets/distill_camper.tsv @@ -130,7 +130,7 @@ K03381 catA; catechol 1,2-dioxygenase [EC:1.13.11.1] catechol degradation- ortho K03464 catC; muconolactone D-isomerase [EC:5.3.3.4] catechol degradation- ortho cleavage (oxic) CAMPER polyphenols;other_polyphenols;other_polyphenols;catechol Step 3 (+)-Muconolactone => 3-Oxoadipate enol-lactone oxic EC:5.3.3.4 K03464 K03862 vanA; vanillate monooxygenase subunit A vanillate conversion to protocatechuate route 1 (oxic) CAMPER polyphenols;phenolic_acids;hydroxybenzoic_acids;vanillic_acid step 1 subunit A vanillate => protocatechuate, formaldehyde oxic EC:1.14.13.82 K03862 K03863 vanB; vanillate monooxygenase subunit B vanillate conversion to protocatechuate route 1 (oxic) CAMPER polyphenols;phenolic_acids;hydroxybenzoic_acids;vanillic_acid step 1 subunit B vanillate => protocatechuate, formaldehyde oxic EC:1.14.13.82 K03863 -K04098 chqB; hydroxyquinol 1,2-dioxygenase resorcylic acid degradation (oxic) CAMPER polyphenols;other_polyphenols;other_polyphenols;resorcinol step 3 hydroxyquinol => 3-Hydroxy-cis,cis-muconate oxic EC:1.13.11.37 K04098 +K04098 chqB; hydroxyquinol 1,2-dioxygenase resorcylic acid degradation (oxic) CAMPER polyphenols;other_polyphenols;other_polyphenols;resorcinol step 3 hydroxyquinol => 3-Hydroxy-cis,cis-muconate oxic EC:1.13.11.37 K04098 K04099 GalA;gallate dioxygenase gallate degradation (oxic) CAMPER polyphenols;phenolic_acids;hydroxybenzoic_acids;gallic_acid step 1 gallate => (1E)-4-oxobut-1-ene-1,2,4-tricarboxylate oxic EC:1.13.11.57 feeds to protocatechuate meta-cleavage K04099 K04100 ligA; protocatechuate 4,5-dioxygenase, alpha chain protocatechuic acid degradation- meta-cleavage (oxic) CAMPER polyphenols;phenolic_acids;hydroxybenzoic_acids;protocatechuic_acid step 1 subunit A protocatechuate => 2-hydroxy-4-carboxymuconic semialdehyde oxic EC:1.13.11.8 K04100 K04101 ligB; protocatechuate 4,5-dioxygenase, beta chain protocatechuic acid degradation- meta-cleavage (oxic) CAMPER polyphenols;phenolic_acids;hydroxybenzoic_acids;protocatechuic_acid step 1 subunit B protocatechuate => 2-hydroxy-4-carboxymuconic semialdehyde oxic EC:1.13.11.8 K04101 @@ -203,9 +203,9 @@ K10216 dmpD; 2-hydroxymuconic semialdehyde hydrolase 4-methylcatechol degradatio K10217 dmpC; 2-hydroxymuconate semialdehyde dehydrogenase catechol degradation- meta-cleavage route 1 (oxic) CAMPER polyphenols;other_polyphenols;other_polyphenols;catechol route 1 step 2 2-Hydroxymuconate semialdehyde => 2-Hydroxymuconate oxic EC:1.2.1.85 K10217 K10217 dmpC; 2-hydroxymuconate semialdehyde dehydrogenase 4-methylcatechol degradation- meta-cleavage route 1 (oxic) CAMPER polyphenols;other_polyphenols;other_polyphenols;4-methylcatechol route 1 step 2 2-Hydroxy-5-methyl-cis,cis-muconic semialdehyde => 2-Hydroxy-5-methyl-cis,cis-muconate oxic EC:1.2.1.85 K10217 K10218 ligK; 4-oxalocitramalate aldolase protocatechuic acid degradation- meta-cleavage (oxic) CAMPER polyphenols;phenolic_acids;hydroxybenzoic_acids;protocatechuic_acid step 6 2-hydroxy-4-oxobutane-1,2,4-tricarboxylate => pyruvate, oxaloacetate oxic EC:4.1.3.17 K10218 -K10219 ligC; 2-hydroxy-4-carboxymuconic-6-semialdehyde dehydrogenase protocatechuic acid degradation- meta-cleavage (oxic) CAMPER polyphenols;phenolic_acids;hydroxybenzoic_acids;protocatechuic_acid step 2 2-hydroxy-4-carboxymuconic semialdehyde hemiacetal => 2-pyrone-4,6-dicarboxylate oxic EC:1.1.1.312 K10219 +K10219 ligC; 2-hydroxy-4-carboxymuconic-6-semialdehyde dehydrogenase protocatechuic acid degradation- meta-cleavage (oxic) CAMPER polyphenols;phenolic_acids;hydroxybenzoic_acids;protocatechuic_acid step 2 2-hydroxy-4-carboxymuconic semialdehyde hemiacetal => 2-pyrone-4,6-dicarboxylate oxic EC:1.1.1.312 K10219 K10219 ligC; 2-hydroxy-4-carboxymuconate semialdehyde hemiacetal dehydrogenase [EC:1.1.1.312] homoprotocatechuic acid degradation (oxic) CAMPER polyphenols;phenolic_acids;hydroxyphenylacetic_acids;homoprotocatechuic_acid step 2 b 2-Hydroxy-5-carboxymethylmuconate semialdehyde <=> 5-Carboxymethyl-2-hydroxymuconate oxic EC:1.1.1.312 K10219 -K10220|K16515 ligJ; 4-oxalomescaconate hydratase protocatechuic acid degradation- meta-cleavage (oxic) CAMPER polyphenols;phenolic_acids;hydroxybenzoic_acids;protocatechuic_acid step 5 (1E,3E)-4-hydroxybuta-1,3-diene-1,2,4-tricarboxylate => 2-hydroxy-4-oxobutane-1,2,4-tricarboxylate oxic EC:4.2.1.83 K10220|K16515 +K10220|K16515 ligJ; 4-oxalomescaconate hydratase protocatechuic acid degradation- meta-cleavage (oxic) CAMPER polyphenols;phenolic_acids;hydroxybenzoic_acids;protocatechuic_acid step 5 (1E,3E)-4-hydroxybuta-1,3-diene-1,2,4-tricarboxylate => 2-hydroxy-4-oxobutane-1,2,4-tricarboxylate oxic EC:4.2.1.83 K10220|K16515 K10221 ligI; 2-pyrone-4,6-dicarboxylate hydrolase protocatechuic acid degradation- meta-cleavage (oxic) CAMPER polyphenols;phenolic_acids;hydroxybenzoic_acids;protocatechuic_acid step 3 2-pyrone-4,6-dicarboxylate => (1E)-4-oxobut-1-ene-1,2,4-tricarboxylate oxic EC:3.1.1.57 K10221 K10222 bphD; 2,6-dioxo-6-phenylhexa-3-enoate hydrolase [EC:3.7.1.8] biphenyl conversion to benzoate (oxic) CAMPER non-polyphenol;aromatic_hydrocarbon;biphenyl step 4 2-Hydroxy-6-oxo-6-phenylhexa-2,4-dienoate + 2-Hydroxy-2,4-pentadienoate + Benzoate oxic EC:3.7.1.8 K10222 K10616 cymAa; p-cymene methyl-monooxygenase [EC:1.14.15.25] cymene conversion to cumic acid (oxic) CAMPER non-polyphenol;aromatic_hydrocarbon;terpenoid;p-cymene step 1 subunit A p-Cymene => p-Cumic alcohol oxic EC:1.14.15.25 K10616 @@ -336,9 +336,9 @@ K18364 bphH; 2-oxopent-4-enoate hydratase catechol degradation- meta-cleavage ro K18364 bphH; 2-oxopent-4-enoate hydratase 4-methylcatechol degradation- meta-cleavage route 1 (oxic) CAMPER polyphenols;other_polyphenols;other_polyphenols;4-methylcatechol route 1 step 5 2-Hydroxy-cis-hex-2,4-dienoate => 4-Hydroxy-2-oxohexanoic acid oxic EC:4.2.1.132 K18364 K18365 bphI; 4-hydroxy-2-oxovalerate/4-hydroxy-2-oxohexanoate aldolase [EC:4.1.3.39 4.1.3.43] catechol degradation- meta-cleavage route 1 (oxic) CAMPER polyphenols;other_polyphenols;other_polyphenols;catechol route 1 step 6 4-Hydroxy-2-oxopentanoate => Acetaldehyde + Pyruvate oxic EC:4.1.3.39,EC:4.1.3.43 K18365 K18365 bphI; 4-hydroxy-2-oxovalerate/4-hydroxy-2-oxohexanoate aldolase [EC:4.1.3.39 4.1.3.43] 4-methylcatechol degradation- meta-cleavage route 1 (oxic) CAMPER polyphenols;other_polyphenols;other_polyphenols;4-methylcatechol route 1 step 6 4-Hydroxy-2-oxohexanoic acid => Propanal + Pyruvate oxic EC:4.1.3.39,EC:4.1.3.43 K18365 -K18383 feruloyl-CoA hydratase/lyase ferulic acid conversion to vanillin (oxic) CAMPER polyphenols;phenolic_acids;hydroxycinnamic_acids;ferulic_acid Step 2 feruloyl-CoA => vanillin oxic EC:4.1.2.61 K18383 +K18383 feruloyl-CoA hydratase/lyase ferulic acid conversion to vanillin (oxic) CAMPER polyphenols;phenolic_acids;hydroxycinnamic_acids;ferulic_acid Step 2 feruloyl-CoA => vanillin oxic EC:4.1.2.61 K18383 K19065 mobA; 3-hydroxybenzoate 4-monooxygenase [EC:1.14.13.23] 3-hydroxybenzoate conversion to protocatechuic acid (oxic) CAMPER polyphenols;phenolic_acids;hydroxybenzoic_acids;3-hydroxybenzoic_acid step 1 3-hydroxybenzoate => 3,4-dihydroxybenzoate oxic EC:1.14.13.23 K19065 -K19066 cyclohex-1-ene-1-carbonyl-CoA dehydrogenase [EC:1.3.8.10] benzoyl-coa degradation route 3 (anoxic) CAMPER non-polyphenol;aromatic_hydrocarbon;benzoyl-coa route 3 step 2 Cyclohex-1-ene-1-carboxyl-CoA => Cyclohexa-1,5-diene-1-carbonyl-CoA anoxic EC:1.3.8.10 K19066 +K19066 cyclohex-1-ene-1-carbonyl-CoA dehydrogenase [EC:1.3.8.10] benzoyl-coa degradation route 3 (anoxic) CAMPER non-polyphenol;aromatic_hydrocarbon;benzoyl-coa route 3 step 2 Cyclohex-1-ene-1-carboxyl-CoA => Cyclohexa-1,5-diene-1-carbonyl-CoA anoxic EC:1.3.8.10 K19066 K19515 benzoyl-CoA reductase subunit BamB [EC:1.3.-.-] benzoyl-coa degradation route 2 (anoxic) CAMPER non-polyphenol;aromatic_hydrocarbon;benzoyl-coa route 2 step 1 subunit B Benzoyl-CoA => Cyclohexa-1,5-diene-1-carbonyl-CoA anoxic K19515 K19516 benzoyl-CoA reductase subunit BamC [EC:1.3.-.-] benzoyl-coa degradation route 2 (anoxic) CAMPER non-polyphenol;aromatic_hydrocarbon;benzoyl-coa route 2 step 1 subunit C Benzoyl-CoA => Cyclohexa-1,5-diene-1-carbonyl-CoA anoxic K19516 K19629 tsaD; 4-(hydroxymethyl)benzenesulfonate dehydrogenase [EC:1.1.1.257] toluene-4-sulfonate conversion to protocatechuic acid (oxic) CAMPER non-polyphenol;aromatic_hydrocarbon;toluene-4-sulfonate step 2 4-Sulfobenzyl alcohol => 4-formylbenzenesulfonate oxic EC:1.1.1.257 K19629 diff --git a/bin/assets/forms/distill_sheets/distill_carbon.tsv b/bin/assets/forms/distill_sheets/distill_carbon.tsv old mode 100755 new mode 100644 diff --git a/bin/assets/forms/distill_sheets/distill_energy.tsv b/bin/assets/forms/distill_sheets/distill_energy.tsv old mode 100755 new mode 100644 diff --git a/bin/assets/forms/distill_sheets/distill_eng_sys.tsv b/bin/assets/forms/distill_sheets/distill_eng_sys.tsv old mode 100755 new mode 100644 index b17c925d..92a71444 --- a/bin/assets/forms/distill_sheets/distill_eng_sys.tsv +++ b/bin/assets/forms/distill_sheets/distill_eng_sys.tsv @@ -154,29 +154,29 @@ K21009 PelD; EPS engineered systems engineered systems biofilm formation EPS pro K21010 PelD; EPS engineered systems engineered systems biofilm formation EPS production K21011 PelD; EPS engineered systems engineered systems biofilm formation EPS production K21012 PelD; EPS engineered systems engineered systems biofilm formation EPS production -K04455 HSPB1; heat shock protein family B (small) member 1 engineered systems engineered systems heat tolerance -K03667 "ttm:Tthe_1460 heat shock protein HslVU ATPase subunit HslU; K03667 AAA_2 AAA ClpB_D2-small AAA_5 AAA_22 AAA_16 Mg_chelatase Sigma54_activat MCM AAA_18 RuvB_N ABC_tran NTPase_1 TniB AAA_28 AAA_33 Zeta_toxin AAA_7 IstB_IS21 TIP49 TsaE FAS_meander AAA_19 DEAD" engineered systems engineered systems heat tolerance -K13993 ttm:Tthe_0173 heat shock protein Hsp20; K13993 HSP20 ArsA_HSP20 CS engineered systems engineered systems heat tolerance -K03686 blq:L21SP5_01031 dnaJ; Heat shock protein J; K03686 DnaJ_C DnaJ DnaJ_CXXCXGXG Anti-TRAP engineered systems engineered systems heat tolerance -K04762 pet:PEIBARAKI_4309 heat shock protein 15; K04762 S4 engineered systems engineered systems heat tolerance -K05801 tli:Tlie_1612 heat shock protein DnaJ domain protein; K05801 DnaJ 3HBOH engineered systems engineered systems heat tolerance -K03799 "mem:Memar_2252 Heat shock protein Metallo peptidase MEROPS family M48B; K03799 Peptidase_M48 Peptidase_M56 Peptidase_U49 SprT-like DUF2268 Pex24p" engineered systems engineered systems heat tolerance -K03705 tte:TTE0953 HrcA; Transcriptional regulator of heat shock gene; K03705 HrcA HrcA_DNA-bdg HTH_11 HTH_DeoR engineered systems engineered systems heat tolerance -K03687 tte:TTE0954 GrpE; Molecular chaperone GrpE (heat shock protein); K03687 GrpE Herpes_UL6 GldM_N Complex1_LYR Trans_reg_C DUF573 KxDL Atg14 DUF87 engineered systems engineered systems heat tolerance -K13640 cha:CHAB381_0975 putative heat shock protein HspR; K13640 MerR_1 MerR_2 MerR HTH_17 HTH_3 PKcGMP_CC TolA_bind_tri HTH_23 engineered systems engineered systems heat tolerance -K01419 "hor:Hore_07560 heat shock protein HslVU ATP dependent protease HslV; K01419 Proteasome" engineered systems engineered systems heat tolerance -K07721 "tko:TK2291 archaeal heat shock regulator ArsR family; K07721 HTH_5 HTH_20 ArsR HTH_24 PadR TrmB MarR_2 HTH_CodY HTH_11 PSY3 MscS_porin GntR DprA_WH HTH_10 LexA_DNA_bind HxlR IF2_N DUF4795 DUF2205" engineered systems engineered systems heat tolerance -K19411 "min:Minf_0201 mcsA; Modulator of heat shock repressor CtsR McsA; K19411 UVR TackOD1 XFP A2L_zn_ribbon HypA" engineered systems engineered systems heat tolerance -K22447 thv:ADU37_CDS16120 Heat shock protein 60 family chaperone GroEL / Thermosome subunit; K22447 Cpn60_TCP1 AAA_5 engineered systems engineered systems heat tolerance -K04079 csh:Closa_3215 Heat shock protein Hsp90-like protein; K04079 HSP90 HATPase_c_3 HATPase_c engineered systems engineered systems heat tolerance -K04083 cst:CLOST_0638 hslO; disulfide bond chaperone (heat shock protein HSP33); K04083 HSP33 engineered systems engineered systems heat tolerance -K03695 rho:RHOM_03585 heat shock protein ClpB-like protein; K03695 AAA_2 AAA_lid_9 AAA ClpB_D2-small Clp_N AAA_5 AAA_16 Sigma54_activat AAA_22 IstB_IS21 ATPase_2 TniB AAA_7 AAA_18 AAA_14 Mg_chelatase RNA_helicase RuvB_N NACHT DUF815 AAA_3 Zeta_toxin AAA_33 Roc DNA_pol3_delta2 AAA_19 Torsin AAA_23 Spc7 DUF87 Cob_adeno_trans Atg14 ABC_tran engineered systems engineered systems heat tolerance -K06335 sbu:SpiBuddy_2148 heat shock protein Hsp20; K06335 HSP20 ArsA_HSP20 Frataxin_Cyay engineered systems engineered systems heat tolerance -K04078 mthr:MSTHT_2204 Heat shock protein 60 family co-chaperone GroES; K04078 Cpn10 NTPase_1 engineered systems engineered systems heat tolerance -K05516 aeh:Mlg_2130 heat shock protein DnaJ domain protein; K05516 DnaJ_C DnaJ Metal_resist engineered systems engineered systems heat tolerance -K04080 salg:BS332_16600 heat-shock protein; K04080 HSP20 ArsA_HSP20 engineered systems engineered systems heat tolerance -K04077 smul:SMUL_0986 groL; heat shock protein 60 family chaperone GroEL; K04077 Cpn60_TCP1 Cas_APE2256 engineered systems engineered systems heat tolerance -K04043 DnaK; molecular chaperone engineered systems engineered systems heat tolerance +K04455 HSPB1; heat shock protein family B (small) member 1 engineered systems engineered systems heat tolerance +K03667 "ttm:Tthe_1460 heat shock protein HslVU ATPase subunit HslU; K03667 AAA_2 AAA ClpB_D2-small AAA_5 AAA_22 AAA_16 Mg_chelatase Sigma54_activat MCM AAA_18 RuvB_N ABC_tran NTPase_1 TniB AAA_28 AAA_33 Zeta_toxin AAA_7 IstB_IS21 TIP49 TsaE FAS_meander AAA_19 DEAD" engineered systems engineered systems heat tolerance +K13993 ttm:Tthe_0173 heat shock protein Hsp20; K13993 HSP20 ArsA_HSP20 CS engineered systems engineered systems heat tolerance +K03686 blq:L21SP5_01031 dnaJ; Heat shock protein J; K03686 DnaJ_C DnaJ DnaJ_CXXCXGXG Anti-TRAP engineered systems engineered systems heat tolerance +K04762 pet:PEIBARAKI_4309 heat shock protein 15; K04762 S4 engineered systems engineered systems heat tolerance +K05801 tli:Tlie_1612 heat shock protein DnaJ domain protein; K05801 DnaJ 3HBOH engineered systems engineered systems heat tolerance +K03799 "mem:Memar_2252 Heat shock protein Metallo peptidase MEROPS family M48B; K03799 Peptidase_M48 Peptidase_M56 Peptidase_U49 SprT-like DUF2268 Pex24p" engineered systems engineered systems heat tolerance +K03705 tte:TTE0953 HrcA; Transcriptional regulator of heat shock gene; K03705 HrcA HrcA_DNA-bdg HTH_11 HTH_DeoR engineered systems engineered systems heat tolerance +K03687 tte:TTE0954 GrpE; Molecular chaperone GrpE (heat shock protein); K03687 GrpE Herpes_UL6 GldM_N Complex1_LYR Trans_reg_C DUF573 KxDL Atg14 DUF87 engineered systems engineered systems heat tolerance +K13640 cha:CHAB381_0975 putative heat shock protein HspR; K13640 MerR_1 MerR_2 MerR HTH_17 HTH_3 PKcGMP_CC TolA_bind_tri HTH_23 engineered systems engineered systems heat tolerance +K01419 "hor:Hore_07560 heat shock protein HslVU ATP dependent protease HslV; K01419 Proteasome" engineered systems engineered systems heat tolerance +K07721 "tko:TK2291 archaeal heat shock regulator ArsR family; K07721 HTH_5 HTH_20 ArsR HTH_24 PadR TrmB MarR_2 HTH_CodY HTH_11 PSY3 MscS_porin GntR DprA_WH HTH_10 LexA_DNA_bind HxlR IF2_N DUF4795 DUF2205" engineered systems engineered systems heat tolerance +K19411 "min:Minf_0201 mcsA; Modulator of heat shock repressor CtsR McsA; K19411 UVR TackOD1 XFP A2L_zn_ribbon HypA" engineered systems engineered systems heat tolerance +K22447 thv:ADU37_CDS16120 Heat shock protein 60 family chaperone GroEL / Thermosome subunit; K22447 Cpn60_TCP1 AAA_5 engineered systems engineered systems heat tolerance +K04079 csh:Closa_3215 Heat shock protein Hsp90-like protein; K04079 HSP90 HATPase_c_3 HATPase_c engineered systems engineered systems heat tolerance +K04083 cst:CLOST_0638 hslO; disulfide bond chaperone (heat shock protein HSP33); K04083 HSP33 engineered systems engineered systems heat tolerance +K03695 rho:RHOM_03585 heat shock protein ClpB-like protein; K03695 AAA_2 AAA_lid_9 AAA ClpB_D2-small Clp_N AAA_5 AAA_16 Sigma54_activat AAA_22 IstB_IS21 ATPase_2 TniB AAA_7 AAA_18 AAA_14 Mg_chelatase RNA_helicase RuvB_N NACHT DUF815 AAA_3 Zeta_toxin AAA_33 Roc DNA_pol3_delta2 AAA_19 Torsin AAA_23 Spc7 DUF87 Cob_adeno_trans Atg14 ABC_tran engineered systems engineered systems heat tolerance +K06335 sbu:SpiBuddy_2148 heat shock protein Hsp20; K06335 HSP20 ArsA_HSP20 Frataxin_Cyay engineered systems engineered systems heat tolerance +K04078 mthr:MSTHT_2204 Heat shock protein 60 family co-chaperone GroES; K04078 Cpn10 NTPase_1 engineered systems engineered systems heat tolerance +K05516 aeh:Mlg_2130 heat shock protein DnaJ domain protein; K05516 DnaJ_C DnaJ Metal_resist engineered systems engineered systems heat tolerance +K04080 salg:BS332_16600 heat-shock protein; K04080 HSP20 ArsA_HSP20 engineered systems engineered systems heat tolerance +K04077 smul:SMUL_0986 groL; heat shock protein 60 family chaperone GroEL; K04077 Cpn60_TCP1 Cas_APE2256 engineered systems engineered systems heat tolerance +K04043 DnaK; molecular chaperone engineered systems engineered systems heat tolerance K00625 phosphate acetyltransferase [EC:2.3.1.8] [RN:R00230] engineered systems engineered systems organic acids potential acetate production K13788 phosphate acetyltransferase [EC:2.3.1.8] [RN:R00230] engineered systems engineered systems organic acids potential acetate production K15024 phosphate acetyltransferase [EC:2.3.1.8] [RN:R00230] engineered systems engineered systems organic acids potential acetate production @@ -225,23 +225,23 @@ CmdA HMM; cmdA; p-cymene dehydrogenase engineered systems engineered systems "CA EbdA HMM; ebdA; Ethylbenzene dehydrogenase engineered systems engineered systems "CANT-HYD hydrocarbon degradation" "aromatic anaerobic" K27540 HMM; K27540; Naphthalene carboxylase engineered systems engineered systems "CANT-HYD hydrocarbon degradation" "aromatic anaerobic" NmsA HMM; nmsA; Naphthyl 2-methylsuccinate synthase engineered systems engineered systems "CANT-HYD hydrocarbon degradation" "aromatic anaerobic" -APS-reductase_C HMM; adenylylsulfate reductase C engineered systems engineered systems sulfur -ATP-sulfurylase HMM; sulfate adenylyltransferase engineered systems engineered systems sulfur -DoxA HMM; doxA; thiosulfate dehydrogenase (quinone) small subunit engineered systems engineered systems sulfur -DoxD HMM; doxD; thiosulfate dehydrogenase (quinone) large subunit engineered systems engineered systems sulfur -DoxX HMM; doxX engineered systems engineered systems sulfur -DsrD "HMM; dsrD; sulfite reductase D dissimilatory-type" engineered systems engineered systems sulfur -FCSD-flav_bind "HMM; flavocytochrome c sulfide dehydrogenase flavin-binding protein sulfide dehydrogenase" engineered systems engineered systems sulfur -NIR_SIR HMM; nir_sir engineered systems engineered systems sulfur -Rhodanese HMM; rhodanase engineered systems engineered systems sulfur -SOR HMM; SOR; sulphur oxygenase/reductase (elemental sulfur to sulfide & sulfate) engineered systems engineered systems sulfur -SoxY HMM; soxY; sulfur-oxidizing protein SoxY engineered systems engineered systems sulfur -SoxZ HMM; soxZ; sulfur-oxidizing protein SoxZ engineered systems engineered systems sulfur -sqr_alignment HMM; sqr; sulfide-quinone reductase engineered systems engineered systems sulfur -sulfur_dioxygenase_sdo_alignment HMM; dso; sulfur dioxgenase engineered systems engineered systems sulfur -thiosulfate_reductase_phsA_alignment HMM; phsA; thiosulfate reductase / polysulfide reductase chain A engineered systems engineered systems sulfur -dsrA "HMM; dsrA; sulfite reductase A dissimilatory-type" engineered systems engineered systems sulfur -dsrB "HMM; dsrB; sulfite reductase B dissimilatory-type " engineered systems engineered systems sulfur +APS-reductase_C HMM; adenylylsulfate reductase C engineered systems engineered systems sulfur +ATP-sulfurylase HMM; sulfate adenylyltransferase engineered systems engineered systems sulfur +DoxA HMM; doxA; thiosulfate dehydrogenase (quinone) small subunit engineered systems engineered systems sulfur +DoxD HMM; doxD; thiosulfate dehydrogenase (quinone) large subunit engineered systems engineered systems sulfur +DoxX HMM; doxX engineered systems engineered systems sulfur +DsrD "HMM; dsrD; sulfite reductase D dissimilatory-type" engineered systems engineered systems sulfur +FCSD-flav_bind "HMM; flavocytochrome c sulfide dehydrogenase flavin-binding protein sulfide dehydrogenase" engineered systems engineered systems sulfur +NIR_SIR HMM; nir_sir engineered systems engineered systems sulfur +Rhodanese HMM; rhodanase engineered systems engineered systems sulfur +SOR HMM; SOR; sulphur oxygenase/reductase (elemental sulfur to sulfide & sulfate) engineered systems engineered systems sulfur +SoxY HMM; soxY; sulfur-oxidizing protein SoxY engineered systems engineered systems sulfur +SoxZ HMM; soxZ; sulfur-oxidizing protein SoxZ engineered systems engineered systems sulfur +sqr_alignment HMM; sqr; sulfide-quinone reductase engineered systems engineered systems sulfur +sulfur_dioxygenase_sdo_alignment HMM; dso; sulfur dioxgenase engineered systems engineered systems sulfur +thiosulfate_reductase_phsA_alignment HMM; phsA; thiosulfate reductase / polysulfide reductase chain A engineered systems engineered systems sulfur +dsrA "HMM; dsrA; sulfite reductase A dissimilatory-type" engineered systems engineered systems sulfur +dsrB "HMM; dsrB; sulfite reductase B dissimilatory-type " engineered systems engineered systems sulfur K00394 adenylylsulfate reductase [EC:1.8.99.2] [RN:R08553] engineered systems engineered systems sulfur sulfate => H2S K00395 adenylylsulfate reductase [EC:1.8.99.2] [RN:R08553] engineered systems engineered systems sulfur sulfate => H2S K00956 sulfate adenylyltransferase [EC:2.7.7.4] [RN:R00529] engineered systems engineered systems sulfur sulfate => H2S diff --git a/bin/assets/forms/distill_sheets/distill_metals.tsv b/bin/assets/forms/distill_sheets/distill_metals.tsv old mode 100755 new mode 100644 index 1c630af7..e8d45ea3 --- a/bin/assets/forms/distill_sheets/distill_metals.tsv +++ b/bin/assets/forms/distill_sheets/distill_metals.tsv @@ -1,167 +1,167 @@ gene_id rule gene_description pathway topic_ecosystem category subcategory note reference -arsD arsD "arsD, Arsenic metallochaperone for efflux pump" metals Stressors Heavy Metals arsenic -arsM arsM|K07755 "arsM, arsenite methyltransferase" metals Stressors Heavy Metals arsenic -aioA-aoxB aioA-aoxB|K08356 "aioA-aoxB, arsenite oxidase large subunit" metals Stressors Heavy Metals arsenic -aioB-aoxA aioB-aoxA|K08355 "aioB-aoxA, arsenite oxidase small subunit" metals Stressors Heavy Metals arsenic -arsC|K00537 arsC|K00537 "arsC, arsenate reductase (glutaredoxin)" metals Stressors Heavy Metals arsenic -arsC|K03741 arsC|K03741 "arsC, arsenate reductase (thioredoxin)" metals Stressors Heavy Metals arsenic -arsH arsH|K11811 "arsH, arsenical resistance protein ArsH" metals Stressors Heavy Metals arsenic -aioR-aoxR aioR-aoxR "aioR-aoxR, Transcriptional activator protein; two-component system" metals Stressors Heavy Metals arsenic -aioS-aoxS aioS-aoxS "aioS-aoxS, Sensor protein; two-component system" metals Stressors Heavy Metals arsenic -arsR arsR|K03892 "arsR, arsenate/arsenite/antimonite-responsive transcriptional repressor" metals Stressors Heavy Metals arsenic -acr3 acr3|K03325 "acr3, arsenite transporter" metals Stressors Heavy Metals arsenic -arsA arsA|K01551 "arsA, arsenite/tail-anchored protein-transporting ATPase" metals Stressors Heavy Metals arsenic -arsB arsB|K03893 "arsB, arsenical pump membrane protein" metals Stressors Heavy Metals arsenic -cadC cadC|K03765 "cadC, transcriptional activator of cad operon" metals Stressors Heavy Metals cadmium -cadR cadR "cadR, Transcriptional regulator for cadmium resistance" metals Stressors Heavy Metals cadmium -cadX cadX|K21903 "cadX, lead/cadmium/zinc/bismuth-responsive transcriptional repressor" metals Stressors Heavy Metals cadmium -cmtR cmtR|K21885 "cmtR, cadmium/lead-responsive transcriptional repressor" metals Stressors Heavy Metals cadmium -cusR-ylcA cusR-ylcA|K07665 "cusR-ylcA, opper resistance phosphate regulon response regulator CusR" metals Stressors Heavy Metals cadmium -cusS cusS|K07644 "cusS, heavy metal sensor histidine kinase CusS" metals Stressors Heavy Metals cadmium -czcR czcR|K02483 "czcR, two-component system, OmpR family, response regulator" metals Stressors Heavy Metals cadmium -czrA czrA|K22043 "czrA, zinc-responsive transcriptional repressor" metals Stressors Heavy Metals cadmium -K03088 K03088 "RNA polymerase sigma-70 factor, ECF subfamily" metals Stressors Heavy Metals cadmium -K24079 K24079 nickel and cobalt resistance protein CnrY metals Stressors Heavy Metals cadmium -K24078 K24078 nickel and cobalt resistance protein CnrR metals Stressors Heavy Metals cadmium -cadD cadD "cadD, Cadmium resistance permease" metals Stressors Heavy Metals cadmium -czcA czcA|K15726 "czcA, heavy metal efflux system protein" metals Stressors Heavy Metals cadmium -czcB czcB|K15727 "czcB, membrane fusion protein, heavy metal efflux system" metals Stressors Heavy Metals cadmium -czcC czcC|K15725 "czcC, outer membrane protein, heavy metal efflux system" metals Stressors Heavy Metals cadmium -cznB cznB "cznB, Cadmium-zinc-nickel efflux; transporter" metals Stressors Heavy Metals cadmium -czrB czrB|K21133 "czrB, multidrug efflux pump" metals Stressors Heavy Metals cadmium -dmeF dmeF "dmeF, Broad range metal ion transporter" metals Stressors Heavy Metals cadmium -rcnA-yohM rcnA-yohM|K08970 "rcnA-yohM, nickel/cobalt transporter (NicO) family protein" metals Stressors Heavy Metals cadmium -zitB-ybgR zitB-ybgR|K16264 "zitB-ybgR, cobalt-zinc-cadmium efflux system protein" metals Stressors Heavy Metals cadmium -zntA-yhhO zntA-yhhO|K01534 "zntA-yhhO, Zn2+/Cd2+-exporting ATPase" metals Stressors Heavy Metals cadmium -ncrB ncrB "ncrB, Ni-Co efflux; regulator" metals Stressors Heavy Metals cobalt -ncrY ncrY "ncrY, Ni-Co efflux; regulator" metals Stressors Heavy Metals cobalt -rcnR-yohL rcnR-yohL|K23240 "rcnR-yohL, FrmR/RcnR family transcriptional regulator, repressor of rcnA expression" metals Stressors Heavy Metals cobalt -K24073 K24073 RNA polymerase sigma factor CnrH metals Stressors Heavy Metals cobalt -K06042 K06042 precorrin-8X/cobalt-precorrin-8 methylmutase metals Stressors Heavy Metals cobalt -cmeA cmeA|K03585 "cmeA, membrane fusion protein, multidrug efflux system" metals Stressors Heavy Metals cobalt -cmeB cmeB|K18138 "cmeB, multidrug efflux pump" metals Stressors Heavy Metals cobalt -cmeC cmeC|K18139 "cmeC, outer membrane protein, multidrug efflux system" metals Stressors Heavy Metals cobalt -cnrT cnrT "cnrT, Ni-Co efflux system; cation diffusion facilitator" metals Stressors Heavy Metals cobalt -corA corA|K03284 "corA, magnesium transporter" metals Stressors Heavy Metals cobalt -corB corB "corB, Magnesium-transporting ATPase" metals Stressors Heavy Metals cobalt -corC corC|K06189 "corC, hemolysin (HlyC) family protein" metals Stressors Heavy Metals cobalt -ctpD ctpD|K12951 "ctpD, cobalt/nickel-transporting P-type ATPase D" metals Stressors Heavy Metals cobalt -dmeR dmeR "dmeR, Co-Ni dmeRF efflux system" metals Stressors Heavy Metals cobalt -nrsD-nreB nrsD-nreB|K07785 "nrsD-nreB, MFS transporter, NRE family, putaive nickel resistance protein" metals Stressors Heavy Metals cobalt -rcnB-yohN rcnB-yohN|K23243 "rcnB-yohN, nickel/cobalt homeostasis protein" metals Stressors Heavy Metals cobalt -copC copC|K07156 "copC, copper resistance protein C" metals Stressors Heavy Metals copper -cutA cutA|K03926 "cutA, periplasmic divalent cation tolerance protein" metals Stressors Heavy Metals copper -cutC cutC|K06201 "cutC, copper homeostasis protein" metals Stressors Heavy Metals copper -mymT mymT|K21609 "mymT, Cu-binding metallothionein" metals Stressors Heavy Metals copper -pcoB pcoB|K07233 "pcoB, copper resistance protein B" metals Stressors Heavy Metals copper -pcoE pcoE "pcoE, Copper binding protein; downstream from regulatory genes" metals Stressors Heavy Metals copper -copZ copZ|K07213 "copZ, copper chaperone" metals Stressors Heavy Metals copper -K09796 K09796 periplasmic copper chaperone A metals Stressors Heavy Metals copper -K19342 K19342 copper chaperone NosL metals Stressors Heavy Metals copper -cinA cinA "cinA, Copper-binding azurin-like protein" metals Stressors Heavy Metals copper -cueO cueO|K14588 "cueO, cuproxidase" metals Stressors Heavy Metals copper -cutO cutO "cutO, Multicopper oxidase" metals Stressors Heavy Metals copper -mco mco|K22552 "mco, multicopper oxidase" metals Stressors Heavy Metals copper -copL copL "copL, Copper binding protein; higher affinity for Cu(I)" metals Stressors Heavy Metals copper -copY-tcrY copY-tcrY "copY-tcrY, Upstream repressor of CopA/CopB" metals Stressors Heavy Metals copper -corR corR "corR, Transcriptional regulator protein; two component system; cuoABC and copAB" metals Stressors Heavy Metals copper -crdR crdR|K02483 "crdR, two-component system, OmpR family, response regulator" metals Stressors Heavy Metals copper -csoR csoR|K21600 "csoR, CsoR family transcriptional regulator, copper-sensing transcriptional repressor" metals Stressors Heavy Metals copper -cueR-ybbI cueR-ybbI|K11923 "cueR-ybbI, copper efflux regulator" metals Stressors Heavy Metals copper -cusR-ylcA cusR-ylcA|K07665 "cusR-ylcA, copper resistance phosphate regulon response regulator CusR" metals Stressors Heavy Metals copper -hmrR hmrR|K19591 "hmrR, copper efflux regulator" metals Stressors Heavy Metals copper -ycnK ycnK|K21601 "ycnK, copper-sensing transcriptional repressor" metals Stressors Heavy Metals copper -yfmP yfmP|K21902 "yfmP, MerR family transcriptional regulator, repressor of the yfmOP operon" metals Stressors Heavy Metals copper -K18992 K18992 "TetR/AcrR family transcriptional regulator, cmeABC operon repressor" metals Stressors Heavy Metals copper -acrD acrD|K18324 "acrD, multidrug efflux pump" metals Stressors Heavy Metals copper -copA copA|K17686 "copA, P-type Cu+ transporter" metals Stressors Heavy Metals copper -copB copB|K01533 "copB, P-type Cu2+ transporter" metals Stressors Heavy Metals copper -copD copD|K07245 "copD, copper resistance protein D" metals Stressors Heavy Metals copper -copP copP "copP, Copper binding protein; part of cation transport system" metals Stressors Heavy Metals copper -crdA crdA "crdA, Copper resistance determinant" metals Stressors Heavy Metals copper -ctpG ctpG|K12954 "ctpG, cation-transporting P-type ATPase G" metals Stressors Heavy Metals copper -ctpV ctpV|K12956 "ctpV, copper-transporting P-type ATPase V" metals Stressors Heavy Metals copper -cusA-ybdE cusA-ybdE|K07787 "cusA-ybdE, copper/silver efflux system protein" metals Stressors Heavy Metals copper -cusB cusB|K07798 "cusB, membrane fusion protein, copper/silver efflux system" metals Stressors Heavy Metals copper -cusC-ylcB cusC-ylcB|K07796 "cusC-ylcB, outer membrane protein, copper/silver efflux system" metals Stressors Heavy Metals copper -cusF-cusX cusF-cusX|K07810 "cusF-cusX, Cu(I)/Ag(I) efflux system periplasmic protein CusF" metals Stressors Heavy Metals copper -cutE-lnt cutE-lnt|K03820 "cutE-lnt, apolipoprotein N-acyltransferase" metals Stressors Heavy Metals copper -cutF-nlpE cutF-nlpE|K06079 "cutF-nlpE, copper homeostasis protein (lipoprotein)" metals Stressors Heavy Metals copper -hpcopA hpcopA "hpcopA, Copper transport ATPase" metals Stressors Heavy Metals copper -mctB mctB "mctB, Pore-forming protein; copper efflux" metals Stressors Heavy Metals copper -ycnJ ycnJ|K14166 "ycnJ, copper transport protein" metals Stressors Heavy Metals copper -yfmO yfmO|K08221 "yfmO, MFS transporter, ACDE family, multidrug resistance protein" metals Stressors Heavy Metals copper -bfrA bfrA|K03594 "bfrA, bacterioferritin" metals Stressors Heavy Metals iron -dpr-dps dpr-dps "dpr-dps, Sequesters Fe(II), binds and oxidizes to Fe(III) " metals Stressors Heavy Metals iron -dpsA dpsA "dpsA, Stress response, iron-binding protein" metals Stressors Heavy Metals iron -pfr pfr|K02217 "pfr, ferritin" metals Stressors Heavy Metals iron -yqjH yqjH|K07229 "yqjH, ferric-chelate reductase (NADPH)" metals Stressors Heavy Metals iron -ideR ideR|K03709 "ideR, Mn-dependent transcriptional regulator" metals Stressors Heavy Metals iron -pmrA pmrA "pmrA, Transcriptional regulator protein; two component system" metals Stressors Heavy Metals iron -pmrB pmrB "pmrB, Sensor protein; two component system" metals Stressors Heavy Metals iron -fbpA fbpA|K02012 "fbpA, iron(III) transport system substrate-binding protein" metals Stressors Heavy Metals iron -fbpB fbpB|K02011 "fbpB, iron(III) transport system permease protein" metals Stressors Heavy Metals iron -fbpC fbpC|K02010 "fbpC, iron(III) transport system ATP-binding protein" metals Stressors Heavy Metals iron -fieF-yiip fieF-yiip|K13283 "fieF-yiip, ferrous-iron efflux pump FieF" metals Stressors Heavy Metals iron -fptA fptA|K16088 "fptA, outer-membrane receptor for ferric coprogen and ferric-rhodotorulic acid" metals Stressors Heavy Metals iron -mntH-yfeB mntH-yfeB|K03322 "mntH-yfeB, manganese transport protein" metals Stressors Heavy Metals iron -nia nia|K01552 "nia, energy-coupling factor transport system ATP-binding protein" metals Stressors Heavy Metals iron -pmrC pmrC "pmrC, Membrane protein" metals Stressors Heavy Metals iron -ybtP ybtP|K06147 "ybtP, ATP-binding cassette, subfamily B, bacterial" metals Stressors Heavy Metals iron -ybtQ ybtQ|K06147 "ybtQ, ATP-binding cassette, subfamily B, bacterial" metals Stressors Heavy Metals iron -yfeA yfeA|K11604 "yfeA, manganese/iron transport system substrate-binding protein" metals Stressors Heavy Metals iron -yfeB yfeB|K11607 "yfeB, manganese/iron transport system ATP-binding protein" metals Stressors Heavy Metals iron -yfeC yfeC|K11605 "yfeC, manganese/iron transport system permease protein" metals Stressors Heavy Metals iron -yfeD yfeD|K11606 "yfeD, manganese/iron transport system permease protein" metals Stressors Heavy Metals iron -K07224 K07224 iron uptake system component EfeO metals Stressors Heavy Metals iron -pbrR pbrR "pbrR, Transcription factor, regulator" metals Stressors Heavy Metals lead -pbrT pbrT "pbrT, Pb(II) uptake protein; membrane transporter" metals Stressors Heavy Metals lead -K03101 K03101 signal peptidase II metals Stressors Heavy Metals lead -mgtA mgtA|K01531 "mgtA, P-type Mg2+ transporter" metals Stressors Heavy Metals magnesium -K06213 K06213 magnesium transporter metals Stressors Heavy Metals magnesium -mntR mntR|K11924 "mntR, manganese transport regulator" metals Stressors Heavy Metals manganese -ctpC ctpC|K12950 "ctpC, manganese-transporting P-type ATPase C" metals Stressors Heavy Metals manganese -mntA-ytgA mntA-ytgA|K11707 "mntA-ytgA, manganese/zinc/iron transport system substrate-binding protein" metals Stressors Heavy Metals manganese -mntP-yebN mntP-yebN|K23242 "mntP-yebN, manganese efflux pump family protein" metals Stressors Heavy Metals manganese -merB merB|K00221 "merB, alkylmercury lyase" metals Stressors Heavy Metals mercury -merA merA|K00520 "merA, mercuric reductase" metals Stressors Heavy Metals mercury -merD merD|K19057 "merD, mercuric resistance operon regulatory protein" metals Stressors Heavy Metals mercury -merR merR|K08365 "merR, mercuric resistance operon regulatory protein" metals Stressors Heavy Metals mercury -merC merC|K19058 "merC, mercuric ion transport protein" metals Stressors Heavy Metals mercury -merE merE|K19059 "merE, mercuric ion transport protein" metals Stressors Heavy Metals mercury -merF merF|K19058 "merF, mercuric ion transport protein" metals Stressors Heavy Metals mercury -merP merP|K08364 "merP, periplasmic mercuric ion binding protein" metals Stressors Heavy Metals mercury -merT merT|K08363 "merT, mercuric ion transport protein" metals Stressors Heavy Metals mercury -nikR nikR|K07722 "nikR, CopG family transcriptional regulator, nickel-responsive regulator" metals Stressors Heavy Metals nickel -nrsS nrsS|K11328 "nrsS, Ni(II)-sensor and/or redox sensor kinase NrsS" metals Stressors Heavy Metals nickel -K11330 K11330 Ni(II)-responsive and/or redox-responsive regulator NrsR metals Stressors Heavy Metals nickel -hupE hupE "hupE, Nickel transporter; metal permease" metals Stressors Heavy Metals nickel -nikA nikA|K15584 "nikA, nickel transport system substrate-binding protein" metals Stressors Heavy Metals nickel -nikB nikB|K15585 "nikB, nickel transport system permease protein" metals Stressors Heavy Metals nickel -nikC nikC|K15586 "nikC, nickel transport system permease protein" metals Stressors Heavy Metals nickel -nikD nikD|K15587 "nikD, nickel transport system ATP-binding protein" metals Stressors Heavy Metals nickel -nikE nikE|K10824 "nikE, nickel transport system ATP-binding protein" metals Stressors Heavy Metals nickel -nixA nixA|K07241 "nixA, nickel/cobalt transporter (NiCoT) family protein" metals Stressors Heavy Metals nickel -nrsA nrsA|K11326 "nrsA, cation efflux system protein involved in nickel and cobalt tolerance" metals Stressors Heavy Metals nickel -silF silF "silF, Silver cation efflux system; chaperone" metals Stressors Heavy Metals silver -silE silE "silE, Silver cation efflux system; binding protein" metals Stressors Heavy Metals silver -silP silP|K23254 "silP, P-type Ag+ transporter" metals Stressors Heavy Metals silver -smtA smtA|K21904 "smtA, Zinc binding metallothionein" metals Stressors Heavy Metals zinc -zevA zevA "zevA, Zinc binding protein" metals Stressors Heavy Metals zinc -zraP zraP|K07803 "zraP, zinc resistance-associated protein" metals Stressors Heavy Metals zinc -zinT-yodA zinT-yodA "zinT-yodA, Periplasmic zinc (and cadmium) binding protein" metals Stressors Heavy Metals zinc -zntR-yhdM zntR-yhdM|K13638 "zntR-yhdM, Zn(II)-responsive regulator of zntA" metals Stressors Heavy Metals zinc -zraR-hydH zraR-hydH|K07713 "zraR-hydH, two-component system, NtrC family, response regulator HydG" metals Stressors Heavy Metals zinc -zraS-hydG zraS-hydG|K07709 "zraS-hydG, two-component system, NtrC family, sensor histidine kinase HydH" metals Stressors Heavy Metals zinc -zur-yjbK zur-yjbK|K09823 "zur-yjbK, Fur family transcriptional regulator, zinc uptake regulator" metals Stressors Heavy Metals zinc -K03709 K03709 Mn-dependent transcriptional regulator metals Stressors Heavy Metals zinc -mdtA mdtA|K07799 "mdtA, membrane fusion protein, multidrug efflux system" metals Stressors Heavy Metals zinc -mdtB mdtB|K07788 "mdtB, multidrug efflux pump" metals Stressors Heavy Metals zinc -mdtC mdtC|K07789 "mdtC, multidrug efflux pump" metals Stressors Heavy Metals zinc -troB troB|K11710 "troB, manganese/zinc/iron transport system ATP- binding protein" metals Stressors Heavy Metals zinc -zipB zipB|K07238 "zipB, zinc transporter, ZIP family" metals Stressors Heavy Metals zinc -znuA-yebL znuA-yebL|K09815 "znuA-yebL, zinc transport system substrate-binding protein" metals Stressors Heavy Metals zinc -znuB-yebI znuB-yebI|K09816 "znuB-yebI, zinc transport system permease protein" metals Stressors Heavy Metals zinc -znuC-yebM znuC-yebM|K09817 "znuC-yebM, zinc transport system ATP-binding protein" metals Stressors Heavy Metals zinc -K11708 K11708 manganese/zinc/iron transport system permease protein metals Stressors Heavy Metals zinc -K11709 K11709 manganese/zinc/iron transport system permease protein metals Stressors Heavy Metals zinc \ No newline at end of file +arsD arsD "arsD, Arsenic metallochaperone for efflux pump" metals Stressors Heavy Metals arsenic +arsM arsM|K07755 "arsM, arsenite methyltransferase" metals Stressors Heavy Metals arsenic +aioA-aoxB aioA-aoxB|K08356 "aioA-aoxB, arsenite oxidase large subunit" metals Stressors Heavy Metals arsenic +aioB-aoxA aioB-aoxA|K08355 "aioB-aoxA, arsenite oxidase small subunit" metals Stressors Heavy Metals arsenic +arsC|K00537 arsC|K00537 "arsC, arsenate reductase (glutaredoxin)" metals Stressors Heavy Metals arsenic +arsC|K03741 arsC|K03741 "arsC, arsenate reductase (thioredoxin)" metals Stressors Heavy Metals arsenic +arsH arsH|K11811 "arsH, arsenical resistance protein ArsH" metals Stressors Heavy Metals arsenic +aioR-aoxR aioR-aoxR "aioR-aoxR, Transcriptional activator protein; two-component system" metals Stressors Heavy Metals arsenic +aioS-aoxS aioS-aoxS "aioS-aoxS, Sensor protein; two-component system" metals Stressors Heavy Metals arsenic +arsR arsR|K03892 "arsR, arsenate/arsenite/antimonite-responsive transcriptional repressor" metals Stressors Heavy Metals arsenic +acr3 acr3|K03325 "acr3, arsenite transporter" metals Stressors Heavy Metals arsenic +arsA arsA|K01551 "arsA, arsenite/tail-anchored protein-transporting ATPase" metals Stressors Heavy Metals arsenic +arsB arsB|K03893 "arsB, arsenical pump membrane protein" metals Stressors Heavy Metals arsenic +cadC cadC|K03765 "cadC, transcriptional activator of cad operon" metals Stressors Heavy Metals cadmium +cadR cadR "cadR, Transcriptional regulator for cadmium resistance" metals Stressors Heavy Metals cadmium +cadX cadX|K21903 "cadX, lead/cadmium/zinc/bismuth-responsive transcriptional repressor" metals Stressors Heavy Metals cadmium +cmtR cmtR|K21885 "cmtR, cadmium/lead-responsive transcriptional repressor" metals Stressors Heavy Metals cadmium +cusR-ylcA cusR-ylcA|K07665 "cusR-ylcA, opper resistance phosphate regulon response regulator CusR" metals Stressors Heavy Metals cadmium +cusS cusS|K07644 "cusS, heavy metal sensor histidine kinase CusS" metals Stressors Heavy Metals cadmium +czcR czcR|K02483 "czcR, two-component system, OmpR family, response regulator" metals Stressors Heavy Metals cadmium +czrA czrA|K22043 "czrA, zinc-responsive transcriptional repressor" metals Stressors Heavy Metals cadmium +K03088 K03088 "RNA polymerase sigma-70 factor, ECF subfamily" metals Stressors Heavy Metals cadmium +K24079 K24079 nickel and cobalt resistance protein CnrY metals Stressors Heavy Metals cadmium +K24078 K24078 nickel and cobalt resistance protein CnrR metals Stressors Heavy Metals cadmium +cadD cadD "cadD, Cadmium resistance permease" metals Stressors Heavy Metals cadmium +czcA czcA|K15726 "czcA, heavy metal efflux system protein" metals Stressors Heavy Metals cadmium +czcB czcB|K15727 "czcB, membrane fusion protein, heavy metal efflux system" metals Stressors Heavy Metals cadmium +czcC czcC|K15725 "czcC, outer membrane protein, heavy metal efflux system" metals Stressors Heavy Metals cadmium +cznB cznB "cznB, Cadmium-zinc-nickel efflux; transporter" metals Stressors Heavy Metals cadmium +czrB czrB|K21133 "czrB, multidrug efflux pump" metals Stressors Heavy Metals cadmium +dmeF dmeF "dmeF, Broad range metal ion transporter" metals Stressors Heavy Metals cadmium +rcnA-yohM rcnA-yohM|K08970 "rcnA-yohM, nickel/cobalt transporter (NicO) family protein" metals Stressors Heavy Metals cadmium +zitB-ybgR zitB-ybgR|K16264 "zitB-ybgR, cobalt-zinc-cadmium efflux system protein" metals Stressors Heavy Metals cadmium +zntA-yhhO zntA-yhhO|K01534 "zntA-yhhO, Zn2+/Cd2+-exporting ATPase" metals Stressors Heavy Metals cadmium +ncrB ncrB "ncrB, Ni-Co efflux; regulator" metals Stressors Heavy Metals cobalt +ncrY ncrY "ncrY, Ni-Co efflux; regulator" metals Stressors Heavy Metals cobalt +rcnR-yohL rcnR-yohL|K23240 "rcnR-yohL, FrmR/RcnR family transcriptional regulator, repressor of rcnA expression" metals Stressors Heavy Metals cobalt +K24073 K24073 RNA polymerase sigma factor CnrH metals Stressors Heavy Metals cobalt +K06042 K06042 precorrin-8X/cobalt-precorrin-8 methylmutase metals Stressors Heavy Metals cobalt +cmeA cmeA|K03585 "cmeA, membrane fusion protein, multidrug efflux system" metals Stressors Heavy Metals cobalt +cmeB cmeB|K18138 "cmeB, multidrug efflux pump" metals Stressors Heavy Metals cobalt +cmeC cmeC|K18139 "cmeC, outer membrane protein, multidrug efflux system" metals Stressors Heavy Metals cobalt +cnrT cnrT "cnrT, Ni-Co efflux system; cation diffusion facilitator" metals Stressors Heavy Metals cobalt +corA corA|K03284 "corA, magnesium transporter" metals Stressors Heavy Metals cobalt +corB corB "corB, Magnesium-transporting ATPase" metals Stressors Heavy Metals cobalt +corC corC|K06189 "corC, hemolysin (HlyC) family protein" metals Stressors Heavy Metals cobalt +ctpD ctpD|K12951 "ctpD, cobalt/nickel-transporting P-type ATPase D" metals Stressors Heavy Metals cobalt +dmeR dmeR "dmeR, Co-Ni dmeRF efflux system" metals Stressors Heavy Metals cobalt +nrsD-nreB nrsD-nreB|K07785 "nrsD-nreB, MFS transporter, NRE family, putaive nickel resistance protein" metals Stressors Heavy Metals cobalt +rcnB-yohN rcnB-yohN|K23243 "rcnB-yohN, nickel/cobalt homeostasis protein" metals Stressors Heavy Metals cobalt +copC copC|K07156 "copC, copper resistance protein C" metals Stressors Heavy Metals copper +cutA cutA|K03926 "cutA, periplasmic divalent cation tolerance protein" metals Stressors Heavy Metals copper +cutC cutC|K06201 "cutC, copper homeostasis protein" metals Stressors Heavy Metals copper +mymT mymT|K21609 "mymT, Cu-binding metallothionein" metals Stressors Heavy Metals copper +pcoB pcoB|K07233 "pcoB, copper resistance protein B" metals Stressors Heavy Metals copper +pcoE pcoE "pcoE, Copper binding protein; downstream from regulatory genes" metals Stressors Heavy Metals copper +copZ copZ|K07213 "copZ, copper chaperone" metals Stressors Heavy Metals copper +K09796 K09796 periplasmic copper chaperone A metals Stressors Heavy Metals copper +K19342 K19342 copper chaperone NosL metals Stressors Heavy Metals copper +cinA cinA "cinA, Copper-binding azurin-like protein" metals Stressors Heavy Metals copper +cueO cueO|K14588 "cueO, cuproxidase" metals Stressors Heavy Metals copper +cutO cutO "cutO, Multicopper oxidase" metals Stressors Heavy Metals copper +mco mco|K22552 "mco, multicopper oxidase" metals Stressors Heavy Metals copper +copL copL "copL, Copper binding protein; higher affinity for Cu(I)" metals Stressors Heavy Metals copper +copY-tcrY copY-tcrY "copY-tcrY, Upstream repressor of CopA/CopB" metals Stressors Heavy Metals copper +corR corR "corR, Transcriptional regulator protein; two component system; cuoABC and copAB" metals Stressors Heavy Metals copper +crdR crdR|K02483 "crdR, two-component system, OmpR family, response regulator" metals Stressors Heavy Metals copper +csoR csoR|K21600 "csoR, CsoR family transcriptional regulator, copper-sensing transcriptional repressor" metals Stressors Heavy Metals copper +cueR-ybbI cueR-ybbI|K11923 "cueR-ybbI, copper efflux regulator" metals Stressors Heavy Metals copper +cusR-ylcA cusR-ylcA|K07665 "cusR-ylcA, copper resistance phosphate regulon response regulator CusR" metals Stressors Heavy Metals copper +hmrR hmrR|K19591 "hmrR, copper efflux regulator" metals Stressors Heavy Metals copper +ycnK ycnK|K21601 "ycnK, copper-sensing transcriptional repressor" metals Stressors Heavy Metals copper +yfmP yfmP|K21902 "yfmP, MerR family transcriptional regulator, repressor of the yfmOP operon" metals Stressors Heavy Metals copper +K18992 K18992 "TetR/AcrR family transcriptional regulator, cmeABC operon repressor" metals Stressors Heavy Metals copper +acrD acrD|K18324 "acrD, multidrug efflux pump" metals Stressors Heavy Metals copper +copA copA|K17686 "copA, P-type Cu+ transporter" metals Stressors Heavy Metals copper +copB copB|K01533 "copB, P-type Cu2+ transporter" metals Stressors Heavy Metals copper +copD copD|K07245 "copD, copper resistance protein D" metals Stressors Heavy Metals copper +copP copP "copP, Copper binding protein; part of cation transport system" metals Stressors Heavy Metals copper +crdA crdA "crdA, Copper resistance determinant" metals Stressors Heavy Metals copper +ctpG ctpG|K12954 "ctpG, cation-transporting P-type ATPase G" metals Stressors Heavy Metals copper +ctpV ctpV|K12956 "ctpV, copper-transporting P-type ATPase V" metals Stressors Heavy Metals copper +cusA-ybdE cusA-ybdE|K07787 "cusA-ybdE, copper/silver efflux system protein" metals Stressors Heavy Metals copper +cusB cusB|K07798 "cusB, membrane fusion protein, copper/silver efflux system" metals Stressors Heavy Metals copper +cusC-ylcB cusC-ylcB|K07796 "cusC-ylcB, outer membrane protein, copper/silver efflux system" metals Stressors Heavy Metals copper +cusF-cusX cusF-cusX|K07810 "cusF-cusX, Cu(I)/Ag(I) efflux system periplasmic protein CusF" metals Stressors Heavy Metals copper +cutE-lnt cutE-lnt|K03820 "cutE-lnt, apolipoprotein N-acyltransferase" metals Stressors Heavy Metals copper +cutF-nlpE cutF-nlpE|K06079 "cutF-nlpE, copper homeostasis protein (lipoprotein)" metals Stressors Heavy Metals copper +hpcopA hpcopA "hpcopA, Copper transport ATPase" metals Stressors Heavy Metals copper +mctB mctB "mctB, Pore-forming protein; copper efflux" metals Stressors Heavy Metals copper +ycnJ ycnJ|K14166 "ycnJ, copper transport protein" metals Stressors Heavy Metals copper +yfmO yfmO|K08221 "yfmO, MFS transporter, ACDE family, multidrug resistance protein" metals Stressors Heavy Metals copper +bfrA bfrA|K03594 "bfrA, bacterioferritin" metals Stressors Heavy Metals iron +dpr-dps dpr-dps "dpr-dps, Sequesters Fe(II), binds and oxidizes to Fe(III) " metals Stressors Heavy Metals iron +dpsA dpsA "dpsA, Stress response, iron-binding protein" metals Stressors Heavy Metals iron +pfr pfr|K02217 "pfr, ferritin" metals Stressors Heavy Metals iron +yqjH yqjH|K07229 "yqjH, ferric-chelate reductase (NADPH)" metals Stressors Heavy Metals iron +ideR ideR|K03709 "ideR, Mn-dependent transcriptional regulator" metals Stressors Heavy Metals iron +pmrA pmrA "pmrA, Transcriptional regulator protein; two component system" metals Stressors Heavy Metals iron +pmrB pmrB "pmrB, Sensor protein; two component system" metals Stressors Heavy Metals iron +fbpA fbpA|K02012 "fbpA, iron(III) transport system substrate-binding protein" metals Stressors Heavy Metals iron +fbpB fbpB|K02011 "fbpB, iron(III) transport system permease protein" metals Stressors Heavy Metals iron +fbpC fbpC|K02010 "fbpC, iron(III) transport system ATP-binding protein" metals Stressors Heavy Metals iron +fieF-yiip fieF-yiip|K13283 "fieF-yiip, ferrous-iron efflux pump FieF" metals Stressors Heavy Metals iron +fptA fptA|K16088 "fptA, outer-membrane receptor for ferric coprogen and ferric-rhodotorulic acid" metals Stressors Heavy Metals iron +mntH-yfeB mntH-yfeB|K03322 "mntH-yfeB, manganese transport protein" metals Stressors Heavy Metals iron +nia nia|K01552 "nia, energy-coupling factor transport system ATP-binding protein" metals Stressors Heavy Metals iron +pmrC pmrC "pmrC, Membrane protein" metals Stressors Heavy Metals iron +ybtP ybtP|K06147 "ybtP, ATP-binding cassette, subfamily B, bacterial" metals Stressors Heavy Metals iron +ybtQ ybtQ|K06147 "ybtQ, ATP-binding cassette, subfamily B, bacterial" metals Stressors Heavy Metals iron +yfeA yfeA|K11604 "yfeA, manganese/iron transport system substrate-binding protein" metals Stressors Heavy Metals iron +yfeB yfeB|K11607 "yfeB, manganese/iron transport system ATP-binding protein" metals Stressors Heavy Metals iron +yfeC yfeC|K11605 "yfeC, manganese/iron transport system permease protein" metals Stressors Heavy Metals iron +yfeD yfeD|K11606 "yfeD, manganese/iron transport system permease protein" metals Stressors Heavy Metals iron +K07224 K07224 iron uptake system component EfeO metals Stressors Heavy Metals iron +pbrR pbrR "pbrR, Transcription factor, regulator" metals Stressors Heavy Metals lead +pbrT pbrT "pbrT, Pb(II) uptake protein; membrane transporter" metals Stressors Heavy Metals lead +K03101 K03101 signal peptidase II metals Stressors Heavy Metals lead +mgtA mgtA|K01531 "mgtA, P-type Mg2+ transporter" metals Stressors Heavy Metals magnesium +K06213 K06213 magnesium transporter metals Stressors Heavy Metals magnesium +mntR mntR|K11924 "mntR, manganese transport regulator" metals Stressors Heavy Metals manganese +ctpC ctpC|K12950 "ctpC, manganese-transporting P-type ATPase C" metals Stressors Heavy Metals manganese +mntA-ytgA mntA-ytgA|K11707 "mntA-ytgA, manganese/zinc/iron transport system substrate-binding protein" metals Stressors Heavy Metals manganese +mntP-yebN mntP-yebN|K23242 "mntP-yebN, manganese efflux pump family protein" metals Stressors Heavy Metals manganese +merB merB|K00221 "merB, alkylmercury lyase" metals Stressors Heavy Metals mercury +merA merA|K00520 "merA, mercuric reductase" metals Stressors Heavy Metals mercury +merD merD|K19057 "merD, mercuric resistance operon regulatory protein" metals Stressors Heavy Metals mercury +merR merR|K08365 "merR, mercuric resistance operon regulatory protein" metals Stressors Heavy Metals mercury +merC merC|K19058 "merC, mercuric ion transport protein" metals Stressors Heavy Metals mercury +merE merE|K19059 "merE, mercuric ion transport protein" metals Stressors Heavy Metals mercury +merF merF|K19058 "merF, mercuric ion transport protein" metals Stressors Heavy Metals mercury +merP merP|K08364 "merP, periplasmic mercuric ion binding protein" metals Stressors Heavy Metals mercury +merT merT|K08363 "merT, mercuric ion transport protein" metals Stressors Heavy Metals mercury +nikR nikR|K07722 "nikR, CopG family transcriptional regulator, nickel-responsive regulator" metals Stressors Heavy Metals nickel +nrsS nrsS|K11328 "nrsS, Ni(II)-sensor and/or redox sensor kinase NrsS" metals Stressors Heavy Metals nickel +K11330 K11330 Ni(II)-responsive and/or redox-responsive regulator NrsR metals Stressors Heavy Metals nickel +hupE hupE "hupE, Nickel transporter; metal permease" metals Stressors Heavy Metals nickel +nikA nikA|K15584 "nikA, nickel transport system substrate-binding protein" metals Stressors Heavy Metals nickel +nikB nikB|K15585 "nikB, nickel transport system permease protein" metals Stressors Heavy Metals nickel +nikC nikC|K15586 "nikC, nickel transport system permease protein" metals Stressors Heavy Metals nickel +nikD nikD|K15587 "nikD, nickel transport system ATP-binding protein" metals Stressors Heavy Metals nickel +nikE nikE|K10824 "nikE, nickel transport system ATP-binding protein" metals Stressors Heavy Metals nickel +nixA nixA|K07241 "nixA, nickel/cobalt transporter (NiCoT) family protein" metals Stressors Heavy Metals nickel +nrsA nrsA|K11326 "nrsA, cation efflux system protein involved in nickel and cobalt tolerance" metals Stressors Heavy Metals nickel +silF silF "silF, Silver cation efflux system; chaperone" metals Stressors Heavy Metals silver +silE silE "silE, Silver cation efflux system; binding protein" metals Stressors Heavy Metals silver +silP silP|K23254 "silP, P-type Ag+ transporter" metals Stressors Heavy Metals silver +smtA smtA|K21904 "smtA, Zinc binding metallothionein" metals Stressors Heavy Metals zinc +zevA zevA "zevA, Zinc binding protein" metals Stressors Heavy Metals zinc +zraP zraP|K07803 "zraP, zinc resistance-associated protein" metals Stressors Heavy Metals zinc +zinT-yodA zinT-yodA "zinT-yodA, Periplasmic zinc (and cadmium) binding protein" metals Stressors Heavy Metals zinc +zntR-yhdM zntR-yhdM|K13638 "zntR-yhdM, Zn(II)-responsive regulator of zntA" metals Stressors Heavy Metals zinc +zraR-hydH zraR-hydH|K07713 "zraR-hydH, two-component system, NtrC family, response regulator HydG" metals Stressors Heavy Metals zinc +zraS-hydG zraS-hydG|K07709 "zraS-hydG, two-component system, NtrC family, sensor histidine kinase HydH" metals Stressors Heavy Metals zinc +zur-yjbK zur-yjbK|K09823 "zur-yjbK, Fur family transcriptional regulator, zinc uptake regulator" metals Stressors Heavy Metals zinc +K03709 K03709 Mn-dependent transcriptional regulator metals Stressors Heavy Metals zinc +mdtA mdtA|K07799 "mdtA, membrane fusion protein, multidrug efflux system" metals Stressors Heavy Metals zinc +mdtB mdtB|K07788 "mdtB, multidrug efflux pump" metals Stressors Heavy Metals zinc +mdtC mdtC|K07789 "mdtC, multidrug efflux pump" metals Stressors Heavy Metals zinc +troB troB|K11710 "troB, manganese/zinc/iron transport system ATP- binding protein" metals Stressors Heavy Metals zinc +zipB zipB|K07238 "zipB, zinc transporter, ZIP family" metals Stressors Heavy Metals zinc +znuA-yebL znuA-yebL|K09815 "znuA-yebL, zinc transport system substrate-binding protein" metals Stressors Heavy Metals zinc +znuB-yebI znuB-yebI|K09816 "znuB-yebI, zinc transport system permease protein" metals Stressors Heavy Metals zinc +znuC-yebM znuC-yebM|K09817 "znuC-yebM, zinc transport system ATP-binding protein" metals Stressors Heavy Metals zinc +K11708 K11708 manganese/zinc/iron transport system permease protein metals Stressors Heavy Metals zinc +K11709 K11709 manganese/zinc/iron transport system permease protein metals Stressors Heavy Metals zinc diff --git a/bin/assets/forms/distill_sheets/distill_misc.tsv b/bin/assets/forms/distill_sheets/distill_misc.tsv old mode 100755 new mode 100644 diff --git a/bin/assets/forms/distill_sheets/distill_nitrogen.tsv b/bin/assets/forms/distill_sheets/distill_nitrogen.tsv old mode 100755 new mode 100644 diff --git a/bin/assets/forms/distill_sheets/distill_transport.tsv b/bin/assets/forms/distill_sheets/distill_transport.tsv old mode 100755 new mode 100644 diff --git a/bin/assets/forms/distill_sheets/dummy.tsv b/bin/assets/forms/distill_sheets/dummy.tsv old mode 100755 new mode 100644 index fe3a0735..7951defe --- a/bin/assets/forms/distill_sheets/dummy.tsv +++ b/bin/assets/forms/distill_sheets/dummy.tsv @@ -1 +1 @@ -NULL \ No newline at end of file +NULL diff --git a/bin/assets/forms/distill_sheets/methylotrophy_distillate.tsv b/bin/assets/forms/distill_sheets/methylotrophy_distillate.tsv old mode 100755 new mode 100644 index 45cce057..02dd0d35 --- a/bin/assets/forms/distill_sheets/methylotrophy_distillate.tsv +++ b/bin/assets/forms/distill_sheets/methylotrophy_distillate.tsv @@ -1,10 +1,10 @@ gene_id gene_description pathway topic_ecosystem category subcategory fasta -K25220 MtxB; Quaternary amine methyltransferase (Glycine betaine methyltransferase, MtgB) [EC:2.1.1.376] QA demethylation METHYL Catabolism Anaerobic +K25220 MtxB; Quaternary amine methyltransferase (Glycine betaine methyltransferase, MtgB) [EC:2.1.1.376] QA demethylation METHYL Catabolism Anaerobic METHYL_0001 MtgC; Quaternary amine/glycine betaine corrinoid binding protein QA demethylation METHYL Catabolism Anaerobic MtgC_DSY3155_Desulfitobacterium_hafniense_Q24SP8;MV8465_Methanolobus_vulcani_b1d_corrinoid_mtgC_homolog_WP_154809803.1 METHYL_0002 MtgA; Quaternary amine/glycine betaine specific methylcorrinoid:THF methyltransferase QA demethylation METHYL Catabolism Anaerobic MtgA_DSY3157_Desulfitobacterium_hafniense_Y51_substrate_glycine_betaine_corrinoid:THF_Q24SP6-1 METHYL_0003 MV8460; methanogenic glycine betaine:corrinoid methyltransferase QA demethylation METHYL Catabolism Anaerobic MV8460_methanogenic_Methanolobus_vulcani_b1d_substrate_glycine_betaine_WP_154809802.1 METHYL_0004 MV8465; methanogenic glycine betaine corrinoid binding protein QA demethylation METHYL Catabolism Anaerobic MV8465_Methanolobus_vulcani_b1d_corrinoid_mtgC_homolog_WP_154809803.1 -K14080 MV10360; methanogenic glycine betaine specific methylcorrinoid:CoM methyltransferase [EC:2.1.1.377] QA demethylation METHYL Catabolism Anaerobic +K14080 MV10360; methanogenic glycine betaine specific methylcorrinoid:CoM methyltransferase [EC:2.1.1.377] QA demethylation METHYL Catabolism Anaerobic METHYL_0005 MV10335/RamM; methanogenic corrinoid-protein reductive activase QA demethylation METHYL Catabolism Anaerobic MV10335_methanogenic_Methanolobus_vulcani_b1d_substrate_glycine_betaine_acrtivase_ramM METHYL_0006 MtpB; proline betaine:corrinoid methyltransferase QA demethylation METHYL Catabolism Anaerobic MtpB_proline_betaine:corrinoid_methyltransferase_Eubacterium_limosum_ATCC_8486 METHYL_0007 MtcB: L-carnitine:corrinoid methyltransferase QA demethylation METHYL Catabolism Anaerobic MtcB_L-carnitine:corrinoid_methyltransferase_Eubacterium_limosum_ATCC_8486 @@ -12,96 +12,96 @@ METHYL_0008 MtyB; gamma-butyrobetaine:corrinoid methyltransferase QA demethylati METHYL_0009 MtqC; quaternary amine promiscuous corrinoid binding protein QA demethylation METHYL Catabolism Anaerobic MtqC_promiscuous_QA_corrinoid_Carnitine_ProlineBetaine_Butyrobetaine_Eubacterium_limosum_ATCC_8486 METHYL_0010 MtqA; quaternary amine promiscuous methylcorrinoid:THF methyltransferase QA demethylation METHYL Catabolism Anaerobic MtqA_promiscuous_corrinoid:THF_MT_Carnitine_ProlineBetaine_Butyrobetaine_Eubacterium_limosum_ATCC_8486 METHYL_0011 RamQ; quaternary amine promiscuous corrinoid protein reductive activase QA demethylation METHYL Catabolism Anaerobic RamQ_promiscuous_MtqC_activase_Carnitine_ProlineBetaine_Butyrobetaine_Eubacterium_limosum_ATCC_8486 -K01599 uroporphyrinogen decarboxylase [EC:4.1.1.37] [RN:R03197] (methyltransferase homolog/frequent mis-annotation) Heme biosynthesis, animals and fungi, glycine => heme METHYL Catabolism Anaerobic -K14083 MttB/MtxB; Trimethylamine methyltransferase [EC:2.1.1.250], potentially a quaternary amine enzyme if lacking pyrrolysine QA demethylation METHYL Catabolism Anaerobic -K14084 MttC; trimethylamine corrinoid binding protein [EC:2.1.1.247] QA demethylation METHYL Catabolism Anaerobic -K16178 MtbB; dimethylamine methyltransferase DMA demethylation METHYL Catabolism Anaerobic -K16179 MtbC; dimethylamine corrinoid binding protein DMA demethylation METHYL Catabolism Anaerobic -K16176 MtmB; monomethylamine methyltransferase MMA demethylation METHYL Catabolism Anaerobic -K16177 MtmC; monomethylamine corrinoid binding protein MMA demethylation METHYL Catabolism Anaerobic -K14082 MtbA; methylamine methylcorrinoid:CoM methyltransferase [EC:2.1.1.247] Methylamine:CoM methyltransfer METHYL Catabolism Anaerobic +K01599 uroporphyrinogen decarboxylase [EC:4.1.1.37] [RN:R03197] (methyltransferase homolog/frequent mis-annotation) Heme biosynthesis, animals and fungi, glycine => heme METHYL Catabolism Anaerobic +K14083 MttB/MtxB; Trimethylamine methyltransferase [EC:2.1.1.250], potentially a quaternary amine enzyme if lacking pyrrolysine QA demethylation METHYL Catabolism Anaerobic +K14084 MttC; trimethylamine corrinoid binding protein [EC:2.1.1.247] QA demethylation METHYL Catabolism Anaerobic +K16178 MtbB; dimethylamine methyltransferase DMA demethylation METHYL Catabolism Anaerobic +K16179 MtbC; dimethylamine corrinoid binding protein DMA demethylation METHYL Catabolism Anaerobic +K16176 MtmB; monomethylamine methyltransferase MMA demethylation METHYL Catabolism Anaerobic +K16177 MtmC; monomethylamine corrinoid binding protein MMA demethylation METHYL Catabolism Anaerobic +K14082 MtbA; methylamine methylcorrinoid:CoM methyltransferase [EC:2.1.1.247] Methylamine:CoM methyltransfer METHYL Catabolism Anaerobic METHYL_0012 RamA; methylamine corrinoid binding protein reductive activase Methylamine:CoM methyltransfer METHYL Catabolism Anaerobic RamA;_methylamine_corrinoid_binding_protein_reductive_activase_Methanosarcina_barkeri -K16180 PylB; Methylornithine synthase [EC:5.4.99.58] Pyrrolysine biosynthesis METHYL Amino Acid Biosynthesis Cofactor/Other_biosynthesis -K16181 PylC; Pyrrolysine synthetase [EC:6.3.2.59] Pyrrolysine biosynthesis METHYL Amino Acid Biosynthesis Cofactor/Other_biosynthesis -K16182 PylD; Pyrrolysine synthase [EC:1.4.1.-] Pyrrolysine biosynthesis METHYL Amino Acid Biosynthesis Cofactor/Other_biosynthesis -K11627 PylS; pyrrolysyl-tRNA synthetase [EC:6.1.1.26] Pyrrolysine biosynthesis METHYL Amino Acid Biosynthesis Cofactor/Other_biosynthesis -K14239 PylT; tRNA-pyl Pyrrolysine biosynthesis METHYL Amino Acid Biosynthesis Cofactor/Other_biosynthesis -K02302 CysG; uroporphyrin-III C-methyltransferase/precorrin-2 dehydrogenase/sirohydrochlorin ferrochelatase [ec:2.1.1.107;1.3.1.76;4.99.1.4] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K24866 SirC; preccorin-2 dehydrogenase [EC:1.3.1.76] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K02303 CobAM; uroporphyrin-III C-methyltransferase [EC:2.1.1.107] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K22011 CfbA; sirohydrochlorin cobalto/nickelchelatase [EC:4.99.1.3;4.99.1.110] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K03795 CbiX; sirohydrochlorin cobaltochelatase [ED:4.99.1.3] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K02190 CbiX; sirohydrochlorin cobaltochelatase [ED:4.99.1.3] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K03394 CobI, CbiL; precorrin-2/cobalt-factor-2 C20-methyltransferase [EC:2.1.1.130;2.1.1.151] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K21479 CbiH60; cobalt-factor-III methyltransferase Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K05934 CobJ, CibH; precorrin-3B C17-methyltransferase/cobalt-factor-III methyltransferase [EC:2.1.1.131;2.1.1.272] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K13541 CbiGH, CobJ; cobalt-precorrin 5A hydrolase/cobalt-factor-III methyltransferase/precorrin-3B C17 methyltransferase [ec:3.7.1.12;2.1.1.272;2.1.1.131] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K05936 CobM, CbiF; precorrin-4/cobalt-precorrin-4 C11-methyltransferase [EC 2.1.1.133;2.1.1.271] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K02189 CbiG; cobalt-precorrin 5A hydrolase [EC:3.7.1.12] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K02188 CbiD; cobalt-precorrin 5B hydrolase (C1) methyltransferase [EC:2.1.1.195] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K05895 CobK-CbiJ; precorrin-6A/cobalt-precorrin 6A reductase [EC:1.3.1.54;1.3.1.106] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K02192 CbiT; cobalt-precorrin-6B (C15)-methyltransferase[EC:2.1.1.196] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K00595 CobL, CbiET; precorrin-6B C5, 15-methyltransferase/cobalt-precorrin-6B C5,C15-methyltransferase [EC:2.1.1.132,2.1.1.289,2.1.1.196] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K02232 cobQ, cbiP; adenosylcobyric acid synthase [EC:6.3.5.10] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K02231 CobP, CobU; adenosylcobinamide kinase/adenosylcobinamide phosphate guanylyltransferase [EC:2.7.1.156;2.7.7.62] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K02233 E2.7.8.26, cobS, cobV; adenosylcobinamide-GDP ribazoletransferase [EC:2.7.8.26] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K00798 MMAB, pduO; cob(I)alamin adenosyltransferase [EC:2.5.1.17] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K19221 cobA, btuR; cob(I)alamin adenosyltransferase [EC:2.5.1.17] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K19712 cobY; adenosylcobinamide-phosphate guanylyltransferase [EC:2.7.7.62] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K02227 cbiB, cobD; adenosylcobinamide-phosphate synthase [EC:6.3.1.10] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K02225 cobC1, cobC; cobalamin biosynthetic protein Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K13786 cobR; cob(II)yrinic acid a,c-diamide reductase [EC:1.16.8.1] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K03399 CbiE; cobalt-precorrin-7 (C5)-methyltransferase [EC 2.1.1.289] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K06042 CobH, CbiC; precorrin-8X/cobalt-precorrin08 methylmutase [EC:5.4.99.61] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K02224 CobB, CbiA; cobyrinic acid a,c-diamide synthase [EC:6.3.5.9;6.2.5.11] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K13540 CobIJ; precorrin-2 C20-methyltransferase/precorrin-3B C17-methyltransferase [EC:2.1.1.130;2.1.1.131] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K02229 CobG; precorrin 3B synthase [EC:1.14.13.83] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K02228 CobF; precorrin-6A synthase [EC:2.1.1.152] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K02230 CobN; cobaltochelatase [EC:6.6.1.2] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K09882 CobS; cobaltochelatase [EC:6.6.1.2] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K09883 CobT; cobaltochelatase [EC:6.6.1.2] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K02226 CobC, PhpB; alpha-ribazole phosphatase [EC:3.1.3.73] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K22316 RhnA, CobC; ribonuclease h/adenosylcobalamin/alpha-ribazole phosphatase [EC:3.1.26.4;3.1.3.73] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K00768 CobU, CobT; nicotinate-nucleotide-dimethylbenzimidazole phosphoribosyltransferase [EC:2.4.2.21] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis -K16092 BtuB; vitamin-B12 transporter Cobalamin uptake METHYL Cofactors Cofactor/Other_biosynthesis -K06073 BtuC; vitamin-B12 transport system permease protein Cobalamin uptake METHYL Cofactors Cofactor/Other_biosynthesis -K06074 BtuD; vitamin-B12 transport system-ATP binding protein [EC:7.6.2.8] Cobalamin uptake METHYL Cofactors Cofactor/Other_biosynthesis -K25028 BtuD; vitamin-B12 transport system-ATP binding protein [EC:7.6.2.8] Cobalamin uptake METHYL Cofactors Cofactor/Other_biosynthesis -K00432 BtuE; vitamin-B12 transport system - periplasmic protein Cobalamin uptake METHYL Cofactors Cofactor/Other_biosynthesis -K06858 BtuF; vitamin-B12 transport system-substrate binding protein Cobalamin uptake METHYL Cofactors Cofactor/Other_biosynthesis -K02168 BetTS; choline/glycine/proline betaine transport protein QA transporter METHYL Transporter Transport -K03451 TC.BCT; choline/carnitine/betaine/glycine/BCCT transporter QA transporter METHYL Transporter Transport -K05020 OpuD, BetL; glycine-betaine transporter QA transporter METHYL Transporter Transport -K03762 ProP; Proline/betaine MFS transporter, PPII, proline permease II QA transporter METHYL Transporter Transport -K03607 ProQ; proline/betaine (ProP effector) QA transporter METHYL Transporter Transport -K02000 ProV; glycine-betaine/proline transport system ATP binding protein [EC:7.6.2.9] QA transporter METHYL Transporter Transport -K02001 ProW; glycine-betaine/proline transport system permease protein QA transporter METHYL Transporter Transport -K02002 ProX; glycine-betaine/proline transport system substrate binding protein QA transporter METHYL Transporter Transport -K05845 OpuC; Osmoprotectant transport system substrate binding protein QA transporter METHYL Transporter Transport -K05846 OpuBD; Osmoprotectant transport system permease QA transporter METHYL Transporter Transport -K05847 OpuA; Osmoprotectant transport system ATP-binding protein [EC:7.6.2.9] QA transporter METHYL Transporter Transport -K18896 GSMT; glycine/sarcosine N-methyltransferase [EC:2.1.1.156] QA transporter METHYL Transporter Aerobic -K18897 SDMT; sarcosine/dimethylglycine N-methyltransferase [EC:2.1.1.157] QA transporter METHYL Transporter Aerobic -K22443 YeaW; carnitine/QA-promiscuous monooxygenase subunit, YeaW [ED 1.14.13.239] QA cleavage to TMA METHYL Catabolism Aerobic -K22444 YeaX carnitine/QA-promiscuous monooxygenase reductase subunit [EC 1.14.13.239] QA cleavage to TMA METHYL Catabolism Aerobic -K22443 CntA; carnitine rieske-type oxygenase [EC:1.14.13.239] QA cleavage to TMA METHYL Catabolism Aerobic -K22444 CntB; carnitine rieske-type reductase [EC:1.14.13.239] QA cleavage to TMA METHYL Catabolism Aerobic -K20038 CutC; choline trimethylamine lysae [EC:4.3.99.4] QA cleavage to TMA METHYL Catabolism Anaerobic -K20037 CutD; glycyl-radical activating enzyme [EC:1.97.1.-] QA cleavage to TMA METHYL Catabolism Anaerobic -K01066 aes; actyl esterase (potentially HocS from Pseuodmonas); [EC:3.1.1.28] Acylcarnitine -> carnitine METHYL Catabolism -K05245 CaiT; L-carnitine/gamma-butyrobetaine antiporter Cai operon METHYL Carnitine reduction Anaerobic -K08297 CaiA; crotonobetainly-CoA dehydrogenase [EC:1.3.8.13] Cai operon METHYL Carnitine reduction Anaerobic -K08298 CaiB; L-carnitine CoA-transferase [EC:2.8.3.21] Cai operon METHYL Carnitine reduction Anaerobic -K02182 CaiC; carnitine-CoA ligase [EC:6.2.1.48] Cai operon METHYL Carnitine reduction Anaerobic -K08299 CaiD; crotonobetainyl-CoA hydratase [EC:4.2.1.149] Cai operon METHYL Carnitine reduction Anaerobic -K08279 CaiE; carnitine operon protein Cai operon METHYL Carnitine reduction Anaerobic -K08277 CaiF; tanscriptional activator Cai operon METHYL Carnitine reduction Anaerobic -K03521 FixA; electron transfer flavoprotein beta subunit Fix operon METHYL Carnitine reduction Anaerobic -K03522 FixB; electron transfer flavoprotein alpha subunit Fix operon METHYL Carnitine reduction Anaerobic -K00313 FixC; electron transfer flavoprotein-quinone oxidoreductase [EC:1.5.5.-] Fix operon METHYL Carnitine reduction Anaerobic -K03855 FixX; ferredoxin-like protein Fix operon METHYL Carnitine reduction Anaerobic -K00548 metH; cobalamin-dependent methionine synthase [EC:2.1.1.13] Methionine Biosynthesis METHYL Amino Acid Biosynthesis -K00471 BBOX1; gamma-butyrobetaine hydroxylase/dioxygenase [EC:1.14.11.1] Butyrobetaine -> Carnitine -> Glycine betaine METHYL Catabolism Aerobic +K16180 PylB; Methylornithine synthase [EC:5.4.99.58] Pyrrolysine biosynthesis METHYL Amino Acid Biosynthesis Cofactor/Other_biosynthesis +K16181 PylC; Pyrrolysine synthetase [EC:6.3.2.59] Pyrrolysine biosynthesis METHYL Amino Acid Biosynthesis Cofactor/Other_biosynthesis +K16182 PylD; Pyrrolysine synthase [EC:1.4.1.-] Pyrrolysine biosynthesis METHYL Amino Acid Biosynthesis Cofactor/Other_biosynthesis +K11627 PylS; pyrrolysyl-tRNA synthetase [EC:6.1.1.26] Pyrrolysine biosynthesis METHYL Amino Acid Biosynthesis Cofactor/Other_biosynthesis +K14239 PylT; tRNA-pyl Pyrrolysine biosynthesis METHYL Amino Acid Biosynthesis Cofactor/Other_biosynthesis +K02302 CysG; uroporphyrin-III C-methyltransferase/precorrin-2 dehydrogenase/sirohydrochlorin ferrochelatase [ec:2.1.1.107;1.3.1.76;4.99.1.4] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K24866 SirC; preccorin-2 dehydrogenase [EC:1.3.1.76] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K02303 CobAM; uroporphyrin-III C-methyltransferase [EC:2.1.1.107] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K22011 CfbA; sirohydrochlorin cobalto/nickelchelatase [EC:4.99.1.3;4.99.1.110] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K03795 CbiX; sirohydrochlorin cobaltochelatase [ED:4.99.1.3] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K02190 CbiX; sirohydrochlorin cobaltochelatase [ED:4.99.1.3] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K03394 CobI, CbiL; precorrin-2/cobalt-factor-2 C20-methyltransferase [EC:2.1.1.130;2.1.1.151] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K21479 CbiH60; cobalt-factor-III methyltransferase Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K05934 CobJ, CibH; precorrin-3B C17-methyltransferase/cobalt-factor-III methyltransferase [EC:2.1.1.131;2.1.1.272] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K13541 CbiGH, CobJ; cobalt-precorrin 5A hydrolase/cobalt-factor-III methyltransferase/precorrin-3B C17 methyltransferase [ec:3.7.1.12;2.1.1.272;2.1.1.131] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K05936 CobM, CbiF; precorrin-4/cobalt-precorrin-4 C11-methyltransferase [EC 2.1.1.133;2.1.1.271] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K02189 CbiG; cobalt-precorrin 5A hydrolase [EC:3.7.1.12] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K02188 CbiD; cobalt-precorrin 5B hydrolase (C1) methyltransferase [EC:2.1.1.195] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K05895 CobK-CbiJ; precorrin-6A/cobalt-precorrin 6A reductase [EC:1.3.1.54;1.3.1.106] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K02192 CbiT; cobalt-precorrin-6B (C15)-methyltransferase[EC:2.1.1.196] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K00595 CobL, CbiET; precorrin-6B C5, 15-methyltransferase/cobalt-precorrin-6B C5,C15-methyltransferase [EC:2.1.1.132,2.1.1.289,2.1.1.196] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K02232 cobQ, cbiP; adenosylcobyric acid synthase [EC:6.3.5.10] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K02231 CobP, CobU; adenosylcobinamide kinase/adenosylcobinamide phosphate guanylyltransferase [EC:2.7.1.156;2.7.7.62] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K02233 E2.7.8.26, cobS, cobV; adenosylcobinamide-GDP ribazoletransferase [EC:2.7.8.26] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K00798 MMAB, pduO; cob(I)alamin adenosyltransferase [EC:2.5.1.17] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K19221 cobA, btuR; cob(I)alamin adenosyltransferase [EC:2.5.1.17] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K19712 cobY; adenosylcobinamide-phosphate guanylyltransferase [EC:2.7.7.62] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K02227 cbiB, cobD; adenosylcobinamide-phosphate synthase [EC:6.3.1.10] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K02225 cobC1, cobC; cobalamin biosynthetic protein Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K13786 cobR; cob(II)yrinic acid a,c-diamide reductase [EC:1.16.8.1] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K03399 CbiE; cobalt-precorrin-7 (C5)-methyltransferase [EC 2.1.1.289] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K06042 CobH, CbiC; precorrin-8X/cobalt-precorrin08 methylmutase [EC:5.4.99.61] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K02224 CobB, CbiA; cobyrinic acid a,c-diamide synthase [EC:6.3.5.9;6.2.5.11] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K13540 CobIJ; precorrin-2 C20-methyltransferase/precorrin-3B C17-methyltransferase [EC:2.1.1.130;2.1.1.131] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K02229 CobG; precorrin 3B synthase [EC:1.14.13.83] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K02228 CobF; precorrin-6A synthase [EC:2.1.1.152] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K02230 CobN; cobaltochelatase [EC:6.6.1.2] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K09882 CobS; cobaltochelatase [EC:6.6.1.2] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K09883 CobT; cobaltochelatase [EC:6.6.1.2] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K02226 CobC, PhpB; alpha-ribazole phosphatase [EC:3.1.3.73] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K22316 RhnA, CobC; ribonuclease h/adenosylcobalamin/alpha-ribazole phosphatase [EC:3.1.26.4;3.1.3.73] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K00768 CobU, CobT; nicotinate-nucleotide-dimethylbenzimidazole phosphoribosyltransferase [EC:2.4.2.21] Cobalamin biosynthesis METHYL Cofactors Cofactor/Other_biosynthesis +K16092 BtuB; vitamin-B12 transporter Cobalamin uptake METHYL Cofactors Cofactor/Other_biosynthesis +K06073 BtuC; vitamin-B12 transport system permease protein Cobalamin uptake METHYL Cofactors Cofactor/Other_biosynthesis +K06074 BtuD; vitamin-B12 transport system-ATP binding protein [EC:7.6.2.8] Cobalamin uptake METHYL Cofactors Cofactor/Other_biosynthesis +K25028 BtuD; vitamin-B12 transport system-ATP binding protein [EC:7.6.2.8] Cobalamin uptake METHYL Cofactors Cofactor/Other_biosynthesis +K00432 BtuE; vitamin-B12 transport system - periplasmic protein Cobalamin uptake METHYL Cofactors Cofactor/Other_biosynthesis +K06858 BtuF; vitamin-B12 transport system-substrate binding protein Cobalamin uptake METHYL Cofactors Cofactor/Other_biosynthesis +K02168 BetTS; choline/glycine/proline betaine transport protein QA transporter METHYL Transporter Transport +K03451 TC.BCT; choline/carnitine/betaine/glycine/BCCT transporter QA transporter METHYL Transporter Transport +K05020 OpuD, BetL; glycine-betaine transporter QA transporter METHYL Transporter Transport +K03762 ProP; Proline/betaine MFS transporter, PPII, proline permease II QA transporter METHYL Transporter Transport +K03607 ProQ; proline/betaine (ProP effector) QA transporter METHYL Transporter Transport +K02000 ProV; glycine-betaine/proline transport system ATP binding protein [EC:7.6.2.9] QA transporter METHYL Transporter Transport +K02001 ProW; glycine-betaine/proline transport system permease protein QA transporter METHYL Transporter Transport +K02002 ProX; glycine-betaine/proline transport system substrate binding protein QA transporter METHYL Transporter Transport +K05845 OpuC; Osmoprotectant transport system substrate binding protein QA transporter METHYL Transporter Transport +K05846 OpuBD; Osmoprotectant transport system permease QA transporter METHYL Transporter Transport +K05847 OpuA; Osmoprotectant transport system ATP-binding protein [EC:7.6.2.9] QA transporter METHYL Transporter Transport +K18896 GSMT; glycine/sarcosine N-methyltransferase [EC:2.1.1.156] QA transporter METHYL Transporter Aerobic +K18897 SDMT; sarcosine/dimethylglycine N-methyltransferase [EC:2.1.1.157] QA transporter METHYL Transporter Aerobic +K22443 YeaW; carnitine/QA-promiscuous monooxygenase subunit, YeaW [ED 1.14.13.239] QA cleavage to TMA METHYL Catabolism Aerobic +K22444 YeaX carnitine/QA-promiscuous monooxygenase reductase subunit [EC 1.14.13.239] QA cleavage to TMA METHYL Catabolism Aerobic +K22443 CntA; carnitine rieske-type oxygenase [EC:1.14.13.239] QA cleavage to TMA METHYL Catabolism Aerobic +K22444 CntB; carnitine rieske-type reductase [EC:1.14.13.239] QA cleavage to TMA METHYL Catabolism Aerobic +K20038 CutC; choline trimethylamine lysae [EC:4.3.99.4] QA cleavage to TMA METHYL Catabolism Anaerobic +K20037 CutD; glycyl-radical activating enzyme [EC:1.97.1.-] QA cleavage to TMA METHYL Catabolism Anaerobic +K01066 aes; actyl esterase (potentially HocS from Pseuodmonas); [EC:3.1.1.28] Acylcarnitine -> carnitine METHYL Catabolism +K05245 CaiT; L-carnitine/gamma-butyrobetaine antiporter Cai operon METHYL Carnitine reduction Anaerobic +K08297 CaiA; crotonobetainly-CoA dehydrogenase [EC:1.3.8.13] Cai operon METHYL Carnitine reduction Anaerobic +K08298 CaiB; L-carnitine CoA-transferase [EC:2.8.3.21] Cai operon METHYL Carnitine reduction Anaerobic +K02182 CaiC; carnitine-CoA ligase [EC:6.2.1.48] Cai operon METHYL Carnitine reduction Anaerobic +K08299 CaiD; crotonobetainyl-CoA hydratase [EC:4.2.1.149] Cai operon METHYL Carnitine reduction Anaerobic +K08279 CaiE; carnitine operon protein Cai operon METHYL Carnitine reduction Anaerobic +K08277 CaiF; tanscriptional activator Cai operon METHYL Carnitine reduction Anaerobic +K03521 FixA; electron transfer flavoprotein beta subunit Fix operon METHYL Carnitine reduction Anaerobic +K03522 FixB; electron transfer flavoprotein alpha subunit Fix operon METHYL Carnitine reduction Anaerobic +K00313 FixC; electron transfer flavoprotein-quinone oxidoreductase [EC:1.5.5.-] Fix operon METHYL Carnitine reduction Anaerobic +K03855 FixX; ferredoxin-like protein Fix operon METHYL Carnitine reduction Anaerobic +K00548 metH; cobalamin-dependent methionine synthase [EC:2.1.1.13] Methionine Biosynthesis METHYL Amino Acid Biosynthesis +K00471 BBOX1; gamma-butyrobetaine hydroxylase/dioxygenase [EC:1.14.11.1] Butyrobetaine -> Carnitine -> Glycine betaine METHYL Catabolism Aerobic METHYL_0013 BcoA; gamma-butyrobetainyl-CoA synthetase Butyrobetaine -> Carnitine -> Glycine betaine METHYL Catabolism Aerobic BcoAB;_gamma-butyrobetainyl-CoA_synthetase METHYL_0014 BcoD; crotonobetainyl-CoA hydratase Butyrobetaine -> Carnitine -> Glycine betaine METHYL Catabolism Aerobic BcoD;_crotonobetainyl-CoA_hydratase _Sinorhizobium_meliloti_Emergencia_timonensis METHYL_0015 BcoE; carnitine dehydrogenase Butyrobetaine -> Carnitine -> Glycine betaine METHYL Catabolism Aerobic BcoEF;_carnitine_dehydrogenase/thioesterase_Sinorhizobium_meliloti_Emergencia_timonensis @@ -113,36 +113,36 @@ METHYL_0020 BbuC; class III CoA transferase Butyrobetaine -> TMA METHYL Cataboli METHYL_0021 BbuD; 2[4Fe-4S] ferredoxin Butyrobetaine -> TMA METHYL Catabolism Anaerobic BbuD;_2[4Fe-4S]_ferredoxin_Emergencia_timonensis METHYL_0022 BbuE; BCCT transporter Butyrobetaine -> TMA METHYL Catabolism Anaerobic BbuE;_BCCT_transporter _Emergencia_timonensis METHYL_0023 BbuF; CoA thiosesterase Butyrobetaine -> TMA METHYL Catabolism Anaerobic BbuF;_CoA_thiosesterase_Emergencia_timonensis\ -K00108 BetA; choline dehydrogenase [EC:1.1.99.1] Choline -> Glycine betaine METHYL Catabolism Aerobic -K00130 BetB; betaine-aldehyde dehydrogenase [EC:1.2.1.8] Choline -> Glycine betaine METHYL Catabolism Aerobic -1.1.1.254 DchH; D-carnitine dehydrogenase [EC1.1.1.254] Carnitine -> Glycine betaine METHYL Catabolism Aerobic -K17735 LcdH, CdhA; L-carnitine dehydrogenase [EC:1.1.1.108] Carnitine -> Glycine betaine METHYL Catabolism Aerobic +K00108 BetA; choline dehydrogenase [EC:1.1.99.1] Choline -> Glycine betaine METHYL Catabolism Aerobic +K00130 BetB; betaine-aldehyde dehydrogenase [EC:1.2.1.8] Choline -> Glycine betaine METHYL Catabolism Aerobic +1.1.1.254 DchH; D-carnitine dehydrogenase [EC1.1.1.254] Carnitine -> Glycine betaine METHYL Catabolism Aerobic +K17735 LcdH, CdhA; L-carnitine dehydrogenase [EC:1.1.1.108] Carnitine -> Glycine betaine METHYL Catabolism Aerobic METHYL_0024 BmoA; glycine betaine monooxygenase Glycine betaine -> dimethylglycine -> -> glycine METHYL Catabolism Aerobic BmoA;_glycine_betaine_monooxygenase_Chromohalobacter_salexigens_DSM3403 METHYL_0025 BmoB; glycine betaine NADH-dependent flavin reductase Glycine betaine -> dimethylglycine -> -> glycine METHYL Catabolism Aerobic BmoB;_glycine_betaine_NADH-dependent_flavin_reductase_Chromohalobacter_salexigens_DSM3403 -K00479 GbcA; glycine betaine demehthylae, subunit A Glycine betaine -> dimethylglycine -> -> glycine METHYL Catabolism Aerobic -K21832 GbcB; glycine betaine demethylase, subunit B Glycine betaine -> dimethylglycine -> -> glycine METHYL Catabolism Aerobic -K00544 BHMT; betaine-homocysteine methyltransferase [EC:2.1.1.5] Glycine betaine -> dimethylglycine -> -> glycine METHYL Catabolism Aerobic -K24003 Stc2; stachydrine N-demethylase Proline betaine --> N-methylproline METHYL Catabolism Aerobic -K22551 hpba; N-methyl-L-proline demethylase [EC:1.5.3.-] Proline betaine --> N-methylproline -> proline METHYL Catabolism Aerobic -K21579 GrdH; betaine reductase complex component B subunit beta [EC:1.21.4.4] Glycine betaine -> TMA METHYL Catabolism Aerobic -K21578 GrdI; betaine reductase complex component B subunit alpha [EC:1.21.4.4] Glycine betaine -> TMA METHYL Catabolism Aerobic -K10670 GrdA; glycine/sarcosine/betaine reductase complex component A [EC:1.21.4.2;1.21.4.3;1.21.4.4] Glycine betaine -> TMA METHYL Catabolism Aerobic -K21576 GrdD; glycine/sarcosine/betaine reductase complex component C subunit alpha [EC:1.21.4.2;1.21.4.3;1.21.4.4] Glycine betaine -> TMA METHYL Catabolism Aerobic -K21577 GrdC; glycine/sarcosine/betaine reductase complex component C subunit beta [EC:1.21.4.2;1.21.4.3;1.21.4.4] Glycine betaine -> TMA METHYL Catabolism Aerobic -K10672 GrdB; glycine reductase complex component B subunit gamma [EC:1.21.4.2] Glycine betaine -> TMA METHYL Catabolism Aerobic -K10671 GrdE; glycine reductase complex component B subunit alpha and beta [EC:1.21.4.2] Glycine betaine -> TMA METHYL Catabolism Aerobic -K21584 GrdF; sarcosine reductase complex component B subunit beta [EC:1.21.4.3] Glycine betaine -> TMA METHYL Catabolism Aerobic -K21583 GrdG; sarcosine reductase complex component B subunit alpha [EC:1.21.4.3] Glycine betaine -> TMA METHYL Catabolism Aerobic -K15229 MauB; methylamine dehydrogenase heavy chain [EC:1.4.9.1] Methylamine catabolism METHYL Catabolism -K15228 MauB; methylamine dehydrogenase light chain [EC:1.4.9.1] Methylamine catabolism METHYL Catabolism -K00317 dmd, tmd; dimethylamine/trimethylamine dehydrogenase [EC:1.5.8.1/2] Methylamine catabolism METHYL Catabolism -K18277 Tmm; trimethylamine monooxygenase [EC:1.14.13.148] Methylamine catabolism METHYL Catabolism -K07811 TorA; trimethylamine N-oxide reductase [ec:1.7.2.3] Methylamine catabolism METHYL Catabolism -14.1.2.32 trimethylamine N-oxide aldolase [EC:4.1.2.32] Methylamine catabolism METHYL Catabolism -K22081 MgsA; methylamine-glutamate N-methyltransferase subunit A [EC:2.1.1.21] Methylamine catabolism METHYL Catabolism -K08685 QhpA; quinohemoprotein amine dehydrogenase/methylamine dehydrogenase [EC:1.4.9.1] Methylamine catabolism METHYL Catabolism -K21310 MddA; methanethiol S-methyltransferase [EC:2.1.1.334] Methylsulfur methylotrophy METHYL Catabolism -2.1.1.251 MtsA; methylsulfide (DMS, MMPA) methyltransferase [EC:2.1.1.251] Methylsulfur methylotrophy METHYL Catabolism +K00479 GbcA; glycine betaine demehthylae, subunit A Glycine betaine -> dimethylglycine -> -> glycine METHYL Catabolism Aerobic +K21832 GbcB; glycine betaine demethylase, subunit B Glycine betaine -> dimethylglycine -> -> glycine METHYL Catabolism Aerobic +K00544 BHMT; betaine-homocysteine methyltransferase [EC:2.1.1.5] Glycine betaine -> dimethylglycine -> -> glycine METHYL Catabolism Aerobic +K24003 Stc2; stachydrine N-demethylase Proline betaine --> N-methylproline METHYL Catabolism Aerobic +K22551 hpba; N-methyl-L-proline demethylase [EC:1.5.3.-] Proline betaine --> N-methylproline -> proline METHYL Catabolism Aerobic +K21579 GrdH; betaine reductase complex component B subunit beta [EC:1.21.4.4] Glycine betaine -> TMA METHYL Catabolism Aerobic +K21578 GrdI; betaine reductase complex component B subunit alpha [EC:1.21.4.4] Glycine betaine -> TMA METHYL Catabolism Aerobic +K10670 GrdA; glycine/sarcosine/betaine reductase complex component A [EC:1.21.4.2;1.21.4.3;1.21.4.4] Glycine betaine -> TMA METHYL Catabolism Aerobic +K21576 GrdD; glycine/sarcosine/betaine reductase complex component C subunit alpha [EC:1.21.4.2;1.21.4.3;1.21.4.4] Glycine betaine -> TMA METHYL Catabolism Aerobic +K21577 GrdC; glycine/sarcosine/betaine reductase complex component C subunit beta [EC:1.21.4.2;1.21.4.3;1.21.4.4] Glycine betaine -> TMA METHYL Catabolism Aerobic +K10672 GrdB; glycine reductase complex component B subunit gamma [EC:1.21.4.2] Glycine betaine -> TMA METHYL Catabolism Aerobic +K10671 GrdE; glycine reductase complex component B subunit alpha and beta [EC:1.21.4.2] Glycine betaine -> TMA METHYL Catabolism Aerobic +K21584 GrdF; sarcosine reductase complex component B subunit beta [EC:1.21.4.3] Glycine betaine -> TMA METHYL Catabolism Aerobic +K21583 GrdG; sarcosine reductase complex component B subunit alpha [EC:1.21.4.3] Glycine betaine -> TMA METHYL Catabolism Aerobic +K15229 MauB; methylamine dehydrogenase heavy chain [EC:1.4.9.1] Methylamine catabolism METHYL Catabolism +K15228 MauB; methylamine dehydrogenase light chain [EC:1.4.9.1] Methylamine catabolism METHYL Catabolism +K00317 dmd, tmd; dimethylamine/trimethylamine dehydrogenase [EC:1.5.8.1/2] Methylamine catabolism METHYL Catabolism +K18277 Tmm; trimethylamine monooxygenase [EC:1.14.13.148] Methylamine catabolism METHYL Catabolism +K07811 TorA; trimethylamine N-oxide reductase [ec:1.7.2.3] Methylamine catabolism METHYL Catabolism +14.1.2.32 trimethylamine N-oxide aldolase [EC:4.1.2.32] Methylamine catabolism METHYL Catabolism +K22081 MgsA; methylamine-glutamate N-methyltransferase subunit A [EC:2.1.1.21] Methylamine catabolism METHYL Catabolism +K08685 QhpA; quinohemoprotein amine dehydrogenase/methylamine dehydrogenase [EC:1.4.9.1] Methylamine catabolism METHYL Catabolism +K21310 MddA; methanethiol S-methyltransferase [EC:2.1.1.334] Methylsulfur methylotrophy METHYL Catabolism +2.1.1.251 MtsA; methylsulfide (DMS, MMPA) methyltransferase [EC:2.1.1.251] Methylsulfur methylotrophy METHYL Catabolism METHYL_0026 MtsB; methylsulfide (DMS, MMPA) corrinoid binding protein Methylsulfur methylotrophy METHYL Catabolism MtsB_corrinoid_protein_Methanosarcina_barkeri_Q48925-1;MtsB_Mx_luminyensis_WP_019177442.1 METHYL_0027 dimethylsulfide:corrinoid methyltransferase, MtsD Methylsulfur methylotrophy METHYL Catabolism MtsD_MA0859_Methanosarcina_acetivorans_C2A_Q8TSD9-1 METHYL_0028 methanethiol:corrinoid methyltransferase, MtsF Methylsulfur methylotrophy METHYL Catabolism MtsF_MA4384_Methanosarcina_acetivorans_C2A_Q8THX4 @@ -150,18 +150,18 @@ METHYL_0029 methylsulfur-compound:corrinoid methyltransferase, MtsH Methylsulfur METHYL_0030 methylmercaptopropionate:corrinoid methyltransferase (MT1/2), MtpA Methylsulfur methylotrophy METHYL Catabolism MtpA_MA_4165_methylmercaptopropionate:corrinoid_methyltransferase_Methanosarcina_acetivorans METHYL_0031 methylmercaptopropionate corrinoid binding protein, MtpC Methylsulfur methylotrophy METHYL Catabolism MtpC_MA_4164_Methanosarcina_acetivorans_C2A_Q8TII5 METHYL_0032 RamS; reductive activase Methylsulfur methylotrophy METHYL Catabolism RamS_MA0489_Methanosarcina_acetivorans_c2a_Q8TSE9 -K04480 MtaB; methanol:corrinoid methyltransferase [EC:2.1.1.90] Methoxy methylotrophy METHYL Catabolism -K14081 MtaC; methanol corrinoid binding protein Methoxy methylotrophy METHYL Catabolism -K14080 MtaA; methanol specific methylcorrinoid:CoM methyltransferase [EC:2.1.1.246] Methoxy methylotrophy METHYL Catabolism -PF01208 MtvB; vanillate methyltransferase/O-demethytlase Methoxy methylotrophy METHYL Catabolism +K04480 MtaB; methanol:corrinoid methyltransferase [EC:2.1.1.90] Methoxy methylotrophy METHYL Catabolism +K14081 MtaC; methanol corrinoid binding protein Methoxy methylotrophy METHYL Catabolism +K14080 MtaA; methanol specific methylcorrinoid:CoM methyltransferase [EC:2.1.1.246] Methoxy methylotrophy METHYL Catabolism +PF01208 MtvB; vanillate methyltransferase/O-demethytlase Methoxy methylotrophy METHYL Catabolism METHYL_0033 MtvC; vanillate/O-demethylase corrinoid binding protein Methoxy methylotrophy METHYL Catabolism MtvC_vanilate_corrinoid/methoxy_corrinoid_Syntrophaceticus_schinkii_A0A0B7MDG8-1;MtvC_Moorella_thermoacetica_Q2RLG8 METHYL_0034 MtvA; vanillate/O-demethylse specific methylcorrinoid:THF methyltransferase Methoxy methylotrophy METHYL Catabolism MtvA;_vanillate/O-demethylse_specific_methylcorrinoid:THF_methyltransferase uncultured_Treponema -O87604 OdmB; vanillate methyltransferase [PFAM:O87604] Methoxy methylotrophy METHYL Catabolism +O87604 OdmB; vanillate methyltransferase [PFAM:O87604] Methoxy methylotrophy METHYL Catabolism METHYL_0035 vanillate corrinoid binding protein, OdmA Methoxy methylotrophy METHYL Catabolism OdmA_vanillate_corrinoid_Acetobacterium_dehalogenans_O87603-1 -PF00809 OdmD; vanillate specific methylcorrinoid:THF methyltransferase Methoxy methylotrophy METHYL Catabolism -PF14574 Odmc; methoxy-specific reductivase activase/Activating Enzyme Methoxy methylotrophy METHYL Catabolism -PF00111 Odmc; methoxy-specific reductivase activase/Activating Enzyme Methoxy methylotrophy METHYL Catabolism -PF17651 Odmc; methoxy-specific reductivase activase/Activating Enzyme Methoxy methylotrophy METHYL Catabolism +PF00809 OdmD; vanillate specific methylcorrinoid:THF methyltransferase Methoxy methylotrophy METHYL Catabolism +PF14574 Odmc; methoxy-specific reductivase activase/Activating Enzyme Methoxy methylotrophy METHYL Catabolism +PF00111 Odmc; methoxy-specific reductivase activase/Activating Enzyme Methoxy methylotrophy METHYL Catabolism +PF17651 Odmc; methoxy-specific reductivase activase/Activating Enzyme Methoxy methylotrophy METHYL Catabolism METHYL_0036 VdmB; veratrole corrinoid methyltransferase Methoxy methylotrophy METHYL Catabolism VdmB_veratrole_corrinoid_methyltransferase_Acetobacterium_dehalogenans_Q6W001-1 METHYL_0037 VdmA; veratole corrinoid binding protein Methoxy methylotrophy METHYL Catabolism Vdma_veratrole_corrinoid_Acetobacterium_dehalogenans_Q6W002-1 METHYL_0038 VdmD; veratrole specific methylcorrinoid:THF methyltransferase Methoxy methylotrophy METHYL Catabolism VdmD;_veratrole_specific_methylcorrinoid:THF_methyltransferase_Acetobacterium_dehalogenans_Q6W003 @@ -169,7 +169,7 @@ METHYL_0039 SECO (secoisolariciresinol) corrinoid methyltransferase, E. limosum METHYL_0040 SECO (secoisolariciresinol) corrinoid binding protein, E. limosum ZL-II, ELI_2004 Methoxy methylotrophy METHYL Catabolism SECO_secoisolariciresinol_corrinoid_E._limosum_ZL-II,_ELI_2004 METHYL_0041 SECO (secoisolariciresinol) methylcorrinoid:THF, E. limosum ZL-II, ELI_2005 Methoxy methylotrophy METHYL Catabolism SECO_(secoisolariciresinol)_methylcorrinoid:THF,_E._limosum_ZL-II,_ELI_2005 METHYL_0042 SECO corrinoid binding protein reductive activase/AE,E. limosum ZL-II, ELI_0370 Methoxy methylotrophy METHYL Catabolism SECO_corrinoid_binding_protein_reductive_activase/AE,E._limosum_ZL-II,_ELI_0370 -PF01208 MtoB; methoxy corrinoid methyltransferase Methoxy methylotrophy METHYL Catabolism +PF01208 MtoB; methoxy corrinoid methyltransferase Methoxy methylotrophy METHYL Catabolism METHYL_0043 MtoC; methoxy corrinoid binding protein Methoxy methylotrophy METHYL Catabolism MtoC_AF_0006_Archaeoglobus_fulgidus_DSM_4304_AAB91221.1;MtoC_Archaeoglobus_fulgidus_DSM_4304_methoxy_compounds_including_2-methoxyphenol_AAB91218.1_NCBI_mtac2 METHYL_0044 MtoA; methoxy specific methylcorrinoid:H4MPT methyltranferase (AF_0009) Methoxy methylotrophy METHYL Catabolism MtoA_or_mtrH_AF_0009_Archaeoglobus_fulgidus_DSM_4304_WP_010877523.1;MtoA;_methoxy_specific_methylcorrinoid:H4MPT_methyltranferase_(AF_0009) _Archaeoglobus_fulgidus_DSM_4304_ AAB91219.1 METHYL_0045 O-demethylase D. hafniense DCB2, methyltransferase Dhaf_4610 Methoxy methylotrophy METHYL Catabolism O-demethylase_D._hafniense_DCB2_corrinoid_dep_MT_Dhaf_4610_including_vanillate_isovanillate_syringate_guaiacol_methylchloride diff --git a/bin/assets/forms/distill_sheets/test-1-multiple-gene-id.tsv b/bin/assets/forms/distill_sheets/test-1-multiple-gene-id.tsv old mode 100755 new mode 100644 diff --git a/bin/assets/forms/distill_sheets/test-2-multiple-gene-id.csv b/bin/assets/forms/distill_sheets/test-2-multiple-gene-id.csv old mode 100755 new mode 100644 diff --git a/bin/assets/forms/distill_sheets/test-2-topic.tsv b/bin/assets/forms/distill_sheets/test-2-topic.tsv old mode 100755 new mode 100644 diff --git a/bin/assets/forms/distill_sheets/test-3-EC.tsv b/bin/assets/forms/distill_sheets/test-3-EC.tsv old mode 100755 new mode 100644 diff --git a/bin/assets/forms/etc_module_database.20220928.tsv b/bin/assets/forms/etc_module_database.20220928.tsv old mode 100755 new mode 100644 diff --git a/bin/assets/forms/function_heatmap_form.20220928.tsv b/bin/assets/forms/function_heatmap_form.20220928.tsv old mode 100755 new mode 100644 diff --git a/bin/assets/forms/genome_summary_form.tsv b/bin/assets/forms/genome_summary_form.tsv old mode 100755 new mode 100644 index fd864383..2e72783a --- a/bin/assets/forms/genome_summary_form.tsv +++ b/bin/assets/forms/genome_summary_form.tsv @@ -1,4 +1,4 @@ -gene_id gene_description pathway topic_ecosystem category subcategory potential_amg +gene_id gene_description pathway topic_ecosystem category subcategory potential_amg K02981 small subunit ribosomal protein S2e Ribosome, eukaryotes MISC Information systems TRUE K02985 small subunit ribosomal protein S3e Ribosome, eukaryotes MISC Information systems TRUE K02984 small subunit ribosomal protein S3Ae Ribosome, eukaryotes MISC Information systems TRUE diff --git a/bin/assets/forms/module_step_form.20220928.tsv b/bin/assets/forms/module_step_form.20220928.tsv old mode 100755 new mode 100644 index 8cc51882..20241ed1 --- a/bin/assets/forms/module_step_form.20220928.tsv +++ b/bin/assets/forms/module_step_form.20220928.tsv @@ -191,7 +191,7 @@ enoyl-CoA hydratase [EC:4.2.1.17] [RN:R03045] K07515 M00013 Malonate semialdehyd multifunctional beta-oxidation protein [EC:4.2.1.-] [RN:R03045] K14729 M00013 Malonate semialdehyde pathway, propanoyl-CoA => acetyl-CoA 1,3 C05668 3-Hydroxypropionyl-CoA C00894 Propenoyl-CoA 3-hydroxyisobutyryl-CoA hydrolase [EC:3.1.2.4] [RN:R03157 R03158] K05605 M00013 Malonate semialdehyde pathway, propanoyl-CoA => acetyl-CoA 2,0 C01013 3-Hydroxypropanoate C05668 3-Hydroxypropionyl-CoA 3-hydroxypropionate dehydrogenase [EC:1.1.1.59] [RN:R01608] K23146 M00013 Malonate semialdehyde pathway, propanoyl-CoA => acetyl-CoA 3,0 C00222 3-Oxopropanoate C01013 3-Hydroxypropanoate -malonate-semialdehyde dehydrogenase (acetylating) [EC:1.2.1.18] [RN:R00740] K00140 M00013 Malonate semialdehyde pathway, propanoyl-CoA => acetyl-CoA 4,0 +malonate-semialdehyde dehydrogenase (acetylating) [EC:1.2.1.18] [RN:R00740] K00140 M00013 Malonate semialdehyde pathway, propanoyl-CoA => acetyl-CoA 4,0 UDPglucose 6-dehydrogenase [EC:1.1.1.22] [RN:R00286] K00012 M00014 Glucuronate pathway (uronate pathway) 0,0 C00167 UDP-glucuronate C00029 UDP-glucose UDP-sugar pyrophosphorylase [EC:2.7.7.64] [RN:R01381] K12447 M00014 Glucuronate pathway (uronate pathway) 1,0,0,0 C05385 D-Glucuronate 1-phosphate C00167 UDP-glucuronate glucuronokinase [EC:2.7.1.43] [RN:R01476] K16190 M00014 Glucuronate pathway (uronate pathway) 1,0,1,0 C00191 D-Glucuronate C05385 D-Glucuronate 1-phosphate @@ -458,7 +458,7 @@ kynureninase [EC:3.7.1.3] [RN:R02668] K01556 M00038 Tryptophan metabolism, trypt aminocarboxymuconate-semialdehyde decarboxylase [EC:4.1.1.45] [RN:R04323] K03392 M00038 Tryptophan metabolism, tryptophan => kynurenine => 2-aminomuconate 5,0 C03824 2-Aminomuconate semialdehyde C04409 2-Amino-3-carboxymuconate semialdehyde aminomuconate-semialdehyde dehydrogenase [EC:1.2.1.32] [RN:R03889] K10217 M00038 Tryptophan metabolism, tryptophan => kynurenine => 2-aminomuconate 6,0 C02220 2-Aminomuconate C03824 2-Aminomuconate semialdehyde aminomuconate-semialdehyde dehydrogenase [EC:1.2.1.32] [RN:R03889] K23234 M00038 Tryptophan metabolism, tryptophan => kynurenine => 2-aminomuconate 6,1 C02220 2-Aminomuconate C03824 2-Aminomuconate semialdehyde -phenylalanine ammonia-lyase [EC:4.3.1.24] [RN:R00679] K10775 M00039 Monolignol biosynthesis, phenylalanine/tyrosine => monolignol 0,0 +phenylalanine ammonia-lyase [EC:4.3.1.24] [RN:R00679] K10775 M00039 Monolignol biosynthesis, phenylalanine/tyrosine => monolignol 0,0 phenylalanine/tyrosine ammonia-lyase [EC:4.3.1.25] [RN:R00697 R00737] K13064 M00039 Monolignol biosynthesis, phenylalanine/tyrosine => monolignol 0,1 C00811 4-Coumarate C00082 L-Tyrosine trans-cinnamate 4-monooxygenase [EC:1.14.14.91] [RN:R02253] K00487 M00039 Monolignol biosynthesis, phenylalanine/tyrosine => monolignol 1,0 C00811 4-Coumarate C00423 trans-Cinnamate 4-coumarate--CoA ligase [EC:6.2.1.12] [RN:R01616 R01943] K01904 M00039 Monolignol biosynthesis, phenylalanine/tyrosine => monolignol 2,0 C00223 p-Coumaroyl-CoA C00811 4-Coumarate @@ -626,11 +626,11 @@ glucuronyltransferase [EC:2.4.1.225] [RN:R05935] K02366 M00059 Glycosaminoglycan glucuronyltransferase [EC:2.4.1.225] [RN:R05935] K02367 M00059 Glycosaminoglycan biosynthesis, heparan sulfate backbone 1,1 G00163 (Gal)2 (GlcA)2 (GlcNAc)1 (Xyl)1 (Ser)1 G00162 (Gal)2 (GlcA)1 (GlcNAc)1 (Xyl)1 (Ser)1 alpha-1,4-N-acetylglucosaminyltransferase [EC:2.4.1.224] [RN:R05936] K02368 M00059 Glycosaminoglycan biosynthesis, heparan sulfate backbone 2,0 G00164 (Gal)2 (GlcA)2 (GlcNAc)2 (Xyl)1 (Ser)1 G00163 (Gal)2 (GlcA)2 (GlcNAc)1 (Xyl)1 (Ser)1 alpha-1,4-N-acetylglucosaminyltransferase [EC:2.4.1.223] [RN:R05930] K02370 M00059 Glycosaminoglycan biosynthesis, heparan sulfate backbone 2,1 G00162 (Gal)2 (GlcA)1 (GlcNAc)1 (Xyl)1 (Ser)1 G00157 (Gal)2 (GlcA)1 (Xyl)1 (Ser)1 -heparan sulfate N-deacetylase/N-sulfotransferase NDST [EC:3.1.1.- 2.8.2.-] K02576 M00059 Glycosaminoglycan biosynthesis, heparan sulfate backbone 3,0 -heparan sulfate N-deacetylase/N-sulfotransferase NDST [EC:3.1.1.- 2.8.2.-] K02577 M00059 Glycosaminoglycan biosynthesis, heparan sulfate backbone 3,1 -heparan sulfate N-deacetylase/N-sulfotransferase NDST [EC:3.1.1.- 2.8.2.-] K02578 M00059 Glycosaminoglycan biosynthesis, heparan sulfate backbone 3,2 -heparan sulfate N-deacetylase/N-sulfotransferase NDST [EC:3.1.1.- 2.8.2.-] K02579 M00059 Glycosaminoglycan biosynthesis, heparan sulfate backbone 3,3 -heparosan-N-sulfate-glucuronate 5-epimerase [EC:5.1.3.17] K01793 M00059 Glycosaminoglycan biosynthesis, heparan sulfate backbone 4,0 +heparan sulfate N-deacetylase/N-sulfotransferase NDST [EC:3.1.1.- 2.8.2.-] K02576 M00059 Glycosaminoglycan biosynthesis, heparan sulfate backbone 3,0 +heparan sulfate N-deacetylase/N-sulfotransferase NDST [EC:3.1.1.- 2.8.2.-] K02577 M00059 Glycosaminoglycan biosynthesis, heparan sulfate backbone 3,1 +heparan sulfate N-deacetylase/N-sulfotransferase NDST [EC:3.1.1.- 2.8.2.-] K02578 M00059 Glycosaminoglycan biosynthesis, heparan sulfate backbone 3,2 +heparan sulfate N-deacetylase/N-sulfotransferase NDST [EC:3.1.1.- 2.8.2.-] K02579 M00059 Glycosaminoglycan biosynthesis, heparan sulfate backbone 3,3 +heparosan-N-sulfate-glucuronate 5-epimerase [EC:5.1.3.17] K01793 M00059 Glycosaminoglycan biosynthesis, heparan sulfate backbone 4,0 lpxA; UDP-N-acetylglucosamine acyltransferase [EC:2.3.1.129] [RN:R04567] K00677 M00060 KDO2-lipid A biosynthesis, Raetz pathway, LpxL-LpxM type 0,0 C04738 UDP-3-O-(3-hydroxytetradecanoyl)-N-acetylglucosamine C00043 UDP-N-acetyl-D-glucosamine lpxC; UDP-3-O-[3-hydroxymyristoyl] N-acetylglucosamine deacetylase [EC:3.5.1.108] [RN:R04587] K02535 M00060 KDO2-lipid A biosynthesis, Raetz pathway, LpxL-LpxM type 1,0 C06022 UDP-3-O-(3-hydroxytetradecanoyl)-D-glucosamine C04738 UDP-3-O-(3-hydroxytetradecanoyl)-N-acetylglucosamine lpxD; UDP-3-O-[3-hydroxymyristoyl] glucosamine N-acyltransferase [EC:2.3.1.191] [RN:R04550] K02536 M00060 KDO2-lipid A biosynthesis, Raetz pathway, LpxL-LpxM type 2,0 C04652 UDP-2,3-bis(3-hydroxytetradecanoyl)glucosamine C06022 UDP-3-O-(3-hydroxytetradecanoyl)-D-glucosamine @@ -701,48 +701,48 @@ OST3; oligosaccharyltransferase complex subunit gamma K12669 M00072 N-glycosylat WBP1; oligosaccharyltransferase complex subunit beta K12670 M00072 N-glycosylation by oligosaccharyltransferase 0,0 C00621,G00009 Dolichyl diphosphate, G00008,C03021 ,Protein asparagine OST4; oligosaccharyl transferase complex subunit OST4 K00730 M00072 N-glycosylation by oligosaccharyltransferase 0,0 C00621,G00009 Dolichyl diphosphate, G00008,C03021 ,Protein asparagine OST5; oligosaccharyl transferase complex subunit OST5 K12691 M00072 N-glycosylation by oligosaccharyltransferase 0,0 C00621,G00009 Dolichyl diphosphate, G00008,C03021 ,Protein asparagine -mannosyl-oligosaccharide glucosidase [EC:3.2.1.106] [RN:R05979] K01228 M00073 N-glycan precursor trimming 0,0 G00171 G00009 -alpha 1,3-glucosidase [EC:3.2.1.84] [RN:R05980 R05981] K05546 M00073 N-glycan precursor trimming 1,0 G00011 G00010 -mannosyl-oligosaccharide alpha-1,2-mannosidase [EC:3.2.1.113] [RN:R05982] K01230 M00073 N-glycan precursor trimming 2,0 G00012 G00011 -alpha 1,3-glucosidase [EC:3.2.1.84] [RN:R05980 R05981] K05546 M00074 N-glycan biosynthesis, high-mannose type 0,0 G00011 G00010 -mannosyl-oligosaccharide alpha-1,2-mannosidase [EC:3.2.1.113] [RN:R05982 R06722] K01230 M00074 N-glycan biosynthesis, high-mannose type 1,0 G10694 G00011 -alpha 1,6-mannosyltransferase [EC:2.4.1.232] [RN:R08599] K05528 M00074 N-glycan biosynthesis, high-mannose type 2,0 G01813 G10694 -mannan polymerase I complexes [EC:2.4.1.232] K05529 M00074 N-glycan biosynthesis, high-mannose type 3,0 -mannan polymerase I complexes [EC:2.4.1.232] K05530 M00074 N-glycan biosynthesis, high-mannose type 3,0 -mannan polymerase I complexes [EC:2.4.1.232] K05529 M00074 N-glycan biosynthesis, high-mannose type 4,0 -mannan polymerase II complex [EC:2.4.1.232] K05531 M00074 N-glycan biosynthesis, high-mannose type 4,0 -mannan polymerase II complex [EC:2.4.1.232] K05532 M00074 N-glycan biosynthesis, high-mannose type 4,0 -mannan polymerase II complex [EC:2.4.1.232] K05533 M00074 N-glycan biosynthesis, high-mannose type 4,0 -mannan polymerase II complex [EC:2.4.1.232] K05534 M00074 N-glycan biosynthesis, high-mannose type 4,0 -alpha 1,2-mannosyltransferase [EC:2.4.1.-] K05535 M00074 N-glycan biosynthesis, high-mannose type 5,0 -glycoprotein 6-alpha-L-fucosyltransferase [EC:2.4.1.68] [RN:R05988] K00717 M00075 N-glycan biosynthesis, complex type 0,0 G00016 G00015 -beta-1,4-galactosyltransferase [EC:2.4.1.38] [RN:R05989] K07966 M00075 N-glycan biosynthesis, complex type 1,0 G00017 G00016 -beta-1,4-galactosyltransferase [EC:2.4.1.38] [RN:R05989] K07967 M00075 N-glycan biosynthesis, complex type 1,1 G00017 G00016 -beta-1,4-galactosyltransferase [EC:2.4.1.38] [RN:R05989] K07968 M00075 N-glycan biosynthesis, complex type 1,2 G00017 G00016 -beta-galactoside alpha-2,6-sialyltransferase [EC:2.4.99.1] [RN:R05990] K00778 M00075 N-glycan biosynthesis, complex type 2,0 G00018 G00017 -beta-galactoside alpha-2,6-sialyltransferase [EC:2.4.99.1] [RN:R05990] K00779 M00075 N-glycan biosynthesis, complex type 2,1 G00018 G00017 -iduronate 2-sulfatase [EC:3.1.6.13] [RN:R07821] K01136 M00076 Dermatan sulfate degradation 1,0 G13042 G13041 -L-iduronidase [EC:3.2.1.76] [RN:R07822] K01217 M00076 Dermatan sulfate degradation 2,0 G12336 G13042 -arylsulfatase B [EC:3.1.6.12] [RN:R07823] K01135 M00076 Dermatan sulfate degradation 3,0 G13043 G12336 -hyaluronoglucosaminidase [EC:3.2.1.35] [RN:R07824] K01197 M00076 Dermatan sulfate degradation 4,0 G00872 DWA-2 G13043 -beta-glucuronidase [EC:3.2.1.31] K01195 M00076 Dermatan sulfate degradation 5,0 -arylsulfatase B [EC:3.1.6.12] [RN:R07823] K01135 M00077 Chondroitin sulfate degradation 0,0 G13043 G12336 -hyaluronoglucosaminidase [EC:3.2.1.35] [RN:R07824] K01197 M00077 Chondroitin sulfate degradation 1,0 G00872 DWA-2 G13043 -beta-glucuronidase [EC:3.2.1.31] K01195 M00077 Chondroitin sulfate degradation 2,0 -N-acetylgalactosamine-6-sulfatase [EC:3.1.6.4] K01132 M00077 Chondroitin sulfate degradation 3,0 +mannosyl-oligosaccharide glucosidase [EC:3.2.1.106] [RN:R05979] K01228 M00073 N-glycan precursor trimming 0,0 G00171 G00009 +alpha 1,3-glucosidase [EC:3.2.1.84] [RN:R05980 R05981] K05546 M00073 N-glycan precursor trimming 1,0 G00011 G00010 +mannosyl-oligosaccharide alpha-1,2-mannosidase [EC:3.2.1.113] [RN:R05982] K01230 M00073 N-glycan precursor trimming 2,0 G00012 G00011 +alpha 1,3-glucosidase [EC:3.2.1.84] [RN:R05980 R05981] K05546 M00074 N-glycan biosynthesis, high-mannose type 0,0 G00011 G00010 +mannosyl-oligosaccharide alpha-1,2-mannosidase [EC:3.2.1.113] [RN:R05982 R06722] K01230 M00074 N-glycan biosynthesis, high-mannose type 1,0 G10694 G00011 +alpha 1,6-mannosyltransferase [EC:2.4.1.232] [RN:R08599] K05528 M00074 N-glycan biosynthesis, high-mannose type 2,0 G01813 G10694 +mannan polymerase I complexes [EC:2.4.1.232] K05529 M00074 N-glycan biosynthesis, high-mannose type 3,0 +mannan polymerase I complexes [EC:2.4.1.232] K05530 M00074 N-glycan biosynthesis, high-mannose type 3,0 +mannan polymerase I complexes [EC:2.4.1.232] K05529 M00074 N-glycan biosynthesis, high-mannose type 4,0 +mannan polymerase II complex [EC:2.4.1.232] K05531 M00074 N-glycan biosynthesis, high-mannose type 4,0 +mannan polymerase II complex [EC:2.4.1.232] K05532 M00074 N-glycan biosynthesis, high-mannose type 4,0 +mannan polymerase II complex [EC:2.4.1.232] K05533 M00074 N-glycan biosynthesis, high-mannose type 4,0 +mannan polymerase II complex [EC:2.4.1.232] K05534 M00074 N-glycan biosynthesis, high-mannose type 4,0 +alpha 1,2-mannosyltransferase [EC:2.4.1.-] K05535 M00074 N-glycan biosynthesis, high-mannose type 5,0 +glycoprotein 6-alpha-L-fucosyltransferase [EC:2.4.1.68] [RN:R05988] K00717 M00075 N-glycan biosynthesis, complex type 0,0 G00016 G00015 +beta-1,4-galactosyltransferase [EC:2.4.1.38] [RN:R05989] K07966 M00075 N-glycan biosynthesis, complex type 1,0 G00017 G00016 +beta-1,4-galactosyltransferase [EC:2.4.1.38] [RN:R05989] K07967 M00075 N-glycan biosynthesis, complex type 1,1 G00017 G00016 +beta-1,4-galactosyltransferase [EC:2.4.1.38] [RN:R05989] K07968 M00075 N-glycan biosynthesis, complex type 1,2 G00017 G00016 +beta-galactoside alpha-2,6-sialyltransferase [EC:2.4.99.1] [RN:R05990] K00778 M00075 N-glycan biosynthesis, complex type 2,0 G00018 G00017 +beta-galactoside alpha-2,6-sialyltransferase [EC:2.4.99.1] [RN:R05990] K00779 M00075 N-glycan biosynthesis, complex type 2,1 G00018 G00017 +iduronate 2-sulfatase [EC:3.1.6.13] [RN:R07821] K01136 M00076 Dermatan sulfate degradation 1,0 G13042 G13041 +L-iduronidase [EC:3.2.1.76] [RN:R07822] K01217 M00076 Dermatan sulfate degradation 2,0 G12336 G13042 +arylsulfatase B [EC:3.1.6.12] [RN:R07823] K01135 M00076 Dermatan sulfate degradation 3,0 G13043 G12336 +hyaluronoglucosaminidase [EC:3.2.1.35] [RN:R07824] K01197 M00076 Dermatan sulfate degradation 4,0 G00872 DWA-2 G13043 +beta-glucuronidase [EC:3.2.1.31] K01195 M00076 Dermatan sulfate degradation 5,0 +arylsulfatase B [EC:3.1.6.12] [RN:R07823] K01135 M00077 Chondroitin sulfate degradation 0,0 G13043 G12336 +hyaluronoglucosaminidase [EC:3.2.1.35] [RN:R07824] K01197 M00077 Chondroitin sulfate degradation 1,0 G00872 DWA-2 G13043 +beta-glucuronidase [EC:3.2.1.31] K01195 M00077 Chondroitin sulfate degradation 2,0 +N-acetylgalactosamine-6-sulfatase [EC:3.1.6.4] K01132 M00077 Chondroitin sulfate degradation 3,0 heparanase [EC:3.2.1.166 3.2.1.-] [RN:R07811] K07964 M00078 Heparan sulfate degradation 0,0 G13034 C00925 Heparan sulfate heparanase [EC:3.2.1.166 3.2.1.-] [RN:R07811] K07965 M00078 Heparan sulfate degradation 0,1 G13034 C00925 Heparan sulfate -iduronate 2-sulfatase [EC:3.1.6.13] [RN:R07812] K01136 M00078 Heparan sulfate degradation 1,0 G13035 G13034 -L-iduronidase [EC:3.2.1.76] [RN:R07813] K01217 M00078 Heparan sulfate degradation 2,0 G13036 G13035 -N-sulfoglucosamine sulfohydrolase [EC:3.10.1.1] [RN:R07814] K01565 M00078 Heparan sulfate degradation 3,0 G13037 G13036 -heparan-alpha-glucosaminide N-acetyltransferase [EC:2.3.1.78] [RN:R07815] K10532 M00078 Heparan sulfate degradation 4,0 G13038 G13037 -alpha-N-acetylglucosaminidase [EC:3.2.1.50] [RN:R07816] K01205 M00078 Heparan sulfate degradation 5,0 G13039 G13038 -beta-glucuronidase [EC:3.2.1.31] [RN:R07818] K01195 M00078 Heparan sulfate degradation 7,0 G09660 G13040 -N-acetylglucosamine-6-sulfatase [EC:3.1.6.14] [RN:R07819] K01137 M00078 Heparan sulfate degradation 8,0 G02632 G09660 -N-acetylgalactosamine-6-sulfatase [EC:3.1.6.4] [RN:R07806] K01132 M00079 Keratan sulfate degradation 1,0 G01977 G01945 -beta-galactosidase [EC:3.2.1.23] [RN:R07807] K12309 M00079 Keratan sulfate degradation 2,0 G13073 G01977 -N-acetylglucosamine-6-sulfatase [EC:3.1.6.14] [RN:R07808] K01137 M00079 Keratan sulfate degradation 3,0 G13074 G13073 -beta-hexosaminidase [EC:3.2.1.52] [RN:R07809 R07810] K12373 M00079 Keratan sulfate degradation 4,0 G01391 G13073 +iduronate 2-sulfatase [EC:3.1.6.13] [RN:R07812] K01136 M00078 Heparan sulfate degradation 1,0 G13035 G13034 +L-iduronidase [EC:3.2.1.76] [RN:R07813] K01217 M00078 Heparan sulfate degradation 2,0 G13036 G13035 +N-sulfoglucosamine sulfohydrolase [EC:3.10.1.1] [RN:R07814] K01565 M00078 Heparan sulfate degradation 3,0 G13037 G13036 +heparan-alpha-glucosaminide N-acetyltransferase [EC:2.3.1.78] [RN:R07815] K10532 M00078 Heparan sulfate degradation 4,0 G13038 G13037 +alpha-N-acetylglucosaminidase [EC:3.2.1.50] [RN:R07816] K01205 M00078 Heparan sulfate degradation 5,0 G13039 G13038 +beta-glucuronidase [EC:3.2.1.31] [RN:R07818] K01195 M00078 Heparan sulfate degradation 7,0 G09660 G13040 +N-acetylglucosamine-6-sulfatase [EC:3.1.6.14] [RN:R07819] K01137 M00078 Heparan sulfate degradation 8,0 G02632 G09660 +N-acetylgalactosamine-6-sulfatase [EC:3.1.6.4] [RN:R07806] K01132 M00079 Keratan sulfate degradation 1,0 G01977 G01945 +beta-galactosidase [EC:3.2.1.23] [RN:R07807] K12309 M00079 Keratan sulfate degradation 2,0 G13073 G01977 +N-acetylglucosamine-6-sulfatase [EC:3.1.6.14] [RN:R07808] K01137 M00079 Keratan sulfate degradation 3,0 G13074 G13073 +beta-hexosaminidase [EC:3.2.1.52] [RN:R07809 R07810] K12373 M00079 Keratan sulfate degradation 4,0 G01391 G13073 pectinesterase [EC:3.1.1.11] [RN:R02362] K01051 M00081 Pectin degradation 0,0 C00470 Pectate C00714 Pectin polygalacturonase [EC:3.2.1.15] [RN:R02360] K01184 M00081 Pectin degradation 1,0 C02273 Digalacturonate C00470 Pectate galacturan 1,4-alpha-galacturonidase [EC:3.2.1.67] [RN:R07413] K01213 M00081 Pectin degradation 2,0 C00333 D-Galacturonate C02273 Digalacturonate @@ -1166,17 +1166,17 @@ ND4; NADH-ubiquinone oxidoreductase chain 4 [EC:7.1.1.2] K03881 M00142 NADH:ubiq ND4L; NADH-ubiquinone oxidoreductase chain 4L [EC:7.1.1.2] K03882 M00142 NADH:ubiquinone oxidoreductase, mitochondria 0,0 C00390,C00003 Ubiquinol,NAD+ C00399,C00004 Ubiquinone,NADH ND5; NADH-ubiquinone oxidoreductase chain 5 [EC:7.1.1.2] K03883 M00142 NADH:ubiquinone oxidoreductase, mitochondria 0,0 C00390,C00003 Ubiquinol,NAD+ C00399,C00004 Ubiquinone,NADH ND6; NADH-ubiquinone oxidoreductase chain 6 [EC:7.1.1.2] K03884 M00142 NADH:ubiquinone oxidoreductase, mitochondria 0,0 C00390,C00003 Ubiquinol,NAD+ C00399,C00004 Ubiquinone,NADH -NDUFS1; NADH dehydrogenase (ubiquinone) Fe-S protein 1 [EC:7.1.1.2 1.6.99.3] K03934 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 -NDUFS2; NADH dehydrogenase (ubiquinone) Fe-S protein 2 [EC:7.1.1.2 1.6.99.3] K03935 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 -NDUFS3; NADH dehydrogenase (ubiquinone) Fe-S protein 3 [EC:7.1.1.2 1.6.99.3] K03936 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 -NDUFS4; NADH dehydrogenase (ubiquinone) Fe-S protein 4 K03937 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 -NDUFS5; NADH dehydrogenase (ubiquinone) Fe-S protein 5 K03938 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 -NDUFS6; NADH dehydrogenase (ubiquinone) Fe-S protein 6 K03939 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 -NDUFS7; NADH dehydrogenase (ubiquinone) Fe-S protein 7 [EC:7.1.1.2 1.6.99.3] K03940 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 -NDUFS8; NADH dehydrogenase (ubiquinone) Fe-S protein 8 [EC:7.1.1.2 1.6.99.3] K03941 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 -NDUFV1; NADH dehydrogenase (ubiquinone) flavoprotein 1 [EC:7.1.1.2 1.6.99.3] K03942 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 -NDUFV2; NADH dehydrogenase (ubiquinone) flavoprotein 2 [EC:7.1.1.2 1.6.99.3] K03943 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 -NDUFV3; NADH dehydrogenase (ubiquinone) flavoprotein 3 K03944 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 +NDUFS1; NADH dehydrogenase (ubiquinone) Fe-S protein 1 [EC:7.1.1.2 1.6.99.3] K03934 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 +NDUFS2; NADH dehydrogenase (ubiquinone) Fe-S protein 2 [EC:7.1.1.2 1.6.99.3] K03935 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 +NDUFS3; NADH dehydrogenase (ubiquinone) Fe-S protein 3 [EC:7.1.1.2 1.6.99.3] K03936 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 +NDUFS4; NADH dehydrogenase (ubiquinone) Fe-S protein 4 K03937 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 +NDUFS5; NADH dehydrogenase (ubiquinone) Fe-S protein 5 K03938 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 +NDUFS6; NADH dehydrogenase (ubiquinone) Fe-S protein 6 K03939 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 +NDUFS7; NADH dehydrogenase (ubiquinone) Fe-S protein 7 [EC:7.1.1.2 1.6.99.3] K03940 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 +NDUFS8; NADH dehydrogenase (ubiquinone) Fe-S protein 8 [EC:7.1.1.2 1.6.99.3] K03941 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 +NDUFV1; NADH dehydrogenase (ubiquinone) flavoprotein 1 [EC:7.1.1.2 1.6.99.3] K03942 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 +NDUFV2; NADH dehydrogenase (ubiquinone) flavoprotein 2 [EC:7.1.1.2 1.6.99.3] K03943 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 +NDUFV3; NADH dehydrogenase (ubiquinone) flavoprotein 3 K03944 M00143 NADH dehydrogenase (ubiquinone) Fe-S protein/flavoprotein complex, mitochondria 0,0 nuoA; NADH-quinone oxidoreductase subunit A [EC:7.1.1.2] K00330 M00144 NADH:quinone oxidoreductase, prokaryotes 0,0 C00390,C00003 Ubiquinol,NAD+ C00399,C00004 Ubiquinone,NADH nuoB; NADH-quinone oxidoreductase subunit B [EC:7.1.1.2] K00331 M00144 NADH:quinone oxidoreductase, prokaryotes 0,0 C00390,C00003 Ubiquinol,NAD+ C00399,C00004 Ubiquinone,NADH nuoC; NADH-quinone oxidoreductase subunit C [EC:7.1.1.2] K00332 M00144 NADH:quinone oxidoreductase, prokaryotes 0,0 C00390,C00003 Ubiquinol,NAD+ C00399,C00004 Ubiquinone,NADH @@ -1209,33 +1209,33 @@ ndhB; NAD(P)H-quinone oxidoreductase subunit 2 [EC:7.1.1.2] K05573 M00145 NAD(P) ndhL; NAD(P)H-quinone oxidoreductase subunit L [EC:7.1.1.2] K05583 M00145 NAD(P)H:quinone oxidoreductase, chloroplasts and cyanobacteria 0,0 C00390,C00003 Ubiquinol,NAD+ C00399,C00004 Ubiquinone,NADH ndhM; NAD(P)H-quinone oxidoreductase subunit M [EC:7.1.1.2] K05584 M00145 NAD(P)H:quinone oxidoreductase, chloroplasts and cyanobacteria 0,0 C00390,C00003 Ubiquinol,NAD+ C00399,C00004 Ubiquinone,NADH ndhN; NAD(P)H-quinone oxidoreductase subunit N [EC:7.1.1.2] K05585 M00145 NAD(P)H:quinone oxidoreductase, chloroplasts and cyanobacteria 0,0 C00390,C00003 Ubiquinol,NAD+ C00399,C00004 Ubiquinone,NADH -NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 1 K03945 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 2 K03946 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 3 K03947 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 4 K03948 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 5 K03949 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 6 K03950 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 7 K03951 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 8 K03952 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 9 K03953 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 10 K03954 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 alpha/beta subcomplex 1 K03955 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 -NADH-ubiquinone oxidoreductase subunit K03956 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 12 K11352 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 13 K11353 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 beta subcomplex 1 K03957 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 beta subcomplex 2 K03958 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 beta subcomplex 3 K03959 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 beta subcomplex 4 K03960 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 beta subcomplex 5 K03961 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 beta subcomplex 6 K03962 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 beta subcomplex 7 K03963 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 beta subcomplex 8 K03964 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 beta subcomplex 9 K03965 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 beta subcomplex 10 K03966 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 beta subcomplex 11 K11351 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 subcomplex unknown 1 K03967 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 -NADH dehydrogenase (ubiquinone) 1 subcomplex unknown 2 K03968 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 1 K03945 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 2 K03946 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 3 K03947 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 4 K03948 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 5 K03949 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 6 K03950 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 7 K03951 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 8 K03952 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 9 K03953 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 10 K03954 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 alpha/beta subcomplex 1 K03955 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 +NADH-ubiquinone oxidoreductase subunit K03956 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 12 K11352 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 13 K11353 M00146 NADH dehydrogenase (ubiquinone) 1 alpha subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 beta subcomplex 1 K03957 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 beta subcomplex 2 K03958 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 beta subcomplex 3 K03959 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 beta subcomplex 4 K03960 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 beta subcomplex 5 K03961 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 beta subcomplex 6 K03962 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 beta subcomplex 7 K03963 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 beta subcomplex 8 K03964 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 beta subcomplex 9 K03965 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 beta subcomplex 10 K03966 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 beta subcomplex 11 K11351 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 subcomplex unknown 1 K03967 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 +NADH dehydrogenase (ubiquinone) 1 subcomplex unknown 2 K03968 M00147 NADH dehydrogenase (ubiquinone) 1 beta subcomplex 0,0 SDHC; succinate dehydrogenase (ubiquinone) cytochrome b560 subunit K00236 M00148 Succinate dehydrogenase (ubiquinone) 0,0 C00390,C00122 Ubiquinol,Fumarate C00399,C00042 Ubiquinone,Succinate SDHD; succinate dehydrogenase (ubiquinone) membrane anchor subunit K00237 M00148 Succinate dehydrogenase (ubiquinone) 0,0 C00390,C00122 Ubiquinol,Fumarate C00399,C00042 Ubiquinone,Succinate SDHA; succinate dehydrogenase (ubiquinone) flavoprotein subunit [EC:1.3.5.1] K00234 M00148 Succinate dehydrogenase (ubiquinone) 0,0 C00390,C00122 Ubiquinol,Fumarate C00399,C00042 Ubiquinone,Succinate @@ -1248,130 +1248,130 @@ frdA; fumarate reductase flavoprotein subunit [EC:1.3.5.4] K00244 M00150 Fumarat frdB; fumarate reductase iron-sulfur subunit [EC:1.3.5.4] K00245 M00150 Fumarate reductase, prokaryotes 0,0 C00122,C15603 Fumarate,Hydroquinone C00042,C15602 Succinate,Quinone frdC; fumarate reductase subunit C K00246 M00150 Fumarate reductase, prokaryotes 0,0 C00122,C15603 Fumarate,Hydroquinone C00042,C15602 Succinate,Quinone frdD; fumarate reductase subunit D K00247 M00150 Fumarate reductase, prokaryotes 0,0 C00122,C15603 Fumarate,Hydroquinone C00042,C15602 Succinate,Quinone -CYTB; ubiquinol-cytochrome c reductase cytochrome b subunit K00412 M00151 Cytochrome bc1 complex respiratory unit 0,0 -CYC1; ubiquinol-cytochrome c reductase cytochrome c1 subunit K00413 M00151 Cytochrome bc1 complex respiratory unit 0,0 -fbcH; ubiquinol-cytochrome c reductase cytochrome b/c1 subunit K00410 M00151 Cytochrome bc1 complex respiratory unit 0,0 -UQCRFS1; ubiquinol-cytochrome c reductase iron-sulfur subunit K00411 M00151 Cytochrome bc1 complex respiratory unit 0,0 -MQCRA; menaquinol-cytochrome c reductase iron-sulfur subunit [EC:1.10.2.-] K03886 M00151 Cytochrome bc1 complex respiratory unit 0,1 -MQCRB; menaquinol-cytochrome c reductase cytochrome b subunit K03887 M00151 Cytochrome bc1 complex respiratory unit 0,1 -MQCRC; menaquinol-cytochrome c reductase cytochrome b/c subunit K03888 M00151 Cytochrome bc1 complex respiratory unit 0,1 -qcrA; ubiquinol-cytochrome c reductase iron-sulfur subunit K03890 M00151 Cytochrome bc1 complex respiratory unit 0,2 -qcrB; ubiquinol-cytochrome c reductase cytochrome b subunit K03891 M00151 Cytochrome bc1 complex respiratory unit 0,2 -qcrC; ubiquinol-cytochrome c reductase cytochrome c subunit K03889 M00151 Cytochrome bc1 complex respiratory unit 0,2 -CYTB; ubiquinol-cytochrome c reductase cytochrome b subunit K00412 M00152 Cytochrome bc1 complex 0,0 -CYC1; ubiquinol-cytochrome c reductase cytochrome c1 subunit K00413 M00152 Cytochrome bc1 complex 0,0 -FBCH; ubiquinol-cytochrome c reductase cytochrome b/c1 subunit K00410 M00152 Cytochrome bc1 complex 0,0 -UQCRFS1; ubiquinol-cytochrome c reductase iron-sulfur subunit K00411 M00152 Cytochrome bc1 complex 0,0 -QCR1; ubiquinol-cytochrome c reductase core subunit 1 K00414 M00152 Cytochrome bc1 complex 0,0 -QCR2; ubiquinol-cytochrome c reductase core subunit 2 K00415 M00152 Cytochrome bc1 complex 0,0 -QCR6; ubiquinol-cytochrome c reductase subunit 6 K00416 M00152 Cytochrome bc1 complex 0,0 -QCR7; ubiquinol-cytochrome c reductase subunit 7 K00417 M00152 Cytochrome bc1 complex 0,0 -QCR8; ubiquinol-cytochrome c reductase subunit 8 K00418 M00152 Cytochrome bc1 complex 0,0 -QCR9; ubiquinol-cytochrome c reductase subunit 9 K00419 M00152 Cytochrome bc1 complex 0,0 -QCR10; ubiquinol-cytochrome c reductase subunit 10 K00420 M00152 Cytochrome bc1 complex 0,0 -cytochrome bd ubiquinol oxidase subunit I [EC:1.10.3.14] K00425 M00153 Cytochrome bd ubiquinol oxidase 0,0 -cytochrome bd ubiquinol oxidase subunit II [EC:1.10.3.14] K00426 M00153 Cytochrome bd ubiquinol oxidase 0,0 -cydX; cytochrome bd-I ubiquinol oxidase subunit X [EC:1.10.3.14] K00424 M00153 Cytochrome bd ubiquinol oxidase 0,0 -appX; cytochrome bd-II ubiquinol oxidase subunit AppX [EC:1.10.3.14] K22501 M00153 Cytochrome bd ubiquinol oxidase 0,0 -COX10; protoheme IX farnesyltransferase [EC:2.5.1.-] K02257 M00154 Cytochrome c oxidase 0,0 -COX3; cytochrome c oxidase subunit 3 K02262 M00154 Cytochrome c oxidase 0,0 -COX1; cytochrome c oxidase subunit 1 [EC:1.9.3.1] K02256 M00154 Cytochrome c oxidase 0,0 -COX2; cytochrome c oxidase subunit 2 K02261 M00154 Cytochrome c oxidase 0,0 -COX4; cytochrome c oxidase subunit 4 K02263 M00154 Cytochrome c oxidase 0,0 -COX5A; cytochrome c oxidase subunit 5a K02264 M00154 Cytochrome c oxidase 0,0 -COX5B; cytochrome c oxidase subunit 5b K02265 M00154 Cytochrome c oxidase 0,0 -COX6A; cytochrome c oxidase subunit 6a K02266 M00154 Cytochrome c oxidase 0,0 -COX6B; cytochrome c oxidase subunit 6b K02267 M00154 Cytochrome c oxidase 0,0 -COX6C; cytochrome c oxidase subunit 6c K02268 M00154 Cytochrome c oxidase 0,0 -COX7; cytochrome c oxidase subunit 7 K02269 M00154 Cytochrome c oxidase 0,0 -COX7A; cytochrome c oxidase subunit 7a K02270 M00154 Cytochrome c oxidase 0,0 -COX7B; cytochrome c oxidase subunit 7b K02271 M00154 Cytochrome c oxidase 0,0 -COX7C; cytochrome c oxidase subunit 7c K02272 M00154 Cytochrome c oxidase 0,0 -COX8; cytochrome c oxidase subunit 8 K02273 M00154 Cytochrome c oxidase 0,0 -COX11; cytochrome c oxidase assembly protein subunit 11 K02258 M00154 Cytochrome c oxidase 0,0 -COX15; cytochrome c oxidase assembly protein subunit 15 K02259 M00154 Cytochrome c oxidase 0,0 -COX17; cytochrome c oxidase assembly protein subunit 17 K02260 M00154 Cytochrome c oxidase 0,0 -coxB; cytochrome c oxidase subunit II [EC:1.9.3.1] K02275 M00155 Cytochrome c oxidase, prokaryotes 0,0 -coxA; cytochrome c oxidase subunit I [EC:1.9.3.1] K02274 M00155 Cytochrome c oxidase, prokaryotes 0,0 -coxC; cytochrome c oxidase subunit III [EC:1.9.3.1] K02276 M00155 Cytochrome c oxidase, prokaryotes 0,0 -coxAC; cytochrome c oxidase subunit I+III [EC:1.9.3.1] K15408 M00155 Cytochrome c oxidase, prokaryotes 0,0 -coxD; cytochrome c oxidase subunit IV [EC:1.9.3.1] K02277 M00155 Cytochrome c oxidase, prokaryotes 0,0 -ccoN; cb-type cytochrome c oxidase subunit I [EC:1.9.3.1] K00404 M00156 Cytochrome c oxidase, cbb3-type 0,0 -ccoO; cb-type cytochrome c oxidase subunit II K00405 M00156 Cytochrome c oxidase, cbb3-type 0,0 -ccoNO; cbb3-type cytochrome c oxidase subunit I/II K15862 M00156 Cytochrome c oxidase, cbb3-type 0,0 -ccoQ; cb-type cytochrome c oxidase subunit IV K00407 M00156 Cytochrome c oxidase, cbb3-type 0,0 -ccoP; cb-type cytochrome c oxidase subunit III K00406 M00156 Cytochrome c oxidase, cbb3-type 0,0 -ATPF1A; F-type H+-transporting ATPase subunit alpha [EC:7.1.2.2] K02111 M00157 F-type ATPase, prokaryotes and chloroplasts 0,0 -ATPF1B; F-type H+-transporting ATPase subunit beta [EC:7.1.2.2] K02112 M00157 F-type ATPase, prokaryotes and chloroplasts 0,0 -ATPF1D; F-type H+-transporting ATPase subunit delta K02113 M00157 F-type ATPase, prokaryotes and chloroplasts 0,0 -ATPF1E; F-type H+-transporting ATPase subunit epsilon K02114 M00157 F-type ATPase, prokaryotes and chloroplasts 0,0 -ATPF1G; F-type H+-transporting ATPase subunit gamma K02115 M00157 F-type ATPase, prokaryotes and chloroplasts 0,0 -ATPF0A; F-type H+-transporting ATPase subunit a K02108 M00157 F-type ATPase, prokaryotes and chloroplasts 0,0 -ATPF0B; F-type H+-transporting ATPase subunit b K02109 M00157 F-type ATPase, prokaryotes and chloroplasts 0,0 -ATPF0C; F-type H+-transporting ATPase subunit c K02110 M00157 F-type ATPase, prokaryotes and chloroplasts 0,0 -ATPeF1A; F-type H+-transporting ATPase subunit alpha K02132 M00158 F-type ATPase, eukaryotes 0,0 -ATPeF1B; F-type H+-transporting ATPase subunit beta [EC:3.6.3.14] K02133 M00158 F-type ATPase, eukaryotes 0,0 -ATPeF1G; F-type H+-transporting ATPase subunit gamma K02136 M00158 F-type ATPase, eukaryotes 0,0 -ATPeF1D; F-type H+-transporting ATPase subunit delta K02134 M00158 F-type ATPase, eukaryotes 0,0 -ATPeF1E; F-type H+-transporting ATPase subunit epsilon K02135 M00158 F-type ATPase, eukaryotes 0,0 -ATPeF0O; F-type H+-transporting ATPase subunit O K02137 M00158 F-type ATPase, eukaryotes 0,0 -ATPeF0A; F-type H+-transporting ATPase subunit a K02126 M00158 F-type ATPase, eukaryotes 0,0 -ATPeF0B; F-type H+-transporting ATPase subunit b K02127 M00158 F-type ATPase, eukaryotes 0,0 -ATPeF0C; F-type H+-transporting ATPase subunit c K02128 M00158 F-type ATPase, eukaryotes 0,0 -ATPeFD; F-type H+-transporting ATPase subunit d K02138 M00158 F-type ATPase, eukaryotes 0,0 -ATPeF0E; F-type H+-transporting ATPase subunit e K02129 M00158 F-type ATPase, eukaryotes 0,0 -TIM11; F-type H+-transporting ATP synthase subunit e K01549 M00158 F-type ATPase, eukaryotes 0,0 -ATPeF0F; F-type H+-transporting ATPase subunit f K02130 M00158 F-type ATPase, eukaryotes 0,0 -ATPeFF; F-type H+-transporting ATPase subunit f K02139 M00158 F-type ATPase, eukaryotes 0,0 -ATPeFG; F-type H+-transporting ATPase subunit g K02140 M00158 F-type ATPase, eukaryotes 0,0 -ATPeFH; F-type H+-transporting ATPase subunit h K02141 M00158 F-type ATPase, eukaryotes 0,0 -ATPeF0F6; F-type H+-transporting ATPase subunit 6 K02131 M00158 F-type ATPase, eukaryotes 0,0 -ATPeFJ; F-type H+-transporting ATPase subunit j K02142 M00158 F-type ATPase, eukaryotes 0,0 -ATPeFK; F-type H+-transporting ATPase subunit k K02143 M00158 F-type ATPase, eukaryotes 0,0 -ATPeF08; F-type H+-transporting ATPase subunit 8 K02125 M00158 F-type ATPase, eukaryotes 0,0 -ATPVA; V/A-type H+-transporting ATPase subunit A [EC:3.6.3.14] K02117 M00159 V/A-type ATPase, prokaryotes 0,0 -ATPVB; V/A-type H+-transporting ATPase subunit B K02118 M00159 V/A-type ATPase, prokaryotes 0,0 -ATPVC; V/A-type H+-transporting ATPase subunit C K02119 M00159 V/A-type ATPase, prokaryotes 0,0 -ATPVD; V/A-type H+-transporting ATPase subunit D K02120 M00159 V/A-type ATPase, prokaryotes 0,0 -ATPVE; V/A-type H+-transporting ATPase subunit E K02121 M00159 V/A-type ATPase, prokaryotes 0,0 -ATPVF; V/A-type H+-transporting ATPase subunit F K02122 M00159 V/A-type ATPase, prokaryotes 0,0 -ATPVG; V/A-type H+-transporting ATPase subunit G/H K02107 M00159 V/A-type ATPase, prokaryotes 0,0 -ATPVI; V/A-type H+-transporting ATPase subunit I K02123 M00159 V/A-type ATPase, prokaryotes 0,0 -ATPVK; V/A-type H+-transporting ATPase subunit K K02124 M00159 V/A-type ATPase, prokaryotes 0,0 -ATPeV1A; V-type H+-transporting ATPase subunit A [EC:3.6.3.14] K02145 M00160 V-type ATPase, eukaryotes 0,0 -ATPeV1B; V-type H+-transporting ATPase subunit B K02147 M00160 V-type ATPase, eukaryotes 0,0 -ATPeV1C; V-type H+-transporting ATPase subunit C K02148 M00160 V-type ATPase, eukaryotes 0,0 -ATPeV1D; V-type H+-transporting ATPase subunit D K02149 M00160 V-type ATPase, eukaryotes 0,0 -ATPeV1E; V-type H+-transporting ATPase subunit E K02150 M00160 V-type ATPase, eukaryotes 0,0 -ATPeV1F; V-type H+-transporting ATPase subunit F K02151 M00160 V-type ATPase, eukaryotes 0,0 -ATPeV1G; V-type H+-transporting ATPase subunit G K02152 M00160 V-type ATPase, eukaryotes 0,0 -ATPeV1H; V-type H+-transporting ATPase subunit H K02144 M00160 V-type ATPase, eukaryotes 0,0 -ATPeV0A; V-type H+-transporting ATPase subunit a K02154 M00160 V-type ATPase, eukaryotes 0,0 -ATPeV0B; V-type H+-transporting ATPase 21kDa proteolipid subunit K03661 M00160 V-type ATPase, eukaryotes 0,0 -ATPeV0C; V-type H+-transporting ATPase 16kDa proteolipid subunit K02155 M00160 V-type ATPase, eukaryotes 0,0 -ATPeV0D; V-type H+-transporting ATPase subunit d K02146 M00160 V-type ATPase, eukaryotes 0,0 -ATPeV0E; V-type H+-transporting ATPase subunit e K02153 M00160 V-type ATPase, eukaryotes 0,0 -ATPeVS1; V-type H+-transporting ATPase S1 subunit K03662 M00160 V-type ATPase, eukaryotes 0,0 -psbA; photosystem II reaction center D1 protein [EC:1.10.3.9] K02703 M00161 Photosystem II 0,0 -psbD; photosystem II reaction center D2 protein [EC:1.10.3.9] K02706 M00161 Photosystem II 0,0 -psbC; photosystem II CP43 chlorophyll apoprotein K02705 M00161 Photosystem II 0,0 -psbB; photosystem II CP47 chlorophyll apoprotein K02704 M00161 Photosystem II 0,0 -psbE; photosystem II cytochrome b559 subunit alpha K02707 M00161 Photosystem II 0,0 -psbF; photosystem II cytochrome b559 subunit beta K02708 M00161 Photosystem II 0,0 -cytochrome b6 K02635 M00162 Cytochrome b6f complex 0,0 -cytochrome b6-f complex subunit 4 K02637 M00162 Cytochrome b6f complex 0,0 -apocytochrome f K02634 M00162 Cytochrome b6f complex 0,0 -cytochrome b6-f complex iron-sulfur subunit K02636 M00162 Cytochrome b6f complex 0,0 -cytochrome b6-f complex subunit 6 K02642 M00162 Cytochrome b6f complex 0,0 -cytochrome b6-f complex subunit 7 K02643 M00162 Cytochrome b6f complex 0,0 -cytochrome b6-f complex subunit 8 K03689 M00162 Cytochrome b6f complex 0,0 -cytochrome b6-f complex subunit 5 K02640 M00162 Cytochrome b6f complex 0,0 -psaA; photosystem I P700 chlorophyll a apoprotein A1 K02689 M00163 Photosystem I 0,0 -psaB; photosystem I P700 chlorophyll a apoprotein A2 K02690 M00163 Photosystem I 0,0 -psaC; photosystem I subunit VII K02691 M00163 Photosystem I 0,0 -psaD; photosystem I subunit II K02692 M00163 Photosystem I 0,0 -psaE; photosystem I subunit IV K02693 M00163 Photosystem I 0,0 -psaF; photosystem I subunit III K02694 M00163 Photosystem I 0,0 +CYTB; ubiquinol-cytochrome c reductase cytochrome b subunit K00412 M00151 Cytochrome bc1 complex respiratory unit 0,0 +CYC1; ubiquinol-cytochrome c reductase cytochrome c1 subunit K00413 M00151 Cytochrome bc1 complex respiratory unit 0,0 +fbcH; ubiquinol-cytochrome c reductase cytochrome b/c1 subunit K00410 M00151 Cytochrome bc1 complex respiratory unit 0,0 +UQCRFS1; ubiquinol-cytochrome c reductase iron-sulfur subunit K00411 M00151 Cytochrome bc1 complex respiratory unit 0,0 +MQCRA; menaquinol-cytochrome c reductase iron-sulfur subunit [EC:1.10.2.-] K03886 M00151 Cytochrome bc1 complex respiratory unit 0,1 +MQCRB; menaquinol-cytochrome c reductase cytochrome b subunit K03887 M00151 Cytochrome bc1 complex respiratory unit 0,1 +MQCRC; menaquinol-cytochrome c reductase cytochrome b/c subunit K03888 M00151 Cytochrome bc1 complex respiratory unit 0,1 +qcrA; ubiquinol-cytochrome c reductase iron-sulfur subunit K03890 M00151 Cytochrome bc1 complex respiratory unit 0,2 +qcrB; ubiquinol-cytochrome c reductase cytochrome b subunit K03891 M00151 Cytochrome bc1 complex respiratory unit 0,2 +qcrC; ubiquinol-cytochrome c reductase cytochrome c subunit K03889 M00151 Cytochrome bc1 complex respiratory unit 0,2 +CYTB; ubiquinol-cytochrome c reductase cytochrome b subunit K00412 M00152 Cytochrome bc1 complex 0,0 +CYC1; ubiquinol-cytochrome c reductase cytochrome c1 subunit K00413 M00152 Cytochrome bc1 complex 0,0 +FBCH; ubiquinol-cytochrome c reductase cytochrome b/c1 subunit K00410 M00152 Cytochrome bc1 complex 0,0 +UQCRFS1; ubiquinol-cytochrome c reductase iron-sulfur subunit K00411 M00152 Cytochrome bc1 complex 0,0 +QCR1; ubiquinol-cytochrome c reductase core subunit 1 K00414 M00152 Cytochrome bc1 complex 0,0 +QCR2; ubiquinol-cytochrome c reductase core subunit 2 K00415 M00152 Cytochrome bc1 complex 0,0 +QCR6; ubiquinol-cytochrome c reductase subunit 6 K00416 M00152 Cytochrome bc1 complex 0,0 +QCR7; ubiquinol-cytochrome c reductase subunit 7 K00417 M00152 Cytochrome bc1 complex 0,0 +QCR8; ubiquinol-cytochrome c reductase subunit 8 K00418 M00152 Cytochrome bc1 complex 0,0 +QCR9; ubiquinol-cytochrome c reductase subunit 9 K00419 M00152 Cytochrome bc1 complex 0,0 +QCR10; ubiquinol-cytochrome c reductase subunit 10 K00420 M00152 Cytochrome bc1 complex 0,0 +cytochrome bd ubiquinol oxidase subunit I [EC:1.10.3.14] K00425 M00153 Cytochrome bd ubiquinol oxidase 0,0 +cytochrome bd ubiquinol oxidase subunit II [EC:1.10.3.14] K00426 M00153 Cytochrome bd ubiquinol oxidase 0,0 +cydX; cytochrome bd-I ubiquinol oxidase subunit X [EC:1.10.3.14] K00424 M00153 Cytochrome bd ubiquinol oxidase 0,0 +appX; cytochrome bd-II ubiquinol oxidase subunit AppX [EC:1.10.3.14] K22501 M00153 Cytochrome bd ubiquinol oxidase 0,0 +COX10; protoheme IX farnesyltransferase [EC:2.5.1.-] K02257 M00154 Cytochrome c oxidase 0,0 +COX3; cytochrome c oxidase subunit 3 K02262 M00154 Cytochrome c oxidase 0,0 +COX1; cytochrome c oxidase subunit 1 [EC:1.9.3.1] K02256 M00154 Cytochrome c oxidase 0,0 +COX2; cytochrome c oxidase subunit 2 K02261 M00154 Cytochrome c oxidase 0,0 +COX4; cytochrome c oxidase subunit 4 K02263 M00154 Cytochrome c oxidase 0,0 +COX5A; cytochrome c oxidase subunit 5a K02264 M00154 Cytochrome c oxidase 0,0 +COX5B; cytochrome c oxidase subunit 5b K02265 M00154 Cytochrome c oxidase 0,0 +COX6A; cytochrome c oxidase subunit 6a K02266 M00154 Cytochrome c oxidase 0,0 +COX6B; cytochrome c oxidase subunit 6b K02267 M00154 Cytochrome c oxidase 0,0 +COX6C; cytochrome c oxidase subunit 6c K02268 M00154 Cytochrome c oxidase 0,0 +COX7; cytochrome c oxidase subunit 7 K02269 M00154 Cytochrome c oxidase 0,0 +COX7A; cytochrome c oxidase subunit 7a K02270 M00154 Cytochrome c oxidase 0,0 +COX7B; cytochrome c oxidase subunit 7b K02271 M00154 Cytochrome c oxidase 0,0 +COX7C; cytochrome c oxidase subunit 7c K02272 M00154 Cytochrome c oxidase 0,0 +COX8; cytochrome c oxidase subunit 8 K02273 M00154 Cytochrome c oxidase 0,0 +COX11; cytochrome c oxidase assembly protein subunit 11 K02258 M00154 Cytochrome c oxidase 0,0 +COX15; cytochrome c oxidase assembly protein subunit 15 K02259 M00154 Cytochrome c oxidase 0,0 +COX17; cytochrome c oxidase assembly protein subunit 17 K02260 M00154 Cytochrome c oxidase 0,0 +coxB; cytochrome c oxidase subunit II [EC:1.9.3.1] K02275 M00155 Cytochrome c oxidase, prokaryotes 0,0 +coxA; cytochrome c oxidase subunit I [EC:1.9.3.1] K02274 M00155 Cytochrome c oxidase, prokaryotes 0,0 +coxC; cytochrome c oxidase subunit III [EC:1.9.3.1] K02276 M00155 Cytochrome c oxidase, prokaryotes 0,0 +coxAC; cytochrome c oxidase subunit I+III [EC:1.9.3.1] K15408 M00155 Cytochrome c oxidase, prokaryotes 0,0 +coxD; cytochrome c oxidase subunit IV [EC:1.9.3.1] K02277 M00155 Cytochrome c oxidase, prokaryotes 0,0 +ccoN; cb-type cytochrome c oxidase subunit I [EC:1.9.3.1] K00404 M00156 Cytochrome c oxidase, cbb3-type 0,0 +ccoO; cb-type cytochrome c oxidase subunit II K00405 M00156 Cytochrome c oxidase, cbb3-type 0,0 +ccoNO; cbb3-type cytochrome c oxidase subunit I/II K15862 M00156 Cytochrome c oxidase, cbb3-type 0,0 +ccoQ; cb-type cytochrome c oxidase subunit IV K00407 M00156 Cytochrome c oxidase, cbb3-type 0,0 +ccoP; cb-type cytochrome c oxidase subunit III K00406 M00156 Cytochrome c oxidase, cbb3-type 0,0 +ATPF1A; F-type H+-transporting ATPase subunit alpha [EC:7.1.2.2] K02111 M00157 F-type ATPase, prokaryotes and chloroplasts 0,0 +ATPF1B; F-type H+-transporting ATPase subunit beta [EC:7.1.2.2] K02112 M00157 F-type ATPase, prokaryotes and chloroplasts 0,0 +ATPF1D; F-type H+-transporting ATPase subunit delta K02113 M00157 F-type ATPase, prokaryotes and chloroplasts 0,0 +ATPF1E; F-type H+-transporting ATPase subunit epsilon K02114 M00157 F-type ATPase, prokaryotes and chloroplasts 0,0 +ATPF1G; F-type H+-transporting ATPase subunit gamma K02115 M00157 F-type ATPase, prokaryotes and chloroplasts 0,0 +ATPF0A; F-type H+-transporting ATPase subunit a K02108 M00157 F-type ATPase, prokaryotes and chloroplasts 0,0 +ATPF0B; F-type H+-transporting ATPase subunit b K02109 M00157 F-type ATPase, prokaryotes and chloroplasts 0,0 +ATPF0C; F-type H+-transporting ATPase subunit c K02110 M00157 F-type ATPase, prokaryotes and chloroplasts 0,0 +ATPeF1A; F-type H+-transporting ATPase subunit alpha K02132 M00158 F-type ATPase, eukaryotes 0,0 +ATPeF1B; F-type H+-transporting ATPase subunit beta [EC:3.6.3.14] K02133 M00158 F-type ATPase, eukaryotes 0,0 +ATPeF1G; F-type H+-transporting ATPase subunit gamma K02136 M00158 F-type ATPase, eukaryotes 0,0 +ATPeF1D; F-type H+-transporting ATPase subunit delta K02134 M00158 F-type ATPase, eukaryotes 0,0 +ATPeF1E; F-type H+-transporting ATPase subunit epsilon K02135 M00158 F-type ATPase, eukaryotes 0,0 +ATPeF0O; F-type H+-transporting ATPase subunit O K02137 M00158 F-type ATPase, eukaryotes 0,0 +ATPeF0A; F-type H+-transporting ATPase subunit a K02126 M00158 F-type ATPase, eukaryotes 0,0 +ATPeF0B; F-type H+-transporting ATPase subunit b K02127 M00158 F-type ATPase, eukaryotes 0,0 +ATPeF0C; F-type H+-transporting ATPase subunit c K02128 M00158 F-type ATPase, eukaryotes 0,0 +ATPeFD; F-type H+-transporting ATPase subunit d K02138 M00158 F-type ATPase, eukaryotes 0,0 +ATPeF0E; F-type H+-transporting ATPase subunit e K02129 M00158 F-type ATPase, eukaryotes 0,0 +TIM11; F-type H+-transporting ATP synthase subunit e K01549 M00158 F-type ATPase, eukaryotes 0,0 +ATPeF0F; F-type H+-transporting ATPase subunit f K02130 M00158 F-type ATPase, eukaryotes 0,0 +ATPeFF; F-type H+-transporting ATPase subunit f K02139 M00158 F-type ATPase, eukaryotes 0,0 +ATPeFG; F-type H+-transporting ATPase subunit g K02140 M00158 F-type ATPase, eukaryotes 0,0 +ATPeFH; F-type H+-transporting ATPase subunit h K02141 M00158 F-type ATPase, eukaryotes 0,0 +ATPeF0F6; F-type H+-transporting ATPase subunit 6 K02131 M00158 F-type ATPase, eukaryotes 0,0 +ATPeFJ; F-type H+-transporting ATPase subunit j K02142 M00158 F-type ATPase, eukaryotes 0,0 +ATPeFK; F-type H+-transporting ATPase subunit k K02143 M00158 F-type ATPase, eukaryotes 0,0 +ATPeF08; F-type H+-transporting ATPase subunit 8 K02125 M00158 F-type ATPase, eukaryotes 0,0 +ATPVA; V/A-type H+-transporting ATPase subunit A [EC:3.6.3.14] K02117 M00159 V/A-type ATPase, prokaryotes 0,0 +ATPVB; V/A-type H+-transporting ATPase subunit B K02118 M00159 V/A-type ATPase, prokaryotes 0,0 +ATPVC; V/A-type H+-transporting ATPase subunit C K02119 M00159 V/A-type ATPase, prokaryotes 0,0 +ATPVD; V/A-type H+-transporting ATPase subunit D K02120 M00159 V/A-type ATPase, prokaryotes 0,0 +ATPVE; V/A-type H+-transporting ATPase subunit E K02121 M00159 V/A-type ATPase, prokaryotes 0,0 +ATPVF; V/A-type H+-transporting ATPase subunit F K02122 M00159 V/A-type ATPase, prokaryotes 0,0 +ATPVG; V/A-type H+-transporting ATPase subunit G/H K02107 M00159 V/A-type ATPase, prokaryotes 0,0 +ATPVI; V/A-type H+-transporting ATPase subunit I K02123 M00159 V/A-type ATPase, prokaryotes 0,0 +ATPVK; V/A-type H+-transporting ATPase subunit K K02124 M00159 V/A-type ATPase, prokaryotes 0,0 +ATPeV1A; V-type H+-transporting ATPase subunit A [EC:3.6.3.14] K02145 M00160 V-type ATPase, eukaryotes 0,0 +ATPeV1B; V-type H+-transporting ATPase subunit B K02147 M00160 V-type ATPase, eukaryotes 0,0 +ATPeV1C; V-type H+-transporting ATPase subunit C K02148 M00160 V-type ATPase, eukaryotes 0,0 +ATPeV1D; V-type H+-transporting ATPase subunit D K02149 M00160 V-type ATPase, eukaryotes 0,0 +ATPeV1E; V-type H+-transporting ATPase subunit E K02150 M00160 V-type ATPase, eukaryotes 0,0 +ATPeV1F; V-type H+-transporting ATPase subunit F K02151 M00160 V-type ATPase, eukaryotes 0,0 +ATPeV1G; V-type H+-transporting ATPase subunit G K02152 M00160 V-type ATPase, eukaryotes 0,0 +ATPeV1H; V-type H+-transporting ATPase subunit H K02144 M00160 V-type ATPase, eukaryotes 0,0 +ATPeV0A; V-type H+-transporting ATPase subunit a K02154 M00160 V-type ATPase, eukaryotes 0,0 +ATPeV0B; V-type H+-transporting ATPase 21kDa proteolipid subunit K03661 M00160 V-type ATPase, eukaryotes 0,0 +ATPeV0C; V-type H+-transporting ATPase 16kDa proteolipid subunit K02155 M00160 V-type ATPase, eukaryotes 0,0 +ATPeV0D; V-type H+-transporting ATPase subunit d K02146 M00160 V-type ATPase, eukaryotes 0,0 +ATPeV0E; V-type H+-transporting ATPase subunit e K02153 M00160 V-type ATPase, eukaryotes 0,0 +ATPeVS1; V-type H+-transporting ATPase S1 subunit K03662 M00160 V-type ATPase, eukaryotes 0,0 +psbA; photosystem II reaction center D1 protein [EC:1.10.3.9] K02703 M00161 Photosystem II 0,0 +psbD; photosystem II reaction center D2 protein [EC:1.10.3.9] K02706 M00161 Photosystem II 0,0 +psbC; photosystem II CP43 chlorophyll apoprotein K02705 M00161 Photosystem II 0,0 +psbB; photosystem II CP47 chlorophyll apoprotein K02704 M00161 Photosystem II 0,0 +psbE; photosystem II cytochrome b559 subunit alpha K02707 M00161 Photosystem II 0,0 +psbF; photosystem II cytochrome b559 subunit beta K02708 M00161 Photosystem II 0,0 +cytochrome b6 K02635 M00162 Cytochrome b6f complex 0,0 +cytochrome b6-f complex subunit 4 K02637 M00162 Cytochrome b6f complex 0,0 +apocytochrome f K02634 M00162 Cytochrome b6f complex 0,0 +cytochrome b6-f complex iron-sulfur subunit K02636 M00162 Cytochrome b6f complex 0,0 +cytochrome b6-f complex subunit 6 K02642 M00162 Cytochrome b6f complex 0,0 +cytochrome b6-f complex subunit 7 K02643 M00162 Cytochrome b6f complex 0,0 +cytochrome b6-f complex subunit 8 K03689 M00162 Cytochrome b6f complex 0,0 +cytochrome b6-f complex subunit 5 K02640 M00162 Cytochrome b6f complex 0,0 +psaA; photosystem I P700 chlorophyll a apoprotein A1 K02689 M00163 Photosystem I 0,0 +psaB; photosystem I P700 chlorophyll a apoprotein A2 K02690 M00163 Photosystem I 0,0 +psaC; photosystem I subunit VII K02691 M00163 Photosystem I 0,0 +psaD; photosystem I subunit II K02692 M00163 Photosystem I 0,0 +psaE; photosystem I subunit IV K02693 M00163 Photosystem I 0,0 +psaF; photosystem I subunit III K02694 M00163 Photosystem I 0,0 phosphoribulokinase [EC:2.7.1.19] [RN:R01523] K00855 M00165 Reductive pentose phosphate cycle (Calvin cycle) 0,0 C01182 D-Ribulose 1,5-bisphosphate C00199 D-Ribulose 5-phosphate ribulose-bisphosphate carboxylase [EC:4.1.1.39] [RN:R00024] K01601 M00165 Reductive pentose phosphate cycle (Calvin cycle) 1,0 C00197 3-Phospho-D-glycerate C01182,C00011 D-Ribulose 1,5-bisphosphate,CO2 ribulose-bisphosphate carboxylase [EC:4.1.1.39] [RN:R00024] K01602 M00165 Reductive pentose phosphate cycle (Calvin cycle) 1,0 C00197 3-Phospho-D-glycerate C01182,C00011 D-Ribulose 1,5-bisphosphate,CO2 @@ -1516,301 +1516,301 @@ phosphoadenosine phosphosulfate reductase [EC:1.8.4.8] [RN:R02021] K00390 M00176 sulfite reductase (NADPH) [EC:1.8.1.2] [RN:R00858] K00380 M00176 Assimilatory sulfate reduction, sulfate => H2S 2,0 C00283 Hydrogen sulfide C00094 Sulfite sulfite reductase (NADPH) [EC:1.8.1.2] [RN:R00858] K00381 M00176 Assimilatory sulfate reduction, sulfate => H2S 2,0 C00283 Hydrogen sulfide C00094 Sulfite sulfite reductase (ferredoxin) [EC:1.8.7.1] [RN:R00859] K00392 M00176 Assimilatory sulfate reduction, sulfate => H2S 2,1 C00283 Hydrogen sulfide C00094 Sulfite -small subunit ribosomal protein S2e K02981 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S3e K02985 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S3Ae K02984 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S4e K02987 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S5e K02989 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S6e K02991 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S7e K02993 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S8e K02995 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S9e K02997 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S10e K02947 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S11e K02949 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S12e K02951 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S13e K02953 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S14e K02955 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S15e K02958 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S15Ae K02957 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S16e K02960 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S17e K02962 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S18e K02964 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S19e K02966 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S20e K02969 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S21e K02971 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S23e K02973 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S24e K02974 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S25e K02975 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S26e K02976 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S27e K02978 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S27Ae K02977 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S28e K02979 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S29e K02980 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S30e K02983 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein SAe K02998 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L3e K02925 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L4e K02930 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L5e K02932 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L6e K02934 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L7e K02937 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L7Ae K02936 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L8e K02938 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L9e K02940 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L10e K02866 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L10Ae K02865 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L11e K02868 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L12e K02870 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L13e K02873 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L13Ae K02872 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L14e K02875 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L15e K02877 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L17e K02880 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L18e K02883 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L18Ae K02882 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L19e K02885 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L21e K02889 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L22e K02891 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L23e K02894 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L23Ae K02893 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L24e K02896 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L26e K02898 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L27e K02901 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L27Ae K02900 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L28e K02903 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L29e K02905 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L30e K02908 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L31e K02910 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L32e K02912 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L34e K02915 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L35e K02918 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L35Ae K02917 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L36e K02920 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L37e K02922 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L37Ae K02921 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L38e K02923 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L39e K02924 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L40e K02927 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L41e K02928 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein L44e K02929 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein LP0 K02941 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein LP1 K02942 M00177 Ribosome, eukaryotes 0,0 -large subunit ribosomal protein LP2 K02943 M00177 Ribosome, eukaryotes 0,0 -small subunit ribosomal protein S10 K02946 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L3 K02906 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L4 K02926 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L23 K02892 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L2 K02886 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S19 K02965 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L22 K02890 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S3 K02982 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L16 K02878 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L29 K02904 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S17 K02961 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L14 K02874 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L24 K02895 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L5 K02931 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S14 K02954 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S8 K02994 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L6 K02933 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L18 K02881 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S5 K02988 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L30 K02907 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L15 K02876 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L36 K02919 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S13 K02952 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S11 K02948 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S4 K02986 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L17 K02879 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L13 K02871 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S9 K02996 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S7 K02992 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S12 K02950 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L7A K07590 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L7/L12 K02935 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L10 K02864 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L1 K02863 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L11 K02867 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S2 K02967 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S15 K02956 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L35 K02916 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L20 K02887 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L34 K02914 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L9 K02939 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S18 K02963 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S6 K02990 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L21 K02888 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L27 K02899 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L28 K02902 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L33 K02913 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L32 K02911 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L31 K02909 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L25 K02897 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S16 K02959 M00178 Ribosome, bacteria 0,0 -large subunit ribosomal protein L19 K02884 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S20 K02968 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S1 K02945 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S21 K02970 M00178 Ribosome, bacteria 0,0 -small subunit ribosomal protein S10 K02946 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L3 K02906 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L4e K02930 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L23 K02892 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L2 K02886 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S19 K02965 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L22 K02890 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S3 K02982 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L29 K02904 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S17 K02961 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L14 K02874 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L24 K02895 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S4e K02987 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L5 K02931 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S14 K02954 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S8 K02994 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L6 K02933 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L32e K02912 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L19e K02885 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L18 K02881 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S5 K02988 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L30 K02907 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L15 K02876 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S13 K02952 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S11 K02948 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S4 K02986 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L18e K02883 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L13 K02871 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S9 K02996 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S7 K02992 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S12 K02950 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L7Ae K02936 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S28e K02979 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L24e K02896 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L12 K02869 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L10 K02864 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L1 K02863 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L11 K02867 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S2 K02967 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S15 K02956 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S27e K02978 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L44e K02929 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L15e K02877 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S3Ae K02984 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S6e K02991 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S24e K02974 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S27Ae K02977 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S17e K02962 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L31e K02910 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L39e K02924 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L10e K02866 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L21e K02889 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L37e K02922 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L37Ae K02921 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S8e K02995 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S19e K02966 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L40e K02927 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein LX K02944 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S26e K02976 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S25e K02975 M00179 Ribosome, archaea 0,0 -small subunit ribosomal protein S30e K02983 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L13e K02873 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L35Ae K02917 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L41e K02928 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L34e K02915 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L14e K02875 M00179 Ribosome, archaea 0,0 -large subunit ribosomal protein L30e K02908 M00179 Ribosome, archaea 0,0 -RPB1; DNA-directed RNA polymerase II subunit RPB1 [EC:2.7.7.6] K03006 M00180 RNA polymerase II, eukaryotes 0,0 -RPB2; DNA-directed RNA polymerase II subunit RPB2 [EC:2.7.7.6] K03010 M00180 RNA polymerase II, eukaryotes 0,0 -RPB3; DNA-directed RNA polymerase II subunit RPB3 K03011 M00180 RNA polymerase II, eukaryotes 0,0 -RPB11; DNA-directed RNA polymerase II subunit RPB11 K03008 M00180 RNA polymerase II, eukaryotes 0,0 -RPB4; DNA-directed RNA polymerase II subunit RPB4 K03012 M00180 RNA polymerase II, eukaryotes 0,0 -RPB7; DNA-directed RNA polymerase II subunit RPB7 K03015 M00180 RNA polymerase II, eukaryotes 0,0 -RPB9; DNA-directed RNA polymerase II subunit RPB9 K03017 M00180 RNA polymerase II, eukaryotes 0,0 -RPB5; DNA-directed RNA polymerases I, II, and III subunit RPABC1 K03013 M00180 RNA polymerase II, eukaryotes 0,0 -RPB6; DNA-directed RNA polymerases I, II, and III subunit RPABC2 K03014 M00180 RNA polymerase II, eukaryotes 0,0 -RPB8; DNA-directed RNA polymerases I, II, and III subunit RPABC3 K03016 M00180 RNA polymerase II, eukaryotes 0,0 -RPB12; DNA-directed RNA polymerases I, II, and III subunit RPABC4 K03009 M00180 RNA polymerase II, eukaryotes 0,0 -RPB10; DNA-directed RNA polymerases I, II, and III subunit RPABC5 K03007 M00180 RNA polymerase II, eukaryotes 0,0 -RPC1; DNA-directed RNA polymerase III subunit RPC1 [EC:2.7.7.6] K03018 M00181 RNA polymerase III, eukaryotes 0,0 -RPC2; DNA-directed RNA polymerase III subunit RPC2 [EC:2.7.7.6] K03021 M00181 RNA polymerase III, eukaryotes 0,0 -RPC40; DNA-directed RNA polymerases I and III subunit RPAC1 K03027 M00181 RNA polymerase III, eukaryotes 0,0 -RPC19; DNA-directed RNA polymerases I and III subunit RPAC2 K03020 M00181 RNA polymerase III, eukaryotes 0,0 -RPC82; DNA-directed RNA polymerase III subunit RPC3 K03023 M00181 RNA polymerase III, eukaryotes 0,0 -RPC53; DNA-directed RNA polymerase III subunit RPC4 K03026 M00181 RNA polymerase III, eukaryotes 0,0 -RPC37; DNA-directed RNA polymerase III subunit RPC5 K14721 M00181 RNA polymerase III, eukaryotes 0,0 -RPC34; DNA-directed RNA polymerase III subunit RPC6 K03025 M00181 RNA polymerase III, eukaryotes 0,0 -RPC31; DNA-directed RNA polymerase III subunit RPC7 K03024 M00181 RNA polymerase III, eukaryotes 0,0 -RPC25; DNA-directed RNA polymerase III subunit RPC8 K03022 M00181 RNA polymerase III, eukaryotes 0,0 -RPC11; DNA-directed RNA polymerase III subunit RPC10 K03019 M00181 RNA polymerase III, eukaryotes 0,0 -RPB5; DNA-directed RNA polymerases I, II, and III subunit RPABC1 K03013 M00181 RNA polymerase III, eukaryotes 0,0 -RPB6; DNA-directed RNA polymerases I, II, and III subunit RPABC2 K03014 M00181 RNA polymerase III, eukaryotes 0,0 -RPB8; DNA-directed RNA polymerases I, II, and III subunit RPABC3 K03016 M00181 RNA polymerase III, eukaryotes 0,0 -RPB12; DNA-directed RNA polymerases I, II, and III subunit RPABC4 K03009 M00181 RNA polymerase III, eukaryotes 0,0 -RPB10; DNA-directed RNA polymerases I, II, and III subunit RPABC5 K03007 M00181 RNA polymerase III, eukaryotes 0,0 -RPA1; DNA-directed RNA polymerase I subunit RPA1 [EC:2.7.7.6] K02999 M00182 RNA polymerase I, eukaryotes 0,0 -RPA2; DNA-directed RNA polymerase I subunit RPA2 [EC:2.7.7.6] K03002 M00182 RNA polymerase I, eukaryotes 0,0 -RPC40; DNA-directed RNA polymerases I and III subunit RPAC1 K03027 M00182 RNA polymerase I, eukaryotes 0,0 -RPC19; DNA-directed RNA polymerases I and III subunit RPAC2 K03020 M00182 RNA polymerase I, eukaryotes 0,0 -RPA12; DNA-directed RNA polymerase I subunit RPA12 K03000 M00182 RNA polymerase I, eukaryotes 0,0 -RPA14; DNA-directed RNA polymerase I subunit RPA14 K03001 M00182 RNA polymerase I, eukaryotes 0,0 -RPA34; DNA-directed RNA polymerase I subunit RPA34 K03003 M00182 RNA polymerase I, eukaryotes 0,0 -RPA43; DNA-directed RNA polymerase I subunit RPA43 K03004 M00182 RNA polymerase I, eukaryotes 0,0 -RPA49; DNA-directed RNA polymerase I subunit RPA49 K03005 M00182 RNA polymerase I, eukaryotes 0,0 -RPB5; DNA-directed RNA polymerases I, II, and III subunit RPABC1 K03013 M00182 RNA polymerase I, eukaryotes 0,0 -RPB6; DNA-directed RNA polymerases I, II, and III subunit RPABC2 K03014 M00182 RNA polymerase I, eukaryotes 0,0 -RPB8; DNA-directed RNA polymerases I, II, and III subunit RPABC3 K03016 M00182 RNA polymerase I, eukaryotes 0,0 -RPB12; DNA-directed RNA polymerases I, II, and III subunit RPABC4 K03009 M00182 RNA polymerase I, eukaryotes 0,0 -RPB10; DNA-directed RNA polymerases I, II, and III subunit RPABC5 K03007 M00182 RNA polymerase I, eukaryotes 0,0 -rpoA; DNA-directed RNA polymerase subunit alpha [EC:2.7.7.6] K03040 M00183 RNA polymerase, bacteria 0,0 -rpoB; DNA-directed RNA polymerase subunit beta [EC:2.7.7.6] K03043 M00183 RNA polymerase, bacteria 0,0 -rpoC; DNA-directed RNA polymerase subunit beta' [EC:2.7.7.6] K03046 M00183 RNA polymerase, bacteria 0,0 -rpoBC; DNA-directed RNA polymerase subunit beta-beta' [EC:2.7.7.6] K13797 M00183 RNA polymerase, bacteria 0,0 -rpoZ; DNA-directed RNA polymerase subunit omega [EC:2.7.7.6] K03060 M00183 RNA polymerase, bacteria 0,0 -rpoE; DNA-directed RNA polymerase subunit delta K03048 M00183 RNA polymerase, bacteria 0,0 -"rpoA2; DNA-directed RNA polymerase subunit A"" [EC:2.7.7.6]" K03042 M00184 RNA polymerase, archaea 0,0 -rpoA1; DNA-directed RNA polymerase subunit A' [EC:2.7.7.6] K03041 M00184 RNA polymerase, archaea 0,0 -rpoB1; DNA-directed RNA polymerase subunit B' [EC:2.7.7.6] K03044 M00184 RNA polymerase, archaea 0,0 -"rpoB2; DNA-directed RNA polymerase subunit B"" [EC:2.7.7.6]" K03045 M00184 RNA polymerase, archaea 0,0 -rpoB; DNA-directed RNA polymerase subunit B [EC:2.7.7.6] K13798 M00184 RNA polymerase, archaea 0,0 -rpoH; DNA-directed RNA polymerase subunit H [EC:2.7.7.6] K03053 M00184 RNA polymerase, archaea 0,0 -rpoK; DNA-directed RNA polymerase subunit K [EC:2.7.7.6] K03055 M00184 RNA polymerase, archaea 0,0 -rpoN; DNA-directed RNA polymerase subunit N [EC:2.7.7.6] K03058 M00184 RNA polymerase, archaea 0,0 -rpoD; DNA-directed RNA polymerase subunit D [EC:2.7.7.6] K03047 M00184 RNA polymerase, archaea 0,0 -rpoE1; DNA-directed RNA polymerase subunit E' [EC:2.7.7.6] K03049 M00184 RNA polymerase, archaea 0,0 -"rpoE2; DNA-directed RNA polymerase subunit E"" [EC:2.7.7.6]" K03050 M00184 RNA polymerase, archaea 0,0 -rpoL; DNA-directed RNA polymerase subunit L [EC:2.7.7.6] K03056 M00184 RNA polymerase, archaea 0,0 -rpoP; DNA-directed RNA polymerase subunit P [EC:2.7.7.6] K03059 M00184 RNA polymerase, archaea 0,0 -rpoF; DNA-directed RNA polymerase subunit F [EC:2.7.7.6] K03051 M00184 RNA polymerase, archaea 0,0 -rpoG; DNA-directed RNA polymerase subunit G [EC:2.7.7.6] K03052 M00184 RNA polymerase, archaea 0,0 -rpoI; DNA-directed RNA polymerase subunit I [EC:2.7.7.6] K03054 M00184 RNA polymerase, archaea 0,0 -dnaE; DNA polymerase III subunit alpha [EC:2.7.7.7] K02337 M00260 DNA polymerase III complex, bacteria 0,0 -polC; DNA polymerase III subunit alpha, Gram-positive type [EC:2.7.7.7] K03763 M00260 DNA polymerase III complex, bacteria 0,0 -dnaQ; DNA polymerase III subunit epsilon [EC:2.7.7.7] K02342 M00260 DNA polymerase III complex, bacteria 0,0 -rnhA-dnaQ; ribonuclease HI / DNA polymerase III subunit epsilon [EC:3.1.26.4 2.7.7.7] K14159 M00260 DNA polymerase III complex, bacteria 0,0 -holE; DNA polymerase III subunit theta [EC:2.7.7.7] K02345 M00260 DNA polymerase III complex, bacteria 0,0 -dnaN; DNA polymerase III subunit beta [EC:2.7.7.7] K02338 M00260 DNA polymerase III complex, bacteria 0,0 -holA; DNA polymerase III subunit delta [EC:2.7.7.7] K02340 M00260 DNA polymerase III complex, bacteria 0,0 -holB; DNA polymerase III subunit delta' [EC:2.7.7.7] K02341 M00260 DNA polymerase III complex, bacteria 0,0 -dnaX; DNA polymerase III subunit gamma/tau [EC:2.7.7.7] K02343 M00260 DNA polymerase III complex, bacteria 0,0 -holC; DNA polymerase III subunit chi [EC:2.7.7.7] K02339 M00260 DNA polymerase III complex, bacteria 0,0 -holD; DNA polymerase III subunit psi [EC:2.7.7.7] K02344 M00260 DNA polymerase III complex, bacteria 0,0 -POLA1; DNA polymerase alpha, subunit A [EC:2.7.7.7] K02320 M00261 DNA polymerase alpha / primase complex 0,0 -POLA2; DNA polymerase alpha, subunit B [EC:2.7.7.7] K02321 M00261 DNA polymerase alpha / primase complex 0,0 -PRI2; DNA primase large subunit [EC:2.7.7.-] K02685 M00261 DNA polymerase alpha / primase complex 0,0 -PRI1; DNA primase small subunit [EC:2.7.7.-] K02684 M00261 DNA polymerase alpha / primase complex 0,0 -POLD1; DNA polymerase delta, subunit A [EC:2.7.7.7] K02327 M00262 DNA polymerase delta complex 0,0 -POLD2; DNA polymerase delta, subunit B [EC:2.7.7.7] K02328 M00262 DNA polymerase delta complex 0,0 -POLD3; DNA polymerase delta, subunit C [EC:2.7.7.7] K03504 M00262 DNA polymerase delta complex 0,0 -POLD4; DNA polymerase delta, subunit D [EC:2.7.7.7] K03505 M00262 DNA polymerase delta complex 0,0 -POLE1; DNA polymerase epsilon, subunit A [EC:2.7.7.7] K02324 M00263 DNA polymerase epsilon complex 0,0 -POLE2; DNA Polymerase epsilon, subunit B [EC:2.7.7.7] K02325 M00263 DNA polymerase epsilon complex 0,0 -POLE3; DNA Polymerase epsilon, subunit C [EC:2.7.7.7] K02326 M00263 DNA polymerase epsilon complex 0,0 -POLE4; DNA polymerase epsilon, subunit D [EC:2.7.7.7] K03506 M00263 DNA polymerase epsilon complex 0,0 -DPB1; DNA polymerase II large subunit [EC:2.7.7.7] K02322 M00264 DNA polymerase II complex, archaea 0,0 -DPB2; DNA polymerase II small subunit [EC:2.7.7.7] K02323 M00264 DNA polymerase II complex, archaea 0,0 -POLZ1, rev3; DNA polymerase zeta subunit K02350 M00293 DNA polymerase zeta complex 0,0 -POLZ2, rev7; DNA polymerase zeta subunit K03508 M00293 DNA polymerase zeta complex 0,0 -MAD2L2; mitotic spindle assembly checkpoint protein MAD2B K13728 M00293 DNA polymerase zeta complex 0,0 -POLG1; DNA polymerase gamma subunit [EC:2.7.7.7] [COG:COG0749] [GO:0003895] K02332 M00294 DNA polymerase gamma complex 0,0 -POLG2; DNA polymerase gamma2 subunit [EC:2.7.7.7] [GO:0003895] K02333 M00294 DNA polymerase gamma complex 0,0 +small subunit ribosomal protein S2e K02981 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S3e K02985 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S3Ae K02984 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S4e K02987 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S5e K02989 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S6e K02991 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S7e K02993 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S8e K02995 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S9e K02997 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S10e K02947 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S11e K02949 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S12e K02951 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S13e K02953 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S14e K02955 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S15e K02958 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S15Ae K02957 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S16e K02960 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S17e K02962 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S18e K02964 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S19e K02966 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S20e K02969 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S21e K02971 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S23e K02973 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S24e K02974 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S25e K02975 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S26e K02976 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S27e K02978 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S27Ae K02977 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S28e K02979 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S29e K02980 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S30e K02983 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein SAe K02998 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L3e K02925 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L4e K02930 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L5e K02932 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L6e K02934 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L7e K02937 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L7Ae K02936 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L8e K02938 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L9e K02940 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L10e K02866 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L10Ae K02865 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L11e K02868 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L12e K02870 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L13e K02873 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L13Ae K02872 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L14e K02875 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L15e K02877 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L17e K02880 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L18e K02883 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L18Ae K02882 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L19e K02885 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L21e K02889 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L22e K02891 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L23e K02894 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L23Ae K02893 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L24e K02896 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L26e K02898 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L27e K02901 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L27Ae K02900 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L28e K02903 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L29e K02905 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L30e K02908 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L31e K02910 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L32e K02912 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L34e K02915 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L35e K02918 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L35Ae K02917 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L36e K02920 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L37e K02922 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L37Ae K02921 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L38e K02923 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L39e K02924 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L40e K02927 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L41e K02928 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein L44e K02929 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein LP0 K02941 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein LP1 K02942 M00177 Ribosome, eukaryotes 0,0 +large subunit ribosomal protein LP2 K02943 M00177 Ribosome, eukaryotes 0,0 +small subunit ribosomal protein S10 K02946 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L3 K02906 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L4 K02926 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L23 K02892 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L2 K02886 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S19 K02965 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L22 K02890 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S3 K02982 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L16 K02878 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L29 K02904 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S17 K02961 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L14 K02874 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L24 K02895 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L5 K02931 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S14 K02954 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S8 K02994 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L6 K02933 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L18 K02881 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S5 K02988 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L30 K02907 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L15 K02876 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L36 K02919 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S13 K02952 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S11 K02948 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S4 K02986 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L17 K02879 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L13 K02871 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S9 K02996 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S7 K02992 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S12 K02950 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L7A K07590 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L7/L12 K02935 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L10 K02864 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L1 K02863 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L11 K02867 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S2 K02967 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S15 K02956 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L35 K02916 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L20 K02887 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L34 K02914 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L9 K02939 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S18 K02963 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S6 K02990 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L21 K02888 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L27 K02899 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L28 K02902 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L33 K02913 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L32 K02911 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L31 K02909 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L25 K02897 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S16 K02959 M00178 Ribosome, bacteria 0,0 +large subunit ribosomal protein L19 K02884 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S20 K02968 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S1 K02945 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S21 K02970 M00178 Ribosome, bacteria 0,0 +small subunit ribosomal protein S10 K02946 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L3 K02906 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L4e K02930 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L23 K02892 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L2 K02886 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S19 K02965 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L22 K02890 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S3 K02982 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L29 K02904 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S17 K02961 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L14 K02874 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L24 K02895 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S4e K02987 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L5 K02931 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S14 K02954 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S8 K02994 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L6 K02933 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L32e K02912 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L19e K02885 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L18 K02881 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S5 K02988 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L30 K02907 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L15 K02876 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S13 K02952 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S11 K02948 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S4 K02986 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L18e K02883 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L13 K02871 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S9 K02996 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S7 K02992 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S12 K02950 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L7Ae K02936 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S28e K02979 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L24e K02896 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L12 K02869 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L10 K02864 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L1 K02863 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L11 K02867 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S2 K02967 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S15 K02956 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S27e K02978 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L44e K02929 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L15e K02877 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S3Ae K02984 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S6e K02991 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S24e K02974 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S27Ae K02977 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S17e K02962 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L31e K02910 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L39e K02924 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L10e K02866 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L21e K02889 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L37e K02922 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L37Ae K02921 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S8e K02995 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S19e K02966 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L40e K02927 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein LX K02944 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S26e K02976 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S25e K02975 M00179 Ribosome, archaea 0,0 +small subunit ribosomal protein S30e K02983 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L13e K02873 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L35Ae K02917 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L41e K02928 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L34e K02915 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L14e K02875 M00179 Ribosome, archaea 0,0 +large subunit ribosomal protein L30e K02908 M00179 Ribosome, archaea 0,0 +RPB1; DNA-directed RNA polymerase II subunit RPB1 [EC:2.7.7.6] K03006 M00180 RNA polymerase II, eukaryotes 0,0 +RPB2; DNA-directed RNA polymerase II subunit RPB2 [EC:2.7.7.6] K03010 M00180 RNA polymerase II, eukaryotes 0,0 +RPB3; DNA-directed RNA polymerase II subunit RPB3 K03011 M00180 RNA polymerase II, eukaryotes 0,0 +RPB11; DNA-directed RNA polymerase II subunit RPB11 K03008 M00180 RNA polymerase II, eukaryotes 0,0 +RPB4; DNA-directed RNA polymerase II subunit RPB4 K03012 M00180 RNA polymerase II, eukaryotes 0,0 +RPB7; DNA-directed RNA polymerase II subunit RPB7 K03015 M00180 RNA polymerase II, eukaryotes 0,0 +RPB9; DNA-directed RNA polymerase II subunit RPB9 K03017 M00180 RNA polymerase II, eukaryotes 0,0 +RPB5; DNA-directed RNA polymerases I, II, and III subunit RPABC1 K03013 M00180 RNA polymerase II, eukaryotes 0,0 +RPB6; DNA-directed RNA polymerases I, II, and III subunit RPABC2 K03014 M00180 RNA polymerase II, eukaryotes 0,0 +RPB8; DNA-directed RNA polymerases I, II, and III subunit RPABC3 K03016 M00180 RNA polymerase II, eukaryotes 0,0 +RPB12; DNA-directed RNA polymerases I, II, and III subunit RPABC4 K03009 M00180 RNA polymerase II, eukaryotes 0,0 +RPB10; DNA-directed RNA polymerases I, II, and III subunit RPABC5 K03007 M00180 RNA polymerase II, eukaryotes 0,0 +RPC1; DNA-directed RNA polymerase III subunit RPC1 [EC:2.7.7.6] K03018 M00181 RNA polymerase III, eukaryotes 0,0 +RPC2; DNA-directed RNA polymerase III subunit RPC2 [EC:2.7.7.6] K03021 M00181 RNA polymerase III, eukaryotes 0,0 +RPC40; DNA-directed RNA polymerases I and III subunit RPAC1 K03027 M00181 RNA polymerase III, eukaryotes 0,0 +RPC19; DNA-directed RNA polymerases I and III subunit RPAC2 K03020 M00181 RNA polymerase III, eukaryotes 0,0 +RPC82; DNA-directed RNA polymerase III subunit RPC3 K03023 M00181 RNA polymerase III, eukaryotes 0,0 +RPC53; DNA-directed RNA polymerase III subunit RPC4 K03026 M00181 RNA polymerase III, eukaryotes 0,0 +RPC37; DNA-directed RNA polymerase III subunit RPC5 K14721 M00181 RNA polymerase III, eukaryotes 0,0 +RPC34; DNA-directed RNA polymerase III subunit RPC6 K03025 M00181 RNA polymerase III, eukaryotes 0,0 +RPC31; DNA-directed RNA polymerase III subunit RPC7 K03024 M00181 RNA polymerase III, eukaryotes 0,0 +RPC25; DNA-directed RNA polymerase III subunit RPC8 K03022 M00181 RNA polymerase III, eukaryotes 0,0 +RPC11; DNA-directed RNA polymerase III subunit RPC10 K03019 M00181 RNA polymerase III, eukaryotes 0,0 +RPB5; DNA-directed RNA polymerases I, II, and III subunit RPABC1 K03013 M00181 RNA polymerase III, eukaryotes 0,0 +RPB6; DNA-directed RNA polymerases I, II, and III subunit RPABC2 K03014 M00181 RNA polymerase III, eukaryotes 0,0 +RPB8; DNA-directed RNA polymerases I, II, and III subunit RPABC3 K03016 M00181 RNA polymerase III, eukaryotes 0,0 +RPB12; DNA-directed RNA polymerases I, II, and III subunit RPABC4 K03009 M00181 RNA polymerase III, eukaryotes 0,0 +RPB10; DNA-directed RNA polymerases I, II, and III subunit RPABC5 K03007 M00181 RNA polymerase III, eukaryotes 0,0 +RPA1; DNA-directed RNA polymerase I subunit RPA1 [EC:2.7.7.6] K02999 M00182 RNA polymerase I, eukaryotes 0,0 +RPA2; DNA-directed RNA polymerase I subunit RPA2 [EC:2.7.7.6] K03002 M00182 RNA polymerase I, eukaryotes 0,0 +RPC40; DNA-directed RNA polymerases I and III subunit RPAC1 K03027 M00182 RNA polymerase I, eukaryotes 0,0 +RPC19; DNA-directed RNA polymerases I and III subunit RPAC2 K03020 M00182 RNA polymerase I, eukaryotes 0,0 +RPA12; DNA-directed RNA polymerase I subunit RPA12 K03000 M00182 RNA polymerase I, eukaryotes 0,0 +RPA14; DNA-directed RNA polymerase I subunit RPA14 K03001 M00182 RNA polymerase I, eukaryotes 0,0 +RPA34; DNA-directed RNA polymerase I subunit RPA34 K03003 M00182 RNA polymerase I, eukaryotes 0,0 +RPA43; DNA-directed RNA polymerase I subunit RPA43 K03004 M00182 RNA polymerase I, eukaryotes 0,0 +RPA49; DNA-directed RNA polymerase I subunit RPA49 K03005 M00182 RNA polymerase I, eukaryotes 0,0 +RPB5; DNA-directed RNA polymerases I, II, and III subunit RPABC1 K03013 M00182 RNA polymerase I, eukaryotes 0,0 +RPB6; DNA-directed RNA polymerases I, II, and III subunit RPABC2 K03014 M00182 RNA polymerase I, eukaryotes 0,0 +RPB8; DNA-directed RNA polymerases I, II, and III subunit RPABC3 K03016 M00182 RNA polymerase I, eukaryotes 0,0 +RPB12; DNA-directed RNA polymerases I, II, and III subunit RPABC4 K03009 M00182 RNA polymerase I, eukaryotes 0,0 +RPB10; DNA-directed RNA polymerases I, II, and III subunit RPABC5 K03007 M00182 RNA polymerase I, eukaryotes 0,0 +rpoA; DNA-directed RNA polymerase subunit alpha [EC:2.7.7.6] K03040 M00183 RNA polymerase, bacteria 0,0 +rpoB; DNA-directed RNA polymerase subunit beta [EC:2.7.7.6] K03043 M00183 RNA polymerase, bacteria 0,0 +rpoC; DNA-directed RNA polymerase subunit beta' [EC:2.7.7.6] K03046 M00183 RNA polymerase, bacteria 0,0 +rpoBC; DNA-directed RNA polymerase subunit beta-beta' [EC:2.7.7.6] K13797 M00183 RNA polymerase, bacteria 0,0 +rpoZ; DNA-directed RNA polymerase subunit omega [EC:2.7.7.6] K03060 M00183 RNA polymerase, bacteria 0,0 +rpoE; DNA-directed RNA polymerase subunit delta K03048 M00183 RNA polymerase, bacteria 0,0 +"rpoA2; DNA-directed RNA polymerase subunit A"" [EC:2.7.7.6]" K03042 M00184 RNA polymerase, archaea 0,0 +rpoA1; DNA-directed RNA polymerase subunit A' [EC:2.7.7.6] K03041 M00184 RNA polymerase, archaea 0,0 +rpoB1; DNA-directed RNA polymerase subunit B' [EC:2.7.7.6] K03044 M00184 RNA polymerase, archaea 0,0 +"rpoB2; DNA-directed RNA polymerase subunit B"" [EC:2.7.7.6]" K03045 M00184 RNA polymerase, archaea 0,0 +rpoB; DNA-directed RNA polymerase subunit B [EC:2.7.7.6] K13798 M00184 RNA polymerase, archaea 0,0 +rpoH; DNA-directed RNA polymerase subunit H [EC:2.7.7.6] K03053 M00184 RNA polymerase, archaea 0,0 +rpoK; DNA-directed RNA polymerase subunit K [EC:2.7.7.6] K03055 M00184 RNA polymerase, archaea 0,0 +rpoN; DNA-directed RNA polymerase subunit N [EC:2.7.7.6] K03058 M00184 RNA polymerase, archaea 0,0 +rpoD; DNA-directed RNA polymerase subunit D [EC:2.7.7.6] K03047 M00184 RNA polymerase, archaea 0,0 +rpoE1; DNA-directed RNA polymerase subunit E' [EC:2.7.7.6] K03049 M00184 RNA polymerase, archaea 0,0 +"rpoE2; DNA-directed RNA polymerase subunit E"" [EC:2.7.7.6]" K03050 M00184 RNA polymerase, archaea 0,0 +rpoL; DNA-directed RNA polymerase subunit L [EC:2.7.7.6] K03056 M00184 RNA polymerase, archaea 0,0 +rpoP; DNA-directed RNA polymerase subunit P [EC:2.7.7.6] K03059 M00184 RNA polymerase, archaea 0,0 +rpoF; DNA-directed RNA polymerase subunit F [EC:2.7.7.6] K03051 M00184 RNA polymerase, archaea 0,0 +rpoG; DNA-directed RNA polymerase subunit G [EC:2.7.7.6] K03052 M00184 RNA polymerase, archaea 0,0 +rpoI; DNA-directed RNA polymerase subunit I [EC:2.7.7.6] K03054 M00184 RNA polymerase, archaea 0,0 +dnaE; DNA polymerase III subunit alpha [EC:2.7.7.7] K02337 M00260 DNA polymerase III complex, bacteria 0,0 +polC; DNA polymerase III subunit alpha, Gram-positive type [EC:2.7.7.7] K03763 M00260 DNA polymerase III complex, bacteria 0,0 +dnaQ; DNA polymerase III subunit epsilon [EC:2.7.7.7] K02342 M00260 DNA polymerase III complex, bacteria 0,0 +rnhA-dnaQ; ribonuclease HI / DNA polymerase III subunit epsilon [EC:3.1.26.4 2.7.7.7] K14159 M00260 DNA polymerase III complex, bacteria 0,0 +holE; DNA polymerase III subunit theta [EC:2.7.7.7] K02345 M00260 DNA polymerase III complex, bacteria 0,0 +dnaN; DNA polymerase III subunit beta [EC:2.7.7.7] K02338 M00260 DNA polymerase III complex, bacteria 0,0 +holA; DNA polymerase III subunit delta [EC:2.7.7.7] K02340 M00260 DNA polymerase III complex, bacteria 0,0 +holB; DNA polymerase III subunit delta' [EC:2.7.7.7] K02341 M00260 DNA polymerase III complex, bacteria 0,0 +dnaX; DNA polymerase III subunit gamma/tau [EC:2.7.7.7] K02343 M00260 DNA polymerase III complex, bacteria 0,0 +holC; DNA polymerase III subunit chi [EC:2.7.7.7] K02339 M00260 DNA polymerase III complex, bacteria 0,0 +holD; DNA polymerase III subunit psi [EC:2.7.7.7] K02344 M00260 DNA polymerase III complex, bacteria 0,0 +POLA1; DNA polymerase alpha, subunit A [EC:2.7.7.7] K02320 M00261 DNA polymerase alpha / primase complex 0,0 +POLA2; DNA polymerase alpha, subunit B [EC:2.7.7.7] K02321 M00261 DNA polymerase alpha / primase complex 0,0 +PRI2; DNA primase large subunit [EC:2.7.7.-] K02685 M00261 DNA polymerase alpha / primase complex 0,0 +PRI1; DNA primase small subunit [EC:2.7.7.-] K02684 M00261 DNA polymerase alpha / primase complex 0,0 +POLD1; DNA polymerase delta, subunit A [EC:2.7.7.7] K02327 M00262 DNA polymerase delta complex 0,0 +POLD2; DNA polymerase delta, subunit B [EC:2.7.7.7] K02328 M00262 DNA polymerase delta complex 0,0 +POLD3; DNA polymerase delta, subunit C [EC:2.7.7.7] K03504 M00262 DNA polymerase delta complex 0,0 +POLD4; DNA polymerase delta, subunit D [EC:2.7.7.7] K03505 M00262 DNA polymerase delta complex 0,0 +POLE1; DNA polymerase epsilon, subunit A [EC:2.7.7.7] K02324 M00263 DNA polymerase epsilon complex 0,0 +POLE2; DNA Polymerase epsilon, subunit B [EC:2.7.7.7] K02325 M00263 DNA polymerase epsilon complex 0,0 +POLE3; DNA Polymerase epsilon, subunit C [EC:2.7.7.7] K02326 M00263 DNA polymerase epsilon complex 0,0 +POLE4; DNA polymerase epsilon, subunit D [EC:2.7.7.7] K03506 M00263 DNA polymerase epsilon complex 0,0 +DPB1; DNA polymerase II large subunit [EC:2.7.7.7] K02322 M00264 DNA polymerase II complex, archaea 0,0 +DPB2; DNA polymerase II small subunit [EC:2.7.7.7] K02323 M00264 DNA polymerase II complex, archaea 0,0 +POLZ1, rev3; DNA polymerase zeta subunit K02350 M00293 DNA polymerase zeta complex 0,0 +POLZ2, rev7; DNA polymerase zeta subunit K03508 M00293 DNA polymerase zeta complex 0,0 +MAD2L2; mitotic spindle assembly checkpoint protein MAD2B K13728 M00293 DNA polymerase zeta complex 0,0 +POLG1; DNA polymerase gamma subunit [EC:2.7.7.7] [COG:COG0749] [GO:0003895] K02332 M00294 DNA polymerase gamma complex 0,0 +POLG2; DNA polymerase gamma2 subunit [EC:2.7.7.7] [GO:0003895] K02333 M00294 DNA polymerase gamma complex 0,0 pyruvate dehydrogenase complex [EC:1.2.4.1 2.3.1.12 1.8.1.4] [RN:R00209] K00163 M00307 Pyruvate oxidation, pyruvate => acetyl-CoA 0,0 C00024 Acetyl-CoA C00022 Pyruvate pyruvate dehydrogenase complex [EC:1.2.4.1 2.3.1.12 1.8.1.4] [RN:R00209] K00161 M00307 Pyruvate oxidation, pyruvate => acetyl-CoA 0,0 C00024 Acetyl-CoA C00022 Pyruvate pyruvate dehydrogenase complex [EC:1.2.4.1 2.3.1.12 1.8.1.4] [RN:R00209] K00162 M00307 Pyruvate oxidation, pyruvate => acetyl-CoA 0,0 C00024 Acetyl-CoA C00022 Pyruvate @@ -1922,8 +1922,8 @@ phosphosulfolactate synthase [EC:4.4.1.19] [RN:R07476] K08097 M00358 Coenzyme M L-2-hydroxycarboxylate dehydrogenase (NAD+) [EC:1.1.1.337] [RN:R07136] K05884 M00358 Coenzyme M biosynthesis 2,0 C05528 3-Sulfopyruvate C11537 (2R)-3-Sulfolactate sulfopyruvate decarboxylase [EC:4.1.1.79] [RN:R05774] K13039 M00358 Coenzyme M biosynthesis 3,0 C00593 Sulfoacetaldehyde C05528 3-Sulfopyruvate sulfopyruvate decarboxylase [EC:4.1.1.79] [RN:R05774] K06034 M00358 Coenzyme M biosynthesis 3,0 C00593 Sulfoacetaldehyde C05528 3-Sulfopyruvate -stxA; shiga toxin subunit A K11006 M00363 EHEC pathogenicity signature, Shiga toxin 0,0 -stxB; shiga toxin subunit B K11007 M00363 EHEC pathogenicity signature, Shiga toxin 1,0 +stxA; shiga toxin subunit A K11006 M00363 EHEC pathogenicity signature, Shiga toxin 0,0 +stxB; shiga toxin subunit B K11007 M00363 EHEC pathogenicity signature, Shiga toxin 1,0 IPP <-> DMPP [EC:5.3.3.2] [RN:R01123] K01823 M00364 C10-C20 isoprenoid biosynthesis, bacteria 0,0 C00235 Dimethylallyl diphosphate (DMPP) C00129 Isopentenyl diphosphate (IPP) DMPP -> GPP -> FPP [EC:2.5.1.1 2.5.1.10] [RN:R01658 R02003] K00795 M00364 C10-C20 isoprenoid biosynthesis, bacteria 1,0 C00448 trans,trans-Farnesyl diphosphate (FPP) C00341,C00129 Geranyl diphosphate (GPP),Isopentenyl diphosphate (IPP) DMPP -> GPP -> FPP -> GGPP [EC:2.5.1.1 2.5.1.10 2.5.1.29] [RN:R01658 R02003 R02061] K13789 M00364 C10-C20 isoprenoid biosynthesis, bacteria 1,1 C00353 Geranylgeranyl diphosphate (GGPP) C00448,C00129 trans,trans-Farnesyl diphosphate (FPP),Isopentenyl diphosphate (IPP) @@ -2029,27 +2029,27 @@ acetyl-CoA decarbonylase/synthase complex [EC:2.3.1.-] [RN:R10243] K00197 M00377 acetyl-CoA decarbonylase/synthase complex [EC:2.3.1.-] [RN:R10243] K00194 M00377 Reductive acetyl-CoA pathway (Wood-Ljungdahl pathway) 6,0 C00101,C00024 Tetrahydrofolate,Acetyl-CoA C00237,C00440 CO,5-Methyltetrahydrofolate LPPG:FO 2-phospho-L-lactate transferase [EC:2.7.8.28] [RN:R09398] K11212 M00378 F420 biosynthesis 0,0 C19153 Coenzyme F420-0 C19155,C19154 (2S)-Lactyl-2-diphospho-5'-guanosine,7,8-Didemethyl-8-hydroxy-5-deazariboflavin coenzyme F420-0:L-glutamate ligase / coenzyme F420-1:gamma-L-glutamate ligase [EC:6.3.2.31 6.3.2.34] [RN:R09399 R09400] K12234 M00378 F420 biosynthesis 1,0 C00876 Coenzyme F420 C19152 Coenzyme F420-1 -elongation of very long chain fatty acids protein [EC:2.3.1.199] K10247 M00415 Fatty acid elongation in endoplasmic reticulum 0,0 -elongation of very long chain fatty acids protein [EC:2.3.1.199] K10205 M00415 Fatty acid elongation in endoplasmic reticulum 0,1 -elongation of very long chain fatty acids protein [EC:2.3.1.199] K10248 M00415 Fatty acid elongation in endoplasmic reticulum 0,2 -elongation of very long chain fatty acids protein [EC:2.3.1.199] K10249 M00415 Fatty acid elongation in endoplasmic reticulum 0,3 -elongation of very long chain fatty acids protein [EC:2.3.1.199] K10244 M00415 Fatty acid elongation in endoplasmic reticulum 0,4 -elongation of very long chain fatty acids protein [EC:2.3.1.199] K10203 M00415 Fatty acid elongation in endoplasmic reticulum 0,5 -elongation of very long chain fatty acids protein [EC:2.3.1.199] K10250 M00415 Fatty acid elongation in endoplasmic reticulum 0,6 -elongation of very long chain fatty acids protein [EC:2.3.1.199] K15397 M00415 Fatty acid elongation in endoplasmic reticulum 0,7 -elongation of very long chain fatty acids protein [EC:2.3.1.199] K10245 M00415 Fatty acid elongation in endoplasmic reticulum 0,8 -elongation of very long chain fatty acids protein [EC:2.3.1.199] K10246 M00415 Fatty acid elongation in endoplasmic reticulum 0,9 -beta-keto reductase [EC:1.1.1.330] K10251 M00415 Fatty acid elongation in endoplasmic reticulum 1,0 -3-hydroxy acyl-CoA dehydratase [EC:4.2.1.134] K10703 M00415 Fatty acid elongation in endoplasmic reticulum 2,0 -enoyl reductase [EC:1.3.1.93] K10258 M00415 Fatty acid elongation in endoplasmic reticulum 3,0 +elongation of very long chain fatty acids protein [EC:2.3.1.199] K10247 M00415 Fatty acid elongation in endoplasmic reticulum 0,0 +elongation of very long chain fatty acids protein [EC:2.3.1.199] K10205 M00415 Fatty acid elongation in endoplasmic reticulum 0,1 +elongation of very long chain fatty acids protein [EC:2.3.1.199] K10248 M00415 Fatty acid elongation in endoplasmic reticulum 0,2 +elongation of very long chain fatty acids protein [EC:2.3.1.199] K10249 M00415 Fatty acid elongation in endoplasmic reticulum 0,3 +elongation of very long chain fatty acids protein [EC:2.3.1.199] K10244 M00415 Fatty acid elongation in endoplasmic reticulum 0,4 +elongation of very long chain fatty acids protein [EC:2.3.1.199] K10203 M00415 Fatty acid elongation in endoplasmic reticulum 0,5 +elongation of very long chain fatty acids protein [EC:2.3.1.199] K10250 M00415 Fatty acid elongation in endoplasmic reticulum 0,6 +elongation of very long chain fatty acids protein [EC:2.3.1.199] K15397 M00415 Fatty acid elongation in endoplasmic reticulum 0,7 +elongation of very long chain fatty acids protein [EC:2.3.1.199] K10245 M00415 Fatty acid elongation in endoplasmic reticulum 0,8 +elongation of very long chain fatty acids protein [EC:2.3.1.199] K10246 M00415 Fatty acid elongation in endoplasmic reticulum 0,9 +beta-keto reductase [EC:1.1.1.330] K10251 M00415 Fatty acid elongation in endoplasmic reticulum 1,0 +3-hydroxy acyl-CoA dehydratase [EC:4.2.1.134] K10703 M00415 Fatty acid elongation in endoplasmic reticulum 2,0 +enoyl reductase [EC:1.3.1.93] K10258 M00415 Fatty acid elongation in endoplasmic reticulum 3,0 qoxB; cytochrome aa3-600 menaquinol oxidase subunit I [EC:1.10.3.12] K02827 M00416 Cytochrome aa3-600 menaquinol oxidase 0,0 C00828,C00001 Menaquinone,H2O C05819,C00007 Menaquinol,Oxygen qoxA; cytochrome aa3-600 menaquinol oxidase subunit II [EC:1.10.3.12] K02826 M00416 Cytochrome aa3-600 menaquinol oxidase 0,0 C00828,C00001 Menaquinone,H2O C05819,C00007 Menaquinol,Oxygen qoxC; cytochrome aa3-600 menaquinol oxidase subunit III [EC:1.10.3.12] K02828 M00416 Cytochrome aa3-600 menaquinol oxidase 0,0 C00828,C00001 Menaquinone,H2O C05819,C00007 Menaquinol,Oxygen qoxD; cytochrome aa3-600 menaquinol oxidase subunit IV [EC:1.10.3.12] K02829 M00416 Cytochrome aa3-600 menaquinol oxidase 0,0 C00828,C00001 Menaquinone,H2O C05819,C00007 Menaquinol,Oxygen -cyoA; cytochrome o ubiquinol oxidase subunit II [EC:1.10.3.10] K02297 M00417 Cytochrome o ubiquinol oxidase 0,0 -cyoB; cytochrome o ubiquinol oxidase subunit I [EC:1.10.3.10] K02298 M00417 Cytochrome o ubiquinol oxidase 0,0 -cyoC; cytochrome o ubiquinol oxidase subunit III K02299 M00417 Cytochrome o ubiquinol oxidase 0,0 -cyoD; cytochrome o ubiquinol oxidase operon protein cyoD K02300 M00417 Cytochrome o ubiquinol oxidase 0,0 +cyoA; cytochrome o ubiquinol oxidase subunit II [EC:1.10.3.10] K02297 M00417 Cytochrome o ubiquinol oxidase 0,0 +cyoB; cytochrome o ubiquinol oxidase subunit I [EC:1.10.3.10] K02298 M00417 Cytochrome o ubiquinol oxidase 0,0 +cyoC; cytochrome o ubiquinol oxidase subunit III K02299 M00417 Cytochrome o ubiquinol oxidase 0,0 +cyoD; cytochrome o ubiquinol oxidase operon protein cyoD K02300 M00417 Cytochrome o ubiquinol oxidase 0,0 benzylsuccinate synthase [EC:4.1.99.11] [RN:R05598] K07540 M00418 Toluene degradation, anaerobic, toluene => benzoyl-CoA 0,0 C09816 Benzylsuccinate C01455 Toluene benzylsuccinate CoA-transferase subunit [EC:2.8.3.15] [RN:R05588] K07543 M00418 Toluene degradation, anaerobic, toluene => benzoyl-CoA 1,0 C09817 Benzylsuccinyl-CoA C09816 Benzylsuccinate benzylsuccinate CoA-transferase subunit [EC:2.8.3.15] [RN:R05588] K07544 M00418 Toluene degradation, anaerobic, toluene => benzoyl-CoA 1,0 C09817 Benzylsuccinyl-CoA C09816 Benzylsuccinate @@ -2138,7 +2138,7 @@ nitrate reductase (NAD(P)H) [EC:1.7.1.1 1.7.1.2 1.7.1.3] [RN:R00794 R00796] K105 assimilatory nitrate reductase [EC:1.7.99.-] [RN:R00798] K00372 M00531 Assimilatory nitrate reduction, nitrate => ammonia 0,2 C00088 Nitrite C00244 Nitrate assimilatory nitrate reductase [EC:1.7.99.-] [RN:R00798] K00360 M00531 Assimilatory nitrate reduction, nitrate => ammonia 0,2 C00088 Nitrite C00244 Nitrate assimilatory nitrite reductase [EC:1.7.7.1] [RN:R00790] K00366 M00531 Assimilatory nitrate reduction, nitrate => ammonia 1,0 C00014 NH3 C00088 Nitrite -assimilatory nitrite reductase [EC:1.7.1.4] [RN:R00787 R00789] K17877 M00531 Assimilatory nitrate reduction, nitrate => ammonia 1,1 +assimilatory nitrite reductase [EC:1.7.1.4] [RN:R00787 R00789] K17877 M00531 Assimilatory nitrate reduction, nitrate => ammonia 1,1 glycine cleavage system [RN:R01221] K00281 M00532 Photorespiration 0,0 C00014 NH3 C00037 Glycine glycine cleavage system [RN:R01221] K00605 M00532 Photorespiration 0,0 C00014 NH3 C00037 Glycine glycine cleavage system [RN:R01221] K00382 M00532 Photorespiration 0,0 C00014 NH3 C00037 Glycine @@ -2195,23 +2195,23 @@ benzoyl-CoA reductase [EC:1.3.-.-] [RN:R10961] K19516 M00541 Benzoyl-CoA degrada cyclohexa-1,5-dienecarbonyl-CoA hydratase [EC:4.2.1.100] [RN:R05597] K07537 M00541 Benzoyl-CoA degradation, benzoyl-CoA => 3-hydroxypimeloyl-CoA 1,0 C06749 6-Hydroxycyclohex-1-enecarbonyl-CoA C06322 S-1,5-Cyclohexadiene-1-carboxylate coenzymeA 6-hydroxycyclohex-1-ene-1-carboxyl-CoA dehydrogenase [EC:1.1.1.368] [RN:R05581] K07538 M00541 Benzoyl-CoA degradation, benzoyl-CoA => 3-hydroxypimeloyl-CoA 2,0 C09821 6-Ketoxycyclohex-1-ene-1-carboxyl-CoA C06749 6-Hydroxycyclohex-1-enecarbonyl-CoA 6-oxo-cyclohex-1-ene-carbonyl-CoA hydrolase [EC:3.7.1.21] [RN:R05594] K07539 M00541 Benzoyl-CoA degradation, benzoyl-CoA => 3-hydroxypimeloyl-CoA 3,0 C06714 3-Hydroxypimeloyl-CoA C09821 6-Ketoxycyclohex-1-ene-1-carboxyl-CoA -yscF; type III secretion protein SctF K03221 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 -yscC; type III secretion protein SctC K03219 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 -yscJ; type III secretion protein SctJ K03222 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 -yscR; type III secretion protein SctR K03226 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 -yscS; type III secretion protein SctS K03227 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 -yscT; type III secretion protein SctT K03228 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 -yscU; type III secretion protein SctU K03229 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 -yscV; type III secretion protein SctV K03230 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 -yscN; ATP synthase in type III secretion protein SctN [EC:3.6.3.14] K03224 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 -yscQ; type III secretion protein SctQ K03225 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 -tir; translocated intimin receptor K12784 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 1,0 -map; LEE-encoded effector Map K12787 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 2,0 -espG; LEE-encoded effector EspG K12785 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 3,0 -espF; LEE-encoded effector EspF K12786 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 4,0 -espH; LEE-encoded effector EspH K12788 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 5,0 -nleA; non-LEE-encoded effector NleA K16041 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 6,0 -nleH; non-LEE-encoded effector NleH K16042 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 7,0 +yscF; type III secretion protein SctF K03221 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 +yscC; type III secretion protein SctC K03219 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 +yscJ; type III secretion protein SctJ K03222 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 +yscR; type III secretion protein SctR K03226 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 +yscS; type III secretion protein SctS K03227 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 +yscT; type III secretion protein SctT K03228 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 +yscU; type III secretion protein SctU K03229 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 +yscV; type III secretion protein SctV K03230 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 +yscN; ATP synthase in type III secretion protein SctN [EC:3.6.3.14] K03224 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 +yscQ; type III secretion protein SctQ K03225 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 0,0 +tir; translocated intimin receptor K12784 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 1,0 +map; LEE-encoded effector Map K12787 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 2,0 +espG; LEE-encoded effector EspG K12785 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 3,0 +espF; LEE-encoded effector EspF K12786 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 4,0 +espH; LEE-encoded effector EspH K12788 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 5,0 +nleA; non-LEE-encoded effector NleA K16041 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 6,0 +nleH; non-LEE-encoded effector NleH K16042 M00542 EHEC/EPEC pathogenicity signature, T3SS and effectors 7,0 biphenyl 2,3-dioxygenase [EC:1.14.12.18] [RN:R05263 R05264 R05261 R05262] K08689 M00543 Biphenyl degradation, biphenyl => 2-oxopent-4-enoate + benzoate 0,0 C06585 cis-2,3-Dihydro-2,3-dihydroxy-4'-chlorobiphenyl C06584 4-Chlorobiphenyl biphenyl 2,3-dioxygenase [EC:1.14.12.18] [RN:R05263 R05264 R05261 R05262] K15750 M00543 Biphenyl degradation, biphenyl => 2-oxopent-4-enoate + benzoate 0,0 C06585 cis-2,3-Dihydro-2,3-dihydroxy-4'-chlorobiphenyl C06584 4-Chlorobiphenyl biphenyl 2,3-dioxygenase [EC:1.14.12.18] [RN:R05263 R05264 R05261 R05262] K18087 M00543 Biphenyl degradation, biphenyl => 2-oxopent-4-enoate + benzoate 0,0 C06585 cis-2,3-Dihydro-2,3-dihydroxy-4'-chlorobiphenyl C06584 4-Chlorobiphenyl @@ -2249,7 +2249,7 @@ urate oxidase [EC:1.7.3.3] [RN:R02106] K00365 M00546 Purine degradation, xanthin urate oxidase [EC:1.7.3.3] [RN:R02106] K16838 M00546 Purine degradation, xanthine => urea 1,1 C11821 5-Hydroxyisourate C00366 Urate FAD-dependent urate hydroxylase [EC:1.14.13.113] [RN:R09514] K16839 M00546 Purine degradation, xanthine => urea 1,2 C11821 5-Hydroxyisourate C00366 Urate FAD-dependent urate hydroxylase [EC:1.14.13.113] [RN:R09514] K22879 M00546 Purine degradation, xanthine => urea 1,3 C11821 5-Hydroxyisourate C00366 Urate -5-hydroxyisourate hydrolase / 2-oxo-4-hydroxy-4-carboxy-5-ureidoimidazoline decarboxylase [EC:3.5.2.17 4.1.1.97] [RN:R06601+R06604] K13484 M00546 Purine degradation, xanthine => urea 2,0 +5-hydroxyisourate hydrolase / 2-oxo-4-hydroxy-4-carboxy-5-ureidoimidazoline decarboxylase [EC:3.5.2.17 4.1.1.97] [RN:R06601+R06604] K13484 M00546 Purine degradation, xanthine => urea 2,0 5-hydroxyisourate hydrolase [EC:3.5.2.17] [RN:R06601] K07127 M00546 Purine degradation, xanthine => urea 2,1,0,0 C12248 5-Hydroxy-2-oxo-4-ureido-2,5-dihydro-1H-imidazole-5-carboxylate C11821 5-Hydroxyisourate 2-oxo-4-hydroxy-4-carboxy-5-ureidoimidazoline decarboxylase [EC:4.1.1.97] [RN:R06604] K13485 M00546 Purine degradation, xanthine => urea 2,1,1,0 C02350 (S)(+)-Allantoin C12248 5-Hydroxy-2-oxo-4-ureido-2,5-dihydro-1H-imidazole-5-carboxylate urate oxidase [EC:1.7.3.3] [RN:R02106] K16838 M00546 Purine degradation, xanthine => urea 2,1,1,1 C11821 5-Hydroxyisourate C00366 Urate @@ -2322,33 +2322,33 @@ F420-non-reducing hydrogenase [EC:1.8.98.5] [RN:R11943] K14126 M00563 Methanogen F420-non-reducing hydrogenase [EC:1.8.98.5] [RN:R11943] K14128 M00563 Methanogenesis, methylamine/dimethylamine/trimethylamine => methane 3,3 C04628 Coenzyme B C04832 Coenzyme M 7-mercaptoheptanoylthreonine-phosphate heterodisulfide formate dehydrogenase (coenzyme F420) [EC:1.8.98.6] [RN:R11944] K22516 M00563 Methanogenesis, methylamine/dimethylamine/trimethylamine => methane 3,3 C04628 Coenzyme B C04832 Coenzyme M 7-mercaptoheptanoylthreonine-phosphate heterodisulfide formate dehydrogenase (coenzyme F420) [EC:1.8.98.6] [RN:R11944] K00125 M00563 Methanogenesis, methylamine/dimethylamine/trimethylamine => methane 3,3 C04628 Coenzyme B C04832 Coenzyme M 7-mercaptoheptanoylthreonine-phosphate heterodisulfide -cagA; cytotoxicity-associated immunodominant antigen K15842 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 0,0 -cag1; cag pathogenicity island protein 1 K12086 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 1,0 -cag2; cag pathogenicity island protein 2 K12087 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 2,0 -cag3; cag pathogenicity island protein 3 K12088 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 3,0 -cag4; cag pathogenicity island protein 4 K12089 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 4,0 -cag5; cag pathogenicity island protein 5 K12090 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 5,0 -virB11; type IV secretion system protein VirB11 K03196 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 6,0 -cag6; cag pathogenicity island protein 6 K12091 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 7,0 -cag7; cag pathogenicity island protein 7 K12092 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 8,0 -cag8; cag pathogenicity island protein 8 K12093 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 9,0 -cag9; cag pathogenicity island protein 9 K12094 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 10,0 -cag10; cag pathogenicity island protein 10 K12095 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 11,0 -cag11; cag pathogenicity island protein 11 K12096 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 12,0 -cag12; cag pathogenicity island protein 12 K12097 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 13,0 -cag13; cag pathogenicity island protein 13 K12098 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 14,0 -cag14; cag pathogenicity island protein 14 K12099 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 15,0 -cag15; cag pathogenicity island protein 15 K12100 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 16,0 -cag16; cag pathogenicity island protein 16 K12101 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 17,0 -cag17; cag pathogenicity island protein 17 K12102 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 18,0 -cag18; cag pathogenicity island protein 18 K12103 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 19,0 -cag19; cag pathogenicity island protein 19 K12104 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 20,0 -cag20; cag pathogenicity island protein 20 K12105 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 21,0 -cag21; cag pathogenicity island protein 21 K12106 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 22,0 -cag22; cag pathogenicity island protein 22 K12107 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 23,0 -cag23; cag pathogenicity island protein 23 K12108 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 24,0 -cag24; cag pathogenicity island protein 24 K12109 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 25,0 -cag25; cag pathogenicity island protein 25 K12110 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 26,0 +cagA; cytotoxicity-associated immunodominant antigen K15842 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 0,0 +cag1; cag pathogenicity island protein 1 K12086 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 1,0 +cag2; cag pathogenicity island protein 2 K12087 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 2,0 +cag3; cag pathogenicity island protein 3 K12088 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 3,0 +cag4; cag pathogenicity island protein 4 K12089 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 4,0 +cag5; cag pathogenicity island protein 5 K12090 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 5,0 +virB11; type IV secretion system protein VirB11 K03196 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 6,0 +cag6; cag pathogenicity island protein 6 K12091 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 7,0 +cag7; cag pathogenicity island protein 7 K12092 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 8,0 +cag8; cag pathogenicity island protein 8 K12093 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 9,0 +cag9; cag pathogenicity island protein 9 K12094 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 10,0 +cag10; cag pathogenicity island protein 10 K12095 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 11,0 +cag11; cag pathogenicity island protein 11 K12096 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 12,0 +cag12; cag pathogenicity island protein 12 K12097 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 13,0 +cag13; cag pathogenicity island protein 13 K12098 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 14,0 +cag14; cag pathogenicity island protein 14 K12099 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 15,0 +cag15; cag pathogenicity island protein 15 K12100 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 16,0 +cag16; cag pathogenicity island protein 16 K12101 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 17,0 +cag17; cag pathogenicity island protein 17 K12102 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 18,0 +cag18; cag pathogenicity island protein 18 K12103 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 19,0 +cag19; cag pathogenicity island protein 19 K12104 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 20,0 +cag20; cag pathogenicity island protein 20 K12105 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 21,0 +cag21; cag pathogenicity island protein 21 K12106 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 22,0 +cag22; cag pathogenicity island protein 22 K12107 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 23,0 +cag23; cag pathogenicity island protein 23 K12108 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 24,0 +cag24; cag pathogenicity island protein 24 K12109 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 25,0 +cag25; cag pathogenicity island protein 25 K12110 M00564 Helicobacter pylori pathogenicity signature, cagA pathogenicity island 26,0 glgC; glucose-1-phosphate adenylyltransferase [EC:2.7.7.27] [RN:R00948] K00975 M00565 Trehalose biosynthesis, D-glucose 1P => trehalose 0,0 C00498 ADP-glucose C00103 D-Glucose 1-phosphate starch synthase [EC:2.4.1.21] [RN:R02421] K00703 M00565 Trehalose biosynthesis, D-glucose 1P => trehalose 1,0 C00718 Amylose C00498 ADP-glucose 1,4-alpha-glucan branching enzyme [EC:2.4.1.18] [RN:R02110] K00700 M00565 Trehalose biosynthesis, D-glucose 1P => trehalose 2,0 C00369 Starch C00718 Amylose @@ -2437,20 +2437,20 @@ adenosylmethionine---8-amino-7-oxononanoate aminotransferase [EC:2.6.1.62] [RN:R lysine---8-amino-7-oxononanoate aminotransferase [EC:2.6.1.105] [RN:R10699] K19563 M00573 Biotin biosynthesis, BioI pathway, long-chain-acyl-ACP => pimeloyl-ACP => biotin 2,1 C01037 7,8-Diaminononanoate C01092 8-Amino-7-oxononanoate dethiobiotin synthetase [EC:6.3.3.3] [RN:R03182] K01935 M00573 Biotin biosynthesis, BioI pathway, long-chain-acyl-ACP => pimeloyl-ACP => biotin 3,0 C01909 Dethiobiotin C01037 7,8-Diaminononanoate biotin synthetase [EC:2.8.1.6] [RN:R01078] K01012 M00573 Biotin biosynthesis, BioI pathway, long-chain-acyl-ACP => pimeloyl-ACP => biotin 4,0 C00120 Biotin C01909 Dethiobiotin -ptxA; pertussis toxin subunit 1 [EC:2.4.2.-] K11023 M00574 Pertussis pathogenicity signature, pertussis toxin 0,0 -ptxB; pertussis toxin subunit 2 K11024 M00574 Pertussis pathogenicity signature, pertussis toxin 1,0 -ptxC; pertussis toxin subunit 3 K11025 M00574 Pertussis pathogenicity signature, pertussis toxin 2,0 -ptxD; pertussis toxin subunit 4 K11026 M00574 Pertussis pathogenicity signature, pertussis toxin 3,0 -ptxE; pertussis toxin subunit 5 K11027 M00574 Pertussis pathogenicity signature, pertussis toxin 4,0 -cyaA; bifunctional hemolysin/adenylate cyclase [EC:4.6.1.1] K22944 M00575 Pertussis pathogenicity signature, T1SS 0,0 -hlyB; ATP-binding cassette, subfamily B, bacterial HlyB/CyaB K11004 M00575 Pertussis pathogenicity signature, T1SS 1,0 -cyaC; cytolysin-activating lysine-acyltransferase [EC:2.3.1.-] K07389 M00575 Pertussis pathogenicity signature, T1SS 2,0 -hlyD; hemolysin D K11003 M00575 Pertussis pathogenicity signature, T1SS 3,0 -tolC; outer membrane channel protein K12340 M00575 Pertussis pathogenicity signature, T1SS 4,0 -ctxA; cholera enterotoxin subunit A [EC:2.4.2.36] K10928 M00576 ETEC pathogenicity signature, heat-labile and heat-stable enterotoxins 0,0 -ctxB; cholera enterotoxin subunit B K10929 M00576 ETEC pathogenicity signature, heat-labile and heat-stable enterotoxins 0,0 -sta; heat-stable enterotoxin STa/STI K16883 M00576 ETEC pathogenicity signature, heat-labile and heat-stable enterotoxins 1,0 -stb; heat-stable enterotoxin STb/STII K16884 M00576 ETEC pathogenicity signature, heat-labile and heat-stable enterotoxins 1,1 +ptxA; pertussis toxin subunit 1 [EC:2.4.2.-] K11023 M00574 Pertussis pathogenicity signature, pertussis toxin 0,0 +ptxB; pertussis toxin subunit 2 K11024 M00574 Pertussis pathogenicity signature, pertussis toxin 1,0 +ptxC; pertussis toxin subunit 3 K11025 M00574 Pertussis pathogenicity signature, pertussis toxin 2,0 +ptxD; pertussis toxin subunit 4 K11026 M00574 Pertussis pathogenicity signature, pertussis toxin 3,0 +ptxE; pertussis toxin subunit 5 K11027 M00574 Pertussis pathogenicity signature, pertussis toxin 4,0 +cyaA; bifunctional hemolysin/adenylate cyclase [EC:4.6.1.1] K22944 M00575 Pertussis pathogenicity signature, T1SS 0,0 +hlyB; ATP-binding cassette, subfamily B, bacterial HlyB/CyaB K11004 M00575 Pertussis pathogenicity signature, T1SS 1,0 +cyaC; cytolysin-activating lysine-acyltransferase [EC:2.3.1.-] K07389 M00575 Pertussis pathogenicity signature, T1SS 2,0 +hlyD; hemolysin D K11003 M00575 Pertussis pathogenicity signature, T1SS 3,0 +tolC; outer membrane channel protein K12340 M00575 Pertussis pathogenicity signature, T1SS 4,0 +ctxA; cholera enterotoxin subunit A [EC:2.4.2.36] K10928 M00576 ETEC pathogenicity signature, heat-labile and heat-stable enterotoxins 0,0 +ctxB; cholera enterotoxin subunit B K10929 M00576 ETEC pathogenicity signature, heat-labile and heat-stable enterotoxins 0,0 +sta; heat-stable enterotoxin STa/STI K16883 M00576 ETEC pathogenicity signature, heat-labile and heat-stable enterotoxins 1,0 +stb; heat-stable enterotoxin STb/STII K16884 M00576 ETEC pathogenicity signature, heat-labile and heat-stable enterotoxins 1,1 6-carboxyhexanoate--CoA ligase [EC:6.2.1.14] [RN:R03209] K01906 M00577 Biotin biosynthesis, BioW pathway, pimelate => pimeloyl-CoA => biotin 0,0 C01063 6-Carboxyhexanoyl-CoA C02656 Pimelate 8-amino-7-oxononanoate synthase [EC:2.3.1.47] [RN:R03210] K00652 M00577 Biotin biosynthesis, BioW pathway, pimelate => pimeloyl-CoA => biotin 1,0 C01092 8-Amino-7-oxononanoate C01063 6-Carboxyhexanoyl-CoA adenosylmethionine---8-amino-7-oxononanoate aminotransferase [EC:2.6.1.62] [RN:R03231] K00833 M00577 Biotin biosynthesis, BioW pathway, pimelate => pimeloyl-CoA => biotin 2,0 C01037 7,8-Diaminononanoate C01092 8-Amino-7-oxononanoate @@ -2480,12 +2480,12 @@ adenylylsulfate reductase [EC:1.8.99.2] [RN:R08553] K00394 M00596 Dissimilatory adenylylsulfate reductase [EC:1.8.99.2] [RN:R08553] K00395 M00596 Dissimilatory sulfate reduction, sulfate => H2S 1,0 C00094 Sulfite C00224 Adenylyl sulfate sulfite reductase, dissimilatory-type [EC:1.8.99.5] [RN:R00861] K11180 M00596 Dissimilatory sulfate reduction, sulfate => H2S 2,0 C00283 Hydrogen sulfide C00094 Sulfite sulfite reductase, dissimilatory-type [EC:1.8.99.5] [RN:R00861] K11181 M00596 Dissimilatory sulfate reduction, sulfate => H2S 2,0 C00283 Hydrogen sulfide C00094 Sulfite -pufL; photosynthetic reaction center L subunit K08928 M00597 Anoxygenic photosystem II 0,0 -pufM; photosynthetic reaction center M subunit K08929 M00597 Anoxygenic photosystem II 0,0 -pscA; photosystem P840 reaction center large subunit K08940 M00598 Anoxygenic photosystem I 0,0 -pscB; photosystem P840 reaction center iron-sulfur protein K08941 M00598 Anoxygenic photosystem I 0,0 -pscC; photosystem P840 reaction center cytochrome c551 K08942 M00598 Anoxygenic photosystem I 0,0 -pscD; photosystem P840 reaction center protein PscD K08943 M00598 Anoxygenic photosystem I 0,0 +pufL; photosynthetic reaction center L subunit K08928 M00597 Anoxygenic photosystem II 0,0 +pufM; photosynthetic reaction center M subunit K08929 M00597 Anoxygenic photosystem II 0,0 +pscA; photosystem P840 reaction center large subunit K08940 M00598 Anoxygenic photosystem I 0,0 +pscB; photosystem P840 reaction center iron-sulfur protein K08941 M00598 Anoxygenic photosystem I 0,0 +pscC; photosystem P840 reaction center cytochrome c551 K08942 M00598 Anoxygenic photosystem I 0,0 +pscD; photosystem P840 reaction center protein PscD K08943 M00598 Anoxygenic photosystem I 0,0 methanogen homocitrate synthase [EC:2.3.3.14 2.3.3.-] [RN:R00271 R08331 R08332] K10977 M00608 2-Oxocarboxylic acid chain extension, 2-oxoglutarate => 2-oxoadipate => 2-oxopimelate => 2-oxosuberate 0,0 C16598 (R)-(Homo)3-citrate C16588,C00024 2-Oxopimelate,Acetyl-CoA methanogen homoaconitase large subunit [EC:4.2.1.114] [RN:R03444 R04371 R09720 R10392 R10393 R10391 R10395 R10396 R10394] K16792 M00608 2-Oxocarboxylic acid chain extension, 2-oxoglutarate => 2-oxoadipate => 2-oxopimelate => 2-oxosuberate 1,0 C16600 (-)-threo-Iso(homo)3-citrate C16598 (R)-(Homo)3-citrate methanogen homoaconitase large subunit [EC:4.2.1.114] [RN:R03444 R04371 R09720 R10392 R10393 R10391 R10395 R10396 R10394] K16793 M00608 2-Oxocarboxylic acid chain extension, 2-oxoglutarate => 2-oxoadipate => 2-oxopimelate => 2-oxosuberate 1,0 C16600 (-)-threo-Iso(homo)3-citrate C16598 (R)-(Homo)3-citrate @@ -2497,7 +2497,7 @@ S-adenosylhomocysteine/5'-methylthioadenosine nucleosidase [EC:3.2.2.9] [RN:R001 S-ribosylhomocysteine lyase [EC:4.4.1.21] [RN:R01291] K07173 M00609 Cysteine biosynthesis, methionine => cysteine 3,0 C00155 L-Homocysteine C03539 S-Ribosyl-L-homocysteine cystathionine beta-synthase (O-acetyl-L-serine) [EC:2.5.1.134] [RN:R10305] K17216 M00609 Cysteine biosynthesis, methionine => cysteine 4,0 C02291 L-Cystathionine C00155 L-Homocysteine cystathionine gamma-lyase [EC:4.4.1.1] [RN:R01001] K17217 M00609 Cysteine biosynthesis, methionine => cysteine 5,0 C00097 L-Cysteine C02291 L-Cystathionine -NRT; MFS transporter, NNP family, nitrate/nitrite transporter K02575 M00615 Nitrate assimilation 0,0 +NRT; MFS transporter, NNP family, nitrate/nitrite transporter K02575 M00615 Nitrate assimilation 0,0 pyruvate ferredoxin oxidoreductase [EC:1.2.7.1] [RN:R01196] K00169 M00620 Incomplete reductive citrate cycle, acetyl-CoA => oxoglutarate 0,0 C00022 Pyruvate C00024 Acetyl-CoA pyruvate ferredoxin oxidoreductase [EC:1.2.7.1] [RN:R01196] K00170 M00620 Incomplete reductive citrate cycle, acetyl-CoA => oxoglutarate 0,0 C00022 Pyruvate C00024 Acetyl-CoA pyruvate ferredoxin oxidoreductase [EC:1.2.7.1] [RN:R01196] K00171 M00620 Incomplete reductive citrate cycle, acetyl-CoA => oxoglutarate 0,0 C00022 Pyruvate C00024 Acetyl-CoA @@ -2530,13 +2530,13 @@ K18075,K18077 terephthalate 1,2-dioxygenase [EC:1.14.12.15] [RN:R05148] K18074 M tphA3 K18075 M00624 Terephthalate degradation, terephthalate => 3,4-dihydroxybenzoate 0,0 C06318 (3S,4R)-3,4-Dihydroxycyclohexa-1,5-diene-1,4-dicarboxylate C06337 Terephthalate tphA1 K18077 M00624 Terephthalate degradation, terephthalate => 3,4-dihydroxybenzoate 0,0 C06318 (3S,4R)-3,4-Dihydroxycyclohexa-1,5-diene-1,4-dicarboxylate C06337 Terephthalate 1,2-dihydroxy-3,5-cyclohexadiene-1,4-dicarboxylate dehydrogenase [EC:1.3.1.53] [RN:R01633] K18076 M00624 Terephthalate degradation, terephthalate => 3,4-dihydroxybenzoate 1,0 C00230 3,4-Dihydroxybenzoate C06318 (3S,4R)-3,4-Dihydroxycyclohexa-1,5-diene-1,4-dicarboxylate -mecR1; methicillin resistance protein K02547 M00625 Methicillin resistance 0,0 -mecI; methicillin resistance regulatory protein K02546 M00625 Methicillin resistance 1,0 -mecA; penicillin-binding protein 2 prime K02545 M00625 Methicillin resistance 2,0 -blaR1; bla regulator protein blaR1 K02172 M00627 beta-Lactam resistance, Bla system 0,0 -blaI; BlaI family transcriptional regulator, penicillinase repressor K02171 M00627 beta-Lactam resistance, Bla system 1,0 -blaZ; beta-lactamase class A BlaZ [EC:3.5.2.6] K18766 M00627 beta-Lactam resistance, Bla system 2,0 -penP; beta-lactamase class A [EC:3.5.2.6] K17836 M00627 beta-Lactam resistance, Bla system 2,1 +mecR1; methicillin resistance protein K02547 M00625 Methicillin resistance 0,0 +mecI; methicillin resistance regulatory protein K02546 M00625 Methicillin resistance 1,0 +mecA; penicillin-binding protein 2 prime K02545 M00625 Methicillin resistance 2,0 +blaR1; bla regulator protein blaR1 K02172 M00627 beta-Lactam resistance, Bla system 0,0 +blaI; BlaI family transcriptional regulator, penicillinase repressor K02171 M00627 beta-Lactam resistance, Bla system 1,0 +blaZ; beta-lactamase class A BlaZ [EC:3.5.2.6] K18766 M00627 beta-Lactam resistance, Bla system 2,0 +penP; beta-lactamase class A [EC:3.5.2.6] K17836 M00627 beta-Lactam resistance, Bla system 2,1 D-galacturonate reductase [EC:1.1.1.-] [RN:R07676 R10565] K18106 M00630 D-Galacturonate degradation (fungi), D-galacturonate => glycerol 0,0 C15930 L-Galactonate C00333 D-Galacturonate D-galacturonate reductase [EC:1.1.1.365] [RN:R07676] K19634 M00630 D-Galacturonate degradation (fungi), D-galacturonate => glycerol 0,1 C15930 L-Galactonate C00333 D-Galacturonate L-galactonate dehydratase [EC:4.2.1.146] [RN:R10532] K18102 M00630 D-Galacturonate degradation (fungi), D-galacturonate => glycerol 1,0 C20680 2-Dehydro-3-deoxy-L-galactonate C15930 L-Galactonate @@ -2576,68 +2576,68 @@ salicylate 5-hydroxylase [EC:1.14.13.172] [RN:R07709 R07710] K18242 M00638 Salic salicylate 5-hydroxylase [EC:1.14.13.172] [RN:R07709 R07710] K18243 M00638 Salicylate degradation, salicylate => gentisate 0,0 C00628 2,5-Dihydroxybenzoate C00805 Salicylate salicylate 5-hydroxylase [EC:1.14.13.172] [RN:R07709 R07710] K14578 M00638 Salicylate degradation, salicylate => gentisate 0,0 C00628 2,5-Dihydroxybenzoate C00805 Salicylate salicylate 5-hydroxylase [EC:1.14.13.172] [RN:R07709 R07710] K14581 M00638 Salicylate degradation, salicylate => gentisate 0,0 C00628 2,5-Dihydroxybenzoate C00805 Salicylate -nfxB; TetR/AcrR family transcriptional regulator, mexCD-oprJ operon repressor K18294 M00639 Multidrug resistance, efflux pump MexCD-OprJ 0,0 -mexC; membrane fusion protein K18295 M00639 Multidrug resistance, efflux pump MexCD-OprJ 1,0 -mexD; multidrug efflux pump K18296 M00639 Multidrug resistance, efflux pump MexCD-OprJ 1,0 -oprJ; multidrug resistance outer membrane protein OprJ K08721 M00639 Multidrug resistance, efflux pump MexCD-OprJ 1,0 -mexT; LysR family transcriptional regulator, mexEF-oprN operon transcriptional activator K18297 M00641 Multidrug resistance, efflux pump MexEF-OprN 0,0 -mexE; membrane fusion protein K18298 M00641 Multidrug resistance, efflux pump MexEF-OprN 1,0 -mexF; multidrug efflux pump K18299 M00641 Multidrug resistance, efflux pump MexEF-OprN 1,0 -oprN; outer membrane protein K18300 M00641 Multidrug resistance, efflux pump MexEF-OprN 1,0 -mexL; TetR/AcrR family transcriptional regulator, mexJK operon transcriptional repressor K18301 M00642 Multidrug resistance, efflux pump MexJK-OprM 0,0 -mexJ; membrane fusion protein K18302 M00642 Multidrug resistance, efflux pump MexJK-OprM 1,0 -mexK; multidrug efflux pump K18303 M00642 Multidrug resistance, efflux pump MexJK-OprM 1,0 -oprM; outer membrane protein K18139 M00642 Multidrug resistance, efflux pump MexJK-OprM 1,0 -mexZ; TetR/AcrR family transcriptional regulator, mexXY operon repressor K18129 M00643 Multidrug resistance, efflux pump MexXY-OprM 0,0 -mexX; membrane fusion protein K18094 M00643 Multidrug resistance, efflux pump MexXY-OprM 1,0 -mexY; multidrug efflux pump K18095 M00643 Multidrug resistance, efflux pump MexXY-OprM 1,0 -oprM; outer membrane protein K18139 M00643 Multidrug resistance, efflux pump MexXY-OprM 1,0 -adeS; two-component system, OmpR family, sensor histidine kinase AdeS [EC:2.7.13.3] K18143 M00649 Multidrug resistance, efflux pump AdeABC 0,0 -adeR; two-component system, OmpR family, response regulator AdeR K18144 M00649 Multidrug resistance, efflux pump AdeABC 1,0 -adeA; membrane fusion protein K18145 M00649 Multidrug resistance, efflux pump AdeABC 2,0 -adeB; multidrug efflux pump K18146 M00649 Multidrug resistance, efflux pump AdeABC 2,0 -adeC; outer membrane protein K18147 M00649 Multidrug resistance, efflux pump AdeABC 2,0 -vanSB; two-component system, OmpR family, sensor histidine kinase VanS [EC:2.7.13.3] K18345 M00651 Vancomycin resistance, D-Ala-D-Lac type 0,0,0,0 -vanRB; two-component system, OmpR family, response regulator VanR K18344 M00651 Vancomycin resistance, D-Ala-D-Lac type 0,0,1,0 -vanY; D-alanyl-D-alanine carboxypeptidase [EC:3.4.16.4] K07260 M00651 Vancomycin resistance, D-Ala-D-Lac type 0,0,2,0 -vanW; vancomycin resistance protein VanW K18346 M00651 Vancomycin resistance, D-Ala-D-Lac type 0,0,3,0 -vanSAc; two-component system, OmpR family, sensor histidine kinase VanS [EC:2.7.13.3] K18351 M00651 Vancomycin resistance, D-Ala-D-Lac type 0,1,0,0 -vanRAc; two-component system, OmpR family, response regulator VanR K18352 M00651 Vancomycin resistance, D-Ala-D-Lac type 0,1,1,0 -vanK; vancomycin resistance protein VanK K18354 M00651 Vancomycin resistance, D-Ala-D-Lac type 0,1,2,0 -vanJ; vancomycin resistance protein VanJ K18353 M00651 Vancomycin resistance, D-Ala-D-Lac type 0,1,3,0 -vanH; D-specific alpha-keto acid dehydrogenase [EC:1.1.1.-] K18347 M00651 Vancomycin resistance, D-Ala-D-Lac type 1,0,0,0 -vanB; D-alanine---(R)-lactate ligase [EC:6.1.2.1] K15739 M00651 Vancomycin resistance, D-Ala-D-Lac type 1,0,1,0 -vanX; D-alanyl-D-alanine dipeptidase [EC:3.4.13.22] K08641 M00651 Vancomycin resistance, D-Ala-D-Lac type 1,0,2,0 -vanSE; two-component system, OmpR family, sensor histidine kinase VanS [EC:2.7.13.3] K18350 M00652 Vancomycin resistance, D-Ala-D-Ser type 0,0 -vanRE; two-component system, OmpR family, response regulator VanR K18349 M00652 Vancomycin resistance, D-Ala-D-Ser type 1,0 -vanT; serine/alanine racemase [EC:5.1.1.18 5.1.1.1] K18348 M00652 Vancomycin resistance, D-Ala-D-Ser type 2,0 -vanC; D-alanine---D-serine ligase [EC:6.3.2.35] K18856 M00652 Vancomycin resistance, D-Ala-D-Ser type 3,0 -vanXY; D-alanyl-D-alanine dipeptidase/carboxypeptidase [EC:3.4.13.22 3.4.16.4] K18866 M00652 Vancomycin resistance, D-Ala-D-Ser type 4,0 -yscJ; type III secretion protein SctJ K03222 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 -yscR; type III secretion protein SctR K03226 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 -yscS; type III secretion protein SctS K03227 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 -yscT; type III secretion protein SctT K03228 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 -yscU; type III secretion protein SctU K03229 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 -yscV; type III secretion protein SctV K03230 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 -yscN; ATP synthase in type III secretion protein SctN [EC:3.6.3.14] K03224 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 -yscQ; type III secretion protein SctQ K03225 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 -yscL; type III secretion protein SctL K03223 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 -hrpB2; type III secretion inner rod protein HrpB2 K18374 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 -hrpF; type III secretion translocon protein HrpF K18376 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 -hrpB1; type III secretion protein HrpB1 K18373 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 1,0 -hrpE; type III secretion hrp pilus HrpE K18375 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 2,0 -hpa2; lysozyme-related protein Hpa2 K18377 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 3,0 -hpa1; type III secretion harpin protein Hpa1 K18378 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 4,0 -K18379; type III secretion regulatory protein HpaA K18379 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 5,0 -K18380; type III secretion control protein HpaB K18380 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 6,0 -K18381; type III secretion control protein HpaP K18381 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 7,0 +nfxB; TetR/AcrR family transcriptional regulator, mexCD-oprJ operon repressor K18294 M00639 Multidrug resistance, efflux pump MexCD-OprJ 0,0 +mexC; membrane fusion protein K18295 M00639 Multidrug resistance, efflux pump MexCD-OprJ 1,0 +mexD; multidrug efflux pump K18296 M00639 Multidrug resistance, efflux pump MexCD-OprJ 1,0 +oprJ; multidrug resistance outer membrane protein OprJ K08721 M00639 Multidrug resistance, efflux pump MexCD-OprJ 1,0 +mexT; LysR family transcriptional regulator, mexEF-oprN operon transcriptional activator K18297 M00641 Multidrug resistance, efflux pump MexEF-OprN 0,0 +mexE; membrane fusion protein K18298 M00641 Multidrug resistance, efflux pump MexEF-OprN 1,0 +mexF; multidrug efflux pump K18299 M00641 Multidrug resistance, efflux pump MexEF-OprN 1,0 +oprN; outer membrane protein K18300 M00641 Multidrug resistance, efflux pump MexEF-OprN 1,0 +mexL; TetR/AcrR family transcriptional regulator, mexJK operon transcriptional repressor K18301 M00642 Multidrug resistance, efflux pump MexJK-OprM 0,0 +mexJ; membrane fusion protein K18302 M00642 Multidrug resistance, efflux pump MexJK-OprM 1,0 +mexK; multidrug efflux pump K18303 M00642 Multidrug resistance, efflux pump MexJK-OprM 1,0 +oprM; outer membrane protein K18139 M00642 Multidrug resistance, efflux pump MexJK-OprM 1,0 +mexZ; TetR/AcrR family transcriptional regulator, mexXY operon repressor K18129 M00643 Multidrug resistance, efflux pump MexXY-OprM 0,0 +mexX; membrane fusion protein K18094 M00643 Multidrug resistance, efflux pump MexXY-OprM 1,0 +mexY; multidrug efflux pump K18095 M00643 Multidrug resistance, efflux pump MexXY-OprM 1,0 +oprM; outer membrane protein K18139 M00643 Multidrug resistance, efflux pump MexXY-OprM 1,0 +adeS; two-component system, OmpR family, sensor histidine kinase AdeS [EC:2.7.13.3] K18143 M00649 Multidrug resistance, efflux pump AdeABC 0,0 +adeR; two-component system, OmpR family, response regulator AdeR K18144 M00649 Multidrug resistance, efflux pump AdeABC 1,0 +adeA; membrane fusion protein K18145 M00649 Multidrug resistance, efflux pump AdeABC 2,0 +adeB; multidrug efflux pump K18146 M00649 Multidrug resistance, efflux pump AdeABC 2,0 +adeC; outer membrane protein K18147 M00649 Multidrug resistance, efflux pump AdeABC 2,0 +vanSB; two-component system, OmpR family, sensor histidine kinase VanS [EC:2.7.13.3] K18345 M00651 Vancomycin resistance, D-Ala-D-Lac type 0,0,0,0 +vanRB; two-component system, OmpR family, response regulator VanR K18344 M00651 Vancomycin resistance, D-Ala-D-Lac type 0,0,1,0 +vanY; D-alanyl-D-alanine carboxypeptidase [EC:3.4.16.4] K07260 M00651 Vancomycin resistance, D-Ala-D-Lac type 0,0,2,0 +vanW; vancomycin resistance protein VanW K18346 M00651 Vancomycin resistance, D-Ala-D-Lac type 0,0,3,0 +vanSAc; two-component system, OmpR family, sensor histidine kinase VanS [EC:2.7.13.3] K18351 M00651 Vancomycin resistance, D-Ala-D-Lac type 0,1,0,0 +vanRAc; two-component system, OmpR family, response regulator VanR K18352 M00651 Vancomycin resistance, D-Ala-D-Lac type 0,1,1,0 +vanK; vancomycin resistance protein VanK K18354 M00651 Vancomycin resistance, D-Ala-D-Lac type 0,1,2,0 +vanJ; vancomycin resistance protein VanJ K18353 M00651 Vancomycin resistance, D-Ala-D-Lac type 0,1,3,0 +vanH; D-specific alpha-keto acid dehydrogenase [EC:1.1.1.-] K18347 M00651 Vancomycin resistance, D-Ala-D-Lac type 1,0,0,0 +vanB; D-alanine---(R)-lactate ligase [EC:6.1.2.1] K15739 M00651 Vancomycin resistance, D-Ala-D-Lac type 1,0,1,0 +vanX; D-alanyl-D-alanine dipeptidase [EC:3.4.13.22] K08641 M00651 Vancomycin resistance, D-Ala-D-Lac type 1,0,2,0 +vanSE; two-component system, OmpR family, sensor histidine kinase VanS [EC:2.7.13.3] K18350 M00652 Vancomycin resistance, D-Ala-D-Ser type 0,0 +vanRE; two-component system, OmpR family, response regulator VanR K18349 M00652 Vancomycin resistance, D-Ala-D-Ser type 1,0 +vanT; serine/alanine racemase [EC:5.1.1.18 5.1.1.1] K18348 M00652 Vancomycin resistance, D-Ala-D-Ser type 2,0 +vanC; D-alanine---D-serine ligase [EC:6.3.2.35] K18856 M00652 Vancomycin resistance, D-Ala-D-Ser type 3,0 +vanXY; D-alanyl-D-alanine dipeptidase/carboxypeptidase [EC:3.4.13.22 3.4.16.4] K18866 M00652 Vancomycin resistance, D-Ala-D-Ser type 4,0 +yscJ; type III secretion protein SctJ K03222 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 +yscR; type III secretion protein SctR K03226 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 +yscS; type III secretion protein SctS K03227 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 +yscT; type III secretion protein SctT K03228 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 +yscU; type III secretion protein SctU K03229 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 +yscV; type III secretion protein SctV K03230 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 +yscN; ATP synthase in type III secretion protein SctN [EC:3.6.3.14] K03224 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 +yscQ; type III secretion protein SctQ K03225 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 +yscL; type III secretion protein SctL K03223 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 +hrpB2; type III secretion inner rod protein HrpB2 K18374 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 +hrpF; type III secretion translocon protein HrpF K18376 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 0,0 +hrpB1; type III secretion protein HrpB1 K18373 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 1,0 +hrpE; type III secretion hrp pilus HrpE K18375 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 2,0 +hpa2; lysozyme-related protein Hpa2 K18377 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 3,0 +hpa1; type III secretion harpin protein Hpa1 K18378 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 4,0 +K18379; type III secretion regulatory protein HpaA K18379 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 5,0 +K18380; type III secretion control protein HpaB K18380 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 6,0 +K18381; type III secretion control protein HpaP K18381 M00660 Xanthomonas spp. pathogenicity signature, T3SS and effectors 7,0 geranylgeranyldiphosphate transferase [RN:R10349] K18385 M00661 Paspaline biosynthesis, geranylgeranyl-PP + indoleglycerol phosphate => paspaline 0,0 C20525 3-Geranylgeranylindole C00353,C03506 Geranylgeranyl diphosphate,Indoleglycerol phosphate FAD dependent monooxygenase [EC:1.14.13.-] [RN:R10350 R10351] K18386 M00661 Paspaline biosynthesis, geranylgeranyl-PP + indoleglycerol phosphate => paspaline 1,0 C20529 14,15-Epoxyemindole SB C20527 Emindole SB paspaline synthase [RN:R10352 R10353] K18387 M00661 Paspaline biosynthesis, geranylgeranyl-PP + indoleglycerol phosphate => paspaline 2,0 C20530 Paspaline C20529 14,15-Epoxyemindole SB -nodA; nodulation protein A [EC:2.3.1.-] K14658 M00664 Nodulation 0,0 -nodB; chitooligosaccharide deacetylase [EC:3.5.1.-] K14659 M00664 Nodulation 1,0 -nodC; N-acetylglucosaminyltransferase [EC:2.4.1.-] K14666 M00664 Nodulation 2,0 -nodD; LysR family transcriptional regulator, nod-box dependent transcriptional activator K14657 M00664 Nodulation 3,0 +nodA; nodulation protein A [EC:2.3.1.-] K14658 M00664 Nodulation 0,0 +nodB; chitooligosaccharide deacetylase [EC:3.5.1.-] K14659 M00664 Nodulation 1,0 +nodC; N-acetylglucosaminyltransferase [EC:2.4.1.-] K14666 M00664 Nodulation 2,0 +nodD; LysR family transcriptional regulator, nod-box dependent transcriptional activator K14657 M00664 Nodulation 3,0 N-(5-amino-5-carboxypentanoyl)-L-cysteinyl-D-valine synthase [EC:6.3.2.26] [RN:R04870] K12743 M00672 Penicillin biosynthesis, aminoadipate + cycteine + valine => penicillin 0,0 C05556 delta-(L-2-Aminoadipyl)-L-cysteinyl-D-valine C00956,C00183,C00097 L-2-Aminoadipate,L-Valine,L-Cysteine isopenicillin-N synthase [EC:1.21.3.1] [RN:R04872] K04126 M00672 Penicillin biosynthesis, aminoadipate + cycteine + valine => penicillin 1,0 C05557 Isopenicillin N C05556 delta-(L-2-Aminoadipyl)-L-cysteinyl-D-valine isopenicillin-N N-acyltransferase [EC:2.3.1.164] [RN:R06361] K10852 M00672 Penicillin biosynthesis, aminoadipate + cycteine + valine => penicillin 2,0 C00395 Penicillin C05557 Isopenicillin N @@ -2656,47 +2656,47 @@ proclavaminate amidinohydrolase [EC:3.5.3.22] [RN:R05357] K12676 M00674 Clavamin carboxymethylproline synthase [EC:2.3.1.226] [RN:R10485] K18317 M00675 Carbapenem-3-carboxylate biosynthesis, pyrroline-5-carboxylate + malonyl-CoA => carbapenem-3-carboxylate 0,0 C17366 (2S,5S)-trans-Carboxymethylproline C03912,C00083 (S)-1-Pyrroline-5-carboxylate,Malonyl-CoA carbapenam-3-carboxylate synthase [EC:6.3.3.6] [RN:R10556] K18316 M00675 Carbapenem-3-carboxylate biosynthesis, pyrroline-5-carboxylate + malonyl-CoA => carbapenem-3-carboxylate 1,0 C17367 (3S,5S)-Carbapenam-3-carboxylic acid C17366 (2S,5S)-trans-Carboxymethylproline (5R)-carbapenem-3-carboxylate synthase [EC:1.14.20.3] [RN:R10415] K18315 M00675 Carbapenem-3-carboxylate biosynthesis, pyrroline-5-carboxylate + malonyl-CoA => carbapenem-3-carboxylate 2,0 C06669 (5R)-Carbapen-2-em-3-carboxylate C17367 (3S,5S)-Carbapenam-3-carboxylic acid -envR, acrS; TetR/AcrR family transcriptional regulator, acrEF/envCD operon repressor [COG:COG1309] K18140 M00696 Multidrug resistance, efflux pump AcrEF-TolC 0,0 -acrE; membrane fusion protein [COG:COG0845] [TC:2.A.6.2] K18141 M00696 Multidrug resistance, efflux pump AcrEF-TolC 1,0 -acrF; multidrug efflux pump [COG:COG0841] [TC:2.A.6.2] K18142 M00696 Multidrug resistance, efflux pump AcrEF-TolC 1,0 -tolC; outer membrane channel protein [COG:COG1538] [TC:1.B.17 2.A.6.2] K12340 M00696 Multidrug resistance, efflux pump AcrEF-TolC 1,0 -evgA, bvgA; two-component system, NarL family, response regulator EvgA [COG:COG2197] [GO:0000156] K07690 M00697 Multidrug resistance, efflux pump MdtEF-TolC 0,0 -mdtE; membrane fusion protein [COG:COG0845] [TC:8.A.1.6.3 2.A.6.2] K18898 M00697 Multidrug resistance, efflux pump MdtEF-TolC 1,0 -mdtF; multidrug efflux pump [COG:COG0841] [TC:2.A.6.2.13] K18899 M00697 Multidrug resistance, efflux pump MdtEF-TolC 1,0 -tolC; outer membrane channel protein [COG:COG1538] [TC:1.B.17 2.A.6.2] K12340 M00697 Multidrug resistance, efflux pump MdtEF-TolC 1,0 -bpeT; LysR family transcriptional regulator, regulator for bpeEF and oprC [COG:COG0583] K18900 M00698 Multidrug resistance, efflux pump BpeEF-OprC 0,0 -bpeE; membrane fusion protein [COG:COG0845] [TC:8.A.1 2.A.6.2] K18901 M00698 Multidrug resistance, efflux pump BpeEF-OprC 1,0 -bpeF; multidrug efflux pump [COG:COG0841] [TC:2.A.6.2] K18902 M00698 Multidrug resistance, efflux pump BpeEF-OprC 1,0 -oprC, opcM; outer membrane protein [COG:COG1538] [TC:1.B.17.3.3] K18903 M00698 Multidrug resistance, efflux pump BpeEF-OprC 1,0 -mgrA; MarR family transcriptional regulator, multiple gene regulator MgrA [COG:COG1846] K18906 M00700 Multidrug resistance, efflux pump AbcA 0,0 -norG; GntR family transcriptional regulator, regulator for abcA and norABC [COG:COG1167] K18907 M00700 Multidrug resistance, efflux pump AbcA 0,1 -abcA, bmrA; ATP-binding cassette, subfamily B, bacterial AbcA/BmrA [EC:3.6.3.44] [COG:COG1132] [GO:0008559] [TC:3.A.1.117 3.A.1.123] K18104 M00700 Multidrug resistance, efflux pump AbcA 1,0 -mgrA; MarR family transcriptional regulator, multiple gene regulator MgrA [COG:COG1846] K18906 M00702 Multidrug resistance, efflux pump NorB 0,0 -norG; GntR family transcriptional regulator, regulator for abcA and norABC [COG:COG1167] K18907 M00702 Multidrug resistance, efflux pump NorB 0,1 -BLTL; MFS transporter, DHA2 family, multidrug resistance protein [COG:COG0477] [TC:2.A.1.3] K08170 M00702 Multidrug resistance, efflux pump NorB 1,0 -mgrA; MarR family transcriptional regulator, multiple gene regulator MgrA [COG:COG1846] K18906 M00704 Tetracycline resistance, efflux pump Tet38 0,0 -tetB; MFS transporter, DHA2 family, metal-tetracycline-proton antiporter [COG:COG0477] [TC:2.A.1.3] K08168 M00704 Tetracycline resistance, efflux pump Tet38 1,0 -mepR; MarR family transcriptional regulator, repressor for mepA [COG:COG1846] K18909 M00705 Multidrug resistance, efflux pump MepA 0,0 -mepA; multidrug efflux pump [COG:COG0534] [TC:2.A.66.1.13] K18908 M00705 Multidrug resistance, efflux pump MepA 1,0 -qacR; TetR/AcrR family transcriptional regulator, repressor for qacA K18938 M00714 Multidrug resistance, efflux pump QacA 0,0 -smvA; MFS transporter, DHA2 family, multidrug resistance protein K08167 M00714 Multidrug resistance, efflux pump QacA 1,0 -mexR; MarR family transcriptional regulator, repressor of the mexAB-oprM multidrug resistance operon K18131 M00718 Multidrug resistance, efflux pump MexAB-OprM 0,0 -acrA; membrane fusion protein, multidrug efflux system K03585 M00718 Multidrug resistance, efflux pump MexAB-OprM 1,0 -acrB; multidrug efflux pump K18138 M00718 Multidrug resistance, efflux pump MexAB-OprM 1,0 -oprM; outer membrane protein, multidrug efflux system K18139 M00718 Multidrug resistance, efflux pump MexAB-OprM 1,0 -graS; two-component system, OmpR family, sensor histidine kinase GraS [EC:2.7.13.3] [COG:COG0642] [GO:0000155] K19077 M00725 Cationic antimicrobial peptide (CAMP) resistance, dltABCD operon 0,0 -graR; two-component system, OmpR family, response regulator protein GraR [COG:COG0745] [GO:0000156] K19078 M00725 Cationic antimicrobial peptide (CAMP) resistance, dltABCD operon 1,0 -dltA; D-alanine--poly(phosphoribitol) ligase subunit 1 [EC:6.1.1.13] [COG:COG1020] [GO:0047473] K03367 M00725 Cationic antimicrobial peptide (CAMP) resistance, dltABCD operon 2,0 -dltB; membrane protein involved in D-alanine export [COG:COG1696] K03739 M00725 Cationic antimicrobial peptide (CAMP) resistance, dltABCD operon 2,0 -dltC; D-alanine--poly(phosphoribitol) ligase subunit 2 [EC:6.1.1.13] [COG:COG0236] [GO:0047473] K14188 M00725 Cationic antimicrobial peptide (CAMP) resistance, dltABCD operon 2,0 -dltD; D-alanine transfer protein [COG:COG3966] K03740 M00725 Cationic antimicrobial peptide (CAMP) resistance, dltABCD operon 2,0 -graS; two-component system, OmpR family, sensor histidine kinase GraS [EC:2.7.13.3] [COG:COG0642] [GO:0000155] K19077 M00726 Cationic antimicrobial peptide (CAMP) resistance, lysyl-phosphatidylglycerol (L-PG) synthase MprF 0,0 -graR; two-component system, OmpR family, response regulator protein GraR [COG:COG0745] [GO:0000156] K19078 M00726 Cationic antimicrobial peptide (CAMP) resistance, lysyl-phosphatidylglycerol (L-PG) synthase MprF 1,0 -mprF, fmtC; phosphatidylglycerol lysyltransferase [EC:2.3.2.3] [COG:COG0392 COG2898] [GO:0050071] [TC:2 K14205 M00726 Cationic antimicrobial peptide (CAMP) resistance, lysyl-phosphatidylglycerol (L-PG) synthase MprF 2,0 -graS; two-component system, OmpR family, sensor histidine kinase GraS [EC:2.7.13.3] [COG:COG0642] [GO:0000155] K19077 M00730 Cationic antimicrobial peptide (CAMP) resistance, VraFG transporter 0,0 -graR; two-component system, OmpR family, response regulator protein GraR [COG:COG0745] [GO:0000156] K19078 M00730 Cationic antimicrobial peptide (CAMP) resistance, VraFG transporter 1,0 -vraF; cationic antimicrobial peptide transport system ATP-binding protein [COG:COG1136] [TC:3.A.1.134.7] K19079 M00730 Cationic antimicrobial peptide (CAMP) resistance, VraFG transporter 2,0 -vraG; cationic antimicrobial peptide transport system permease protein [COG:COG0577] [TC:3.A.1.134.7] K19080 M00730 Cationic antimicrobial peptide (CAMP) resistance, VraFG transporter 2,0 +envR, acrS; TetR/AcrR family transcriptional regulator, acrEF/envCD operon repressor [COG:COG1309] K18140 M00696 Multidrug resistance, efflux pump AcrEF-TolC 0,0 +acrE; membrane fusion protein [COG:COG0845] [TC:2.A.6.2] K18141 M00696 Multidrug resistance, efflux pump AcrEF-TolC 1,0 +acrF; multidrug efflux pump [COG:COG0841] [TC:2.A.6.2] K18142 M00696 Multidrug resistance, efflux pump AcrEF-TolC 1,0 +tolC; outer membrane channel protein [COG:COG1538] [TC:1.B.17 2.A.6.2] K12340 M00696 Multidrug resistance, efflux pump AcrEF-TolC 1,0 +evgA, bvgA; two-component system, NarL family, response regulator EvgA [COG:COG2197] [GO:0000156] K07690 M00697 Multidrug resistance, efflux pump MdtEF-TolC 0,0 +mdtE; membrane fusion protein [COG:COG0845] [TC:8.A.1.6.3 2.A.6.2] K18898 M00697 Multidrug resistance, efflux pump MdtEF-TolC 1,0 +mdtF; multidrug efflux pump [COG:COG0841] [TC:2.A.6.2.13] K18899 M00697 Multidrug resistance, efflux pump MdtEF-TolC 1,0 +tolC; outer membrane channel protein [COG:COG1538] [TC:1.B.17 2.A.6.2] K12340 M00697 Multidrug resistance, efflux pump MdtEF-TolC 1,0 +bpeT; LysR family transcriptional regulator, regulator for bpeEF and oprC [COG:COG0583] K18900 M00698 Multidrug resistance, efflux pump BpeEF-OprC 0,0 +bpeE; membrane fusion protein [COG:COG0845] [TC:8.A.1 2.A.6.2] K18901 M00698 Multidrug resistance, efflux pump BpeEF-OprC 1,0 +bpeF; multidrug efflux pump [COG:COG0841] [TC:2.A.6.2] K18902 M00698 Multidrug resistance, efflux pump BpeEF-OprC 1,0 +oprC, opcM; outer membrane protein [COG:COG1538] [TC:1.B.17.3.3] K18903 M00698 Multidrug resistance, efflux pump BpeEF-OprC 1,0 +mgrA; MarR family transcriptional regulator, multiple gene regulator MgrA [COG:COG1846] K18906 M00700 Multidrug resistance, efflux pump AbcA 0,0 +norG; GntR family transcriptional regulator, regulator for abcA and norABC [COG:COG1167] K18907 M00700 Multidrug resistance, efflux pump AbcA 0,1 +abcA, bmrA; ATP-binding cassette, subfamily B, bacterial AbcA/BmrA [EC:3.6.3.44] [COG:COG1132] [GO:0008559] [TC:3.A.1.117 3.A.1.123] K18104 M00700 Multidrug resistance, efflux pump AbcA 1,0 +mgrA; MarR family transcriptional regulator, multiple gene regulator MgrA [COG:COG1846] K18906 M00702 Multidrug resistance, efflux pump NorB 0,0 +norG; GntR family transcriptional regulator, regulator for abcA and norABC [COG:COG1167] K18907 M00702 Multidrug resistance, efflux pump NorB 0,1 +BLTL; MFS transporter, DHA2 family, multidrug resistance protein [COG:COG0477] [TC:2.A.1.3] K08170 M00702 Multidrug resistance, efflux pump NorB 1,0 +mgrA; MarR family transcriptional regulator, multiple gene regulator MgrA [COG:COG1846] K18906 M00704 Tetracycline resistance, efflux pump Tet38 0,0 +tetB; MFS transporter, DHA2 family, metal-tetracycline-proton antiporter [COG:COG0477] [TC:2.A.1.3] K08168 M00704 Tetracycline resistance, efflux pump Tet38 1,0 +mepR; MarR family transcriptional regulator, repressor for mepA [COG:COG1846] K18909 M00705 Multidrug resistance, efflux pump MepA 0,0 +mepA; multidrug efflux pump [COG:COG0534] [TC:2.A.66.1.13] K18908 M00705 Multidrug resistance, efflux pump MepA 1,0 +qacR; TetR/AcrR family transcriptional regulator, repressor for qacA K18938 M00714 Multidrug resistance, efflux pump QacA 0,0 +smvA; MFS transporter, DHA2 family, multidrug resistance protein K08167 M00714 Multidrug resistance, efflux pump QacA 1,0 +mexR; MarR family transcriptional regulator, repressor of the mexAB-oprM multidrug resistance operon K18131 M00718 Multidrug resistance, efflux pump MexAB-OprM 0,0 +acrA; membrane fusion protein, multidrug efflux system K03585 M00718 Multidrug resistance, efflux pump MexAB-OprM 1,0 +acrB; multidrug efflux pump K18138 M00718 Multidrug resistance, efflux pump MexAB-OprM 1,0 +oprM; outer membrane protein, multidrug efflux system K18139 M00718 Multidrug resistance, efflux pump MexAB-OprM 1,0 +graS; two-component system, OmpR family, sensor histidine kinase GraS [EC:2.7.13.3] [COG:COG0642] [GO:0000155] K19077 M00725 Cationic antimicrobial peptide (CAMP) resistance, dltABCD operon 0,0 +graR; two-component system, OmpR family, response regulator protein GraR [COG:COG0745] [GO:0000156] K19078 M00725 Cationic antimicrobial peptide (CAMP) resistance, dltABCD operon 1,0 +dltA; D-alanine--poly(phosphoribitol) ligase subunit 1 [EC:6.1.1.13] [COG:COG1020] [GO:0047473] K03367 M00725 Cationic antimicrobial peptide (CAMP) resistance, dltABCD operon 2,0 +dltB; membrane protein involved in D-alanine export [COG:COG1696] K03739 M00725 Cationic antimicrobial peptide (CAMP) resistance, dltABCD operon 2,0 +dltC; D-alanine--poly(phosphoribitol) ligase subunit 2 [EC:6.1.1.13] [COG:COG0236] [GO:0047473] K14188 M00725 Cationic antimicrobial peptide (CAMP) resistance, dltABCD operon 2,0 +dltD; D-alanine transfer protein [COG:COG3966] K03740 M00725 Cationic antimicrobial peptide (CAMP) resistance, dltABCD operon 2,0 +graS; two-component system, OmpR family, sensor histidine kinase GraS [EC:2.7.13.3] [COG:COG0642] [GO:0000155] K19077 M00726 Cationic antimicrobial peptide (CAMP) resistance, lysyl-phosphatidylglycerol (L-PG) synthase MprF 0,0 +graR; two-component system, OmpR family, response regulator protein GraR [COG:COG0745] [GO:0000156] K19078 M00726 Cationic antimicrobial peptide (CAMP) resistance, lysyl-phosphatidylglycerol (L-PG) synthase MprF 1,0 +mprF, fmtC; phosphatidylglycerol lysyltransferase [EC:2.3.2.3] [COG:COG0392 COG2898] [GO:0050071] [TC:2 K14205 M00726 Cationic antimicrobial peptide (CAMP) resistance, lysyl-phosphatidylglycerol (L-PG) synthase MprF 2,0 +graS; two-component system, OmpR family, sensor histidine kinase GraS [EC:2.7.13.3] [COG:COG0642] [GO:0000155] K19077 M00730 Cationic antimicrobial peptide (CAMP) resistance, VraFG transporter 0,0 +graR; two-component system, OmpR family, response regulator protein GraR [COG:COG0745] [GO:0000156] K19078 M00730 Cationic antimicrobial peptide (CAMP) resistance, VraFG transporter 1,0 +vraF; cationic antimicrobial peptide transport system ATP-binding protein [COG:COG1136] [TC:3.A.1.134.7] K19079 M00730 Cationic antimicrobial peptide (CAMP) resistance, VraFG transporter 2,0 +vraG; cationic antimicrobial peptide transport system permease protein [COG:COG0577] [TC:3.A.1.134.7] K19080 M00730 Cationic antimicrobial peptide (CAMP) resistance, VraFG transporter 2,0 nocardicin nonribosomal peptide synthetase [RN:R10880] K19102 M00736 Nocardicin A biosynthesis, L-pHPG + arginine + serine => nocardicin A 0,0 C17355 Nocardicin G C12323,C00062,C00065 L-4-Hydroxyphenylglycine,L-Arginine,L-Serine nocardicin nonribosomal peptide synthetase [RN:R10880] K19103 M00736 Nocardicin A biosynthesis, L-pHPG + arginine + serine => nocardicin A 0,0 C17355 Nocardicin G C12323,C00062,C00065 L-4-Hydroxyphenylglycine,L-Arginine,L-Serine MbtH protein [RN:R10880] K05375 M00736 Nocardicin A biosynthesis, L-pHPG + arginine + serine => nocardicin A 0,0 C17355 Nocardicin G C12323,C00062,C00065 L-4-Hydroxyphenylglycine,L-Arginine,L-Serine @@ -2728,18 +2728,18 @@ methylmalonyl-CoA/ethylmalonyl-CoA epimerase [EC:5.1.99.1] [RN:R02765] K05606 M0 methylmalonyl-CoA mutase [EC:5.4.99.2] [RN:R00833] K01847 M00741 Propanoyl-CoA metabolism, propanoyl-CoA => succinyl-CoA 2,0 C00091 Succinyl-CoA C01213 (R)-Methylmalonyl-CoA methylmalonyl-CoA mutase [EC:5.4.99.2] [RN:R00833] K01848 M00741 Propanoyl-CoA metabolism, propanoyl-CoA => succinyl-CoA 2,1 C00091 Succinyl-CoA C01213 (R)-Methylmalonyl-CoA methylmalonyl-CoA mutase [EC:5.4.99.2] [RN:R00833] K01849 M00741 Propanoyl-CoA metabolism, propanoyl-CoA => succinyl-CoA 2,1 C00091 Succinyl-CoA C01213 (R)-Methylmalonyl-CoA -phoQ; two-component system, OmpR family, sensor histidine kinase PhoQ [EC:2.7.13.3] [COG:COG0642] [GO:0000155] K07637 M00744 Cationic antimicrobial peptide (CAMP) resistance, protease PgtE 0,0 -phoP; two-component system, OmpR family, response regulator PhoP [COG:COG0745] [GO:0000156] K07660 M00744 Cationic antimicrobial peptide (CAMP) resistance, protease PgtE 1,0 -pgtE; outer membrane protease E [EC:3.4.21.-] [COG:COG4571] K08477 M00744 Cationic antimicrobial peptide (CAMP) resistance, protease PgtE 2,0 -parS; two-component system, OmpR family, sensor kinase ParS [EC:2.7.13.3] [COG:COG0642] [GO:0000155] K18072 M00745 Imipenem resistance, repression of porin OprD 0,0,0,0 -parR; two-component system, OmpR family, response regulator ParR [COG:COG0745] [GO:0000156] K18073 M00745 Imipenem resistance, repression of porin OprD 0,0,1,0 -cusS, copS, silS; two-component system, OmpR family, heavy metal sensor histidine kinase CusS [EC:2.7.13.3] [COG:COG0642] [GO:0000155] K07644 M00745 Imipenem resistance, repression of porin OprD 0,1,0,0 -cusR, copR, silR; two-component system, OmpR family, copper resistance phosphate regulon response regulator CusR [COG:COG0745] [GO:0000156] K07665 M00745 Imipenem resistance, repression of porin OprD 0,1,1,0 -mexT; LysR family transcriptional regulator, mexEF-oprN operon transcriptional activator [COG:COG0583] K18297 M00745 Imipenem resistance, repression of porin OprD 0,2 -oprD; imipenem/basic amino acid-specific outer membrane pore [EC:3.4.21.-] [TC:1.B.25.1.1] K18093 M00745 Imipenem resistance, repression of porin OprD 1,0 -marA; AraC family transcriptional regulator, mar-sox-rob regulon activator [COG:COG2207] K13632 M00746 Multidrug resistance, repression of porin OmpF 0,0 -micF; small regulatory RNA MicF K18513 M00746 Multidrug resistance, repression of porin OmpF 1,0 -ompF; outer membrane pore protein F [COG:COG3203] [TC:1.B.1.1.1] K09476 M00746 Multidrug resistance, repression of porin OmpF 2,0 +phoQ; two-component system, OmpR family, sensor histidine kinase PhoQ [EC:2.7.13.3] [COG:COG0642] [GO:0000155] K07637 M00744 Cationic antimicrobial peptide (CAMP) resistance, protease PgtE 0,0 +phoP; two-component system, OmpR family, response regulator PhoP [COG:COG0745] [GO:0000156] K07660 M00744 Cationic antimicrobial peptide (CAMP) resistance, protease PgtE 1,0 +pgtE; outer membrane protease E [EC:3.4.21.-] [COG:COG4571] K08477 M00744 Cationic antimicrobial peptide (CAMP) resistance, protease PgtE 2,0 +parS; two-component system, OmpR family, sensor kinase ParS [EC:2.7.13.3] [COG:COG0642] [GO:0000155] K18072 M00745 Imipenem resistance, repression of porin OprD 0,0,0,0 +parR; two-component system, OmpR family, response regulator ParR [COG:COG0745] [GO:0000156] K18073 M00745 Imipenem resistance, repression of porin OprD 0,0,1,0 +cusS, copS, silS; two-component system, OmpR family, heavy metal sensor histidine kinase CusS [EC:2.7.13.3] [COG:COG0642] [GO:0000155] K07644 M00745 Imipenem resistance, repression of porin OprD 0,1,0,0 +cusR, copR, silR; two-component system, OmpR family, copper resistance phosphate regulon response regulator CusR [COG:COG0745] [GO:0000156] K07665 M00745 Imipenem resistance, repression of porin OprD 0,1,1,0 +mexT; LysR family transcriptional regulator, mexEF-oprN operon transcriptional activator [COG:COG0583] K18297 M00745 Imipenem resistance, repression of porin OprD 0,2 +oprD; imipenem/basic amino acid-specific outer membrane pore [EC:3.4.21.-] [TC:1.B.25.1.1] K18093 M00745 Imipenem resistance, repression of porin OprD 1,0 +marA; AraC family transcriptional regulator, mar-sox-rob regulon activator [COG:COG2207] K13632 M00746 Multidrug resistance, repression of porin OmpF 0,0 +micF; small regulatory RNA MicF K18513 M00746 Multidrug resistance, repression of porin OmpF 1,0 +ompF; outer membrane pore protein F [COG:COG3203] [TC:1.B.1.1.1] K09476 M00746 Multidrug resistance, repression of porin OmpF 2,0 UDP-4-amino-4-deoxy-L-arabinose formyltransferase / UDP-glucuronic acid dehydrogenase (UDP-4-keto-hexauronic acid decarboxylating) [EC:2.1.2.13 1.1.1.305] [RN:R07658 R07660] K10011 M00761 Undecaprenylphosphate alpha-L-Ara4N biosynthesis, UDP-GlcA => undecaprenyl phosphate alpha-L-Ara4N 0,0 C16154 UDP-L-Ara4FN C16153 UDP-L-Ara4N UDP-4-amino-4-deoxy-L-arabinose-oxoglutarate aminotransferase [EC:2.6.1.87] [RN:R07659] K07806 M00761 Undecaprenylphosphate alpha-L-Ara4N biosynthesis, UDP-GlcA => undecaprenyl phosphate alpha-L-Ara4N 1,0 C16153 UDP-L-Ara4N C16155 UDP-L-Ara4O undecaprenyl-phosphate 4-deoxy-4-formamido-L-arabinose transferase [EC:2.4.2.53] [RN:R07661] K10012 M00761 Undecaprenylphosphate alpha-L-Ara4N biosynthesis, UDP-GlcA => undecaprenyl phosphate alpha-L-Ara4N 2,0 C16156 Undecaprenyl phosphate alpha-L-Ara4FN C16154 UDP-L-Ara4FN @@ -2749,11 +2749,11 @@ LysW-L-glutamate kinase [EC:2.7.2.-] [RN:R10930] K05828 M00763 Ornithine biosynt LysW-L-glutamyl-5-phosphate reductase [EC:1.2.1.-] [RN:R10931] K05829 M00763 Ornithine biosynthesis, mediated by LysW, glutamate => ornithine 2,0 C20950 LysW-L-glutamate 5-semialdehyde C20949 LysW-L-glutamyl 5-phosphate LysW-L-ornithine aminotransferase [EC:2.6.1.-] [RN:R10932] K05830 M00763 Ornithine biosynthesis, mediated by LysW, glutamate => ornithine 3,0 C20951 LysW-L-ornithine C20950 LysW-L-glutamate 5-semialdehyde LysW-L-ornithine carboxypeptidase [RN:R10933] K05831 M00763 Ornithine biosynthesis, mediated by LysW, glutamate => ornithine 4,0 C00077 L-Ornithine C20951 LysW-L-ornithine -lasR; LuxR family transcriptional regulator, quorum-sensing transcription factor LasR K18304 M00769 Multidrug resistance, efflux pump MexPQ-OpmE 0,0 -cueR; MerR family transcriptional regulator, copper efflux regulator K19591 M00769 Multidrug resistance, efflux pump MexPQ-OpmE 1,0 -gesA; membrane fusion protein, gold/copper resistance efflux system K19595 M00769 Multidrug resistance, efflux pump MexPQ-OpmE 2,0 -gesB; gold/copper resistance efflux pump K19594 M00769 Multidrug resistance, efflux pump MexPQ-OpmE 2,0 -opmE; outer membrane protein, multidrug efflux system K19593 M00769 Multidrug resistance, efflux pump MexPQ-OpmE 2,0 +lasR; LuxR family transcriptional regulator, quorum-sensing transcription factor LasR K18304 M00769 Multidrug resistance, efflux pump MexPQ-OpmE 0,0 +cueR; MerR family transcriptional regulator, copper efflux regulator K19591 M00769 Multidrug resistance, efflux pump MexPQ-OpmE 1,0 +gesA; membrane fusion protein, gold/copper resistance efflux system K19595 M00769 Multidrug resistance, efflux pump MexPQ-OpmE 2,0 +gesB; gold/copper resistance efflux pump K19594 M00769 Multidrug resistance, efflux pump MexPQ-OpmE 2,0 +opmE; outer membrane protein, multidrug efflux system K19593 M00769 Multidrug resistance, efflux pump MexPQ-OpmE 2,0 tylG; tylactone synthase [RN:R06448] K15988 M00773 Tylosin biosynthesis, methylmalonyl-CoA + malonyl-CoA => tylactone => tylosin 0,0 C12000 Tylactone C02557,C00083 Methylmalonyl-CoA,Malonyl-CoA tylMII; tylactone mycaminosyltransferase [EC:2.4.1.316] [RN:R06450] K15989 M00773 Tylosin biosynthesis, methylmalonyl-CoA + malonyl-CoA => tylactone => tylosin 1,0 C12001 5-O-beta-D-Mycaminosyltylactone C12000 Tylactone tylMIII; tylactone mycaminosyltransferase auxiliary protein [RN:R06450] K15990 M00773 Tylosin biosynthesis, methylmalonyl-CoA + malonyl-CoA => tylactone => tylosin 1,0 C12001 5-O-beta-D-Mycaminosyltylactone C12000 Tylactone @@ -2873,7 +2873,7 @@ dTDP-glucose 4,6-dehydratase [EC:4.2.1.46] [RN:R06513] K01710 M00793 dTDP-L-rham dTDP-4-dehydrorhamnose 3,5-epimerase [EC:5.1.3.13] [RN:R06514] K01790 M00793 dTDP-L-rhamnose biosynthesis 2,0 C00688 dTDP-4-dehydro-beta-L-rhamnose C11907 dTDP-4-oxo-6-deoxy-D-glucose dTDP-4-dehydrorhamnose reductase [EC:1.1.1.133] [RN:R02777] K00067 M00793 dTDP-L-rhamnose biosynthesis 3,0 C03319 dTDP-L-rhamnose C00688 dTDP-4-dehydro-beta-L-rhamnose tylJ; dTDP-4-dehydro-6-deoxy-D-glucose 3-epimerase [EC:5.1.3.27] [RN:R06437] K13312 M00794 dTDP-6-deoxy-D-allose biosynthesis 0,0 C11926 dTDP-4-oxo-6-deoxy-D-allose C11907 dTDP-4-oxo-6-deoxy-D-glucose -tylD; dTDP-4-dehydro-6-deoxy-alpha-D-gulose 4-ketoreductase [EC:1.1.1.364] [RN:R06438,R10573] K13313 M00794 dTDP-6-deoxy-D-allose biosynthesis 1,0 +tylD; dTDP-4-dehydro-6-deoxy-alpha-D-gulose 4-ketoreductase [EC:1.1.1.364] [RN:R06438,R10573] K13313 M00794 dTDP-6-deoxy-D-allose biosynthesis 1,0 novW; dTDP-4-dehydro-6-deoxy-D-glucose 3-epimerase [EC:5.1.3.27] [RN:R06437] K19855 M00795 dTDP-beta-L-noviose biosynthesis 0,0 C11926 dTDP-4-oxo-6-deoxy-D-allose C11907 dTDP-4-oxo-6-deoxy-D-glucose novU; C-methyltransferase [EC:2.1.1.-] [RN:R11020] K12710 M00795 dTDP-beta-L-noviose biosynthesis 1,0 C11460 dTDP-4-oxo-5-C-methyl-L-rhamnose C11926 dTDP-4-oxo-6-deoxy-D-allose novS; dTDP-4-keto-6-deoxyhexose reductase [EC:1.1.1.-] [RN:R10459] K17625 M00795 dTDP-beta-L-noviose biosynthesis 2,0 C12481 dTDP-5-dimethyl-L-lyxose C11460 dTDP-4-oxo-5-C-methyl-L-rhamnose @@ -2967,7 +2967,7 @@ valK; 5-epi-valiolone dehydratase [EC:4.2.1.-] [RN:R11233] K20432 M00815 Validam valC; C7-cyclitol kinase [EC:2.7.1.-] [RN:R11234] K20433 M00815 Validamycin A biosynthesis, sedoheptulopyranose-7P => validamycin A 3,0 C17697 Valienone 7-phosphate C17696 Valienone valN; cyclitol reductase [RN:R11236] K20434 M00815 Validamycin A biosynthesis, sedoheptulopyranose-7P => validamycin A 4,0 C21218 Validone 7-phosphate C17697 Valienone 7-phosphate valM; validone 7-phosphate aminotransferase [EC2.6.1.-] [RN:R11238] K20435 M00815 Validamycin A biosynthesis, sedoheptulopyranose-7P => validamycin A 5,0 C21216 Validamine 7-phosphate C21218 Validone 7-phosphate -valL; validoxylamine A 7'-phosphate synthase [EC:2.4.1.-] [RN:R11497] K20436 M00815 Validamycin A biosynthesis, sedoheptulopyranose-7P => validamycin A 6,0 C21219 Validoxylamine A 7'-phosphate C21368, C21216 +valL; validoxylamine A 7'-phosphate synthase [EC:2.4.1.-] [RN:R11497] K20436 M00815 Validamycin A biosynthesis, sedoheptulopyranose-7P => validamycin A 6,0 C21219 Validoxylamine A 7'-phosphate C21368, C21216 vldH; validoxylamine A 7'-phosphate phosphatase [EC:3.1.3.101] [RN:R11240] K20437 M00815 Validamycin A biosynthesis, sedoheptulopyranose-7P => validamycin A 7,0 C17700 Validoxylamine A C21219 Validoxylamine A 7'-phosphate valG; validoxylamine A glucosyltransferase [EC:2.4.1.338] [RN:R11241] K20438 M00815 Validamycin A biosynthesis, sedoheptulopyranose-7P => validamycin A 8,0 C12112 Validamycin A C17700 Validoxylamine A pentalenene synthase [EC:4.2.3.7] [RN:R02305] K12250 M00819 Pentalenolactone biosynthesis, farnesyl-PP => pentalenolactone 0,0 C01841 Pentalenene C00448 trans,trans-Farnesyl diphosphate @@ -2985,24 +2985,24 @@ oxyT, ctcO, cts6; 4-amino-anhydrotetracycline N4-methyltransferase [EC:2.1.1.335 oxyS, cts8; anhydrotetracycline 6-monooxygenase / 5a,11a-dehydrotetracycline 5-monooxygenase [EC:1.14.13.38 1.14.13.234] [RN:R04060 R09198] K14256 M00823 Chlortetracycline biosynthesis, pretetramide => chlortetracycline 5,0 C03206 5a,11a-Dehydrotetracycline C02811 Anhydrotetracycline oxyR; 5a,11a-dehydrotetracycline reductase [EC:1.3.98.4] [RN:R09192 R05459] K21301 M00823 Chlortetracycline biosynthesis, pretetramide => chlortetracycline 6,0 C06570 Tetracycline C03206 5a,11a-Dehydrotetracycline ctcP; tetracycline 7-halogenase [EC:1.14.19.49] [RN:R11478] K14257 M00823 Chlortetracycline biosynthesis, pretetramide => chlortetracycline 7,0 C06571 Chlortetracycline C06570 Tetracycline -ctcQ; flavin reductase (NADH) [EC:1.5.1.36] K21297 M00823 Chlortetracycline biosynthesis, pretetramide => chlortetracycline 7,0 -sgcE; enediyne polyketide synthase [RN:R11435] K15314 M00824 9-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 9-membered enediyne core 0,0 -sgcE2; enediyne biosynthesis protein E2 K21160 M00824 9-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 9-membered enediyne core 1,0 -sgcE3; enediyne biosynthesis protein E3 K21161 M00824 9-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 9-membered enediyne core 1,0 -sgcE4; enediyne biosynthesis protein E4 K21162 M00824 9-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 9-membered enediyne core 1,0 -sgcE5; enediyne biosynthesis protein E5 K21163 M00824 9-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 9-membered enediyne core 1,0 -sgcE7; enediyne biosynthesis protein E7 K21164 M00824 9-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 9-membered enediyne core 1,0 -sgcE8; enediyne biosynthesis protein E8 K21165 M00824 9-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 9-membered enediyne core 1,0 -sgcE9; enediyne biosynthesis protein E9 K21166 M00824 9-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 9-membered enediyne core 1,0 -sgcE11; enediyne biosynthesis protein E11 K21167 M00824 9-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 9-membered enediyne core 1,0 -sgcE; enediyne polyketide synthase [RN:R11435] K15314 M00825 10-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 10-membered enediyne core 0,0 -calE1; enediyne biosynthesis protein CalE1 K21168 M00825 10-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 10-membered enediyne core 1,0 -calE2; enediyne biosynthesis protein CalE2 K21169 M00825 10-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 10-membered enediyne core 1,0 -calE3; enediyne biosynthesis protein CalE3 K21170 M00825 10-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 10-membered enediyne core 1,0 -calE4; enediyne biosynthesis protein CalE4 K21171 M00825 10-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 10-membered enediyne core 1,0 -calE5; enediyne biosynthesis protein CalE5 K21172 M00825 10-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 10-membered enediyne core 1,0 -calE6; methionine gamma-lyase K21173 M00825 10-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 10-membered enediyne core 1,0 -calE9; enediyne biosynthesis protein CalE9 K21174 M00825 10-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 10-membered enediyne core 1,0 +ctcQ; flavin reductase (NADH) [EC:1.5.1.36] K21297 M00823 Chlortetracycline biosynthesis, pretetramide => chlortetracycline 7,0 +sgcE; enediyne polyketide synthase [RN:R11435] K15314 M00824 9-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 9-membered enediyne core 0,0 +sgcE2; enediyne biosynthesis protein E2 K21160 M00824 9-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 9-membered enediyne core 1,0 +sgcE3; enediyne biosynthesis protein E3 K21161 M00824 9-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 9-membered enediyne core 1,0 +sgcE4; enediyne biosynthesis protein E4 K21162 M00824 9-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 9-membered enediyne core 1,0 +sgcE5; enediyne biosynthesis protein E5 K21163 M00824 9-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 9-membered enediyne core 1,0 +sgcE7; enediyne biosynthesis protein E7 K21164 M00824 9-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 9-membered enediyne core 1,0 +sgcE8; enediyne biosynthesis protein E8 K21165 M00824 9-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 9-membered enediyne core 1,0 +sgcE9; enediyne biosynthesis protein E9 K21166 M00824 9-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 9-membered enediyne core 1,0 +sgcE11; enediyne biosynthesis protein E11 K21167 M00824 9-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 9-membered enediyne core 1,0 +sgcE; enediyne polyketide synthase [RN:R11435] K15314 M00825 10-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 10-membered enediyne core 0,0 +calE1; enediyne biosynthesis protein CalE1 K21168 M00825 10-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 10-membered enediyne core 1,0 +calE2; enediyne biosynthesis protein CalE2 K21169 M00825 10-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 10-membered enediyne core 1,0 +calE3; enediyne biosynthesis protein CalE3 K21170 M00825 10-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 10-membered enediyne core 1,0 +calE4; enediyne biosynthesis protein CalE4 K21171 M00825 10-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 10-membered enediyne core 1,0 +calE5; enediyne biosynthesis protein CalE5 K21172 M00825 10-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 10-membered enediyne core 1,0 +calE6; methionine gamma-lyase K21173 M00825 10-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 10-membered enediyne core 1,0 +calE9; enediyne biosynthesis protein CalE9 K21174 M00825 10-membered enediyne core biosynthesis, malonyl-CoA => 3-hydroxyhexadeca-4,6,8,10,12,14-hexaenoyl-ACP => 10-membered enediyne core 1,0 sgcD; 2-amino-4-deoxychorismate synthase [EC:2.6.1.86] [RN:R08956] K20159 M00826 C-1027 benzoxazolinate moiety biosynthesis, chorismate => benzoxazolinyl-CoA 0,0 C18054 2-Amino-2-deoxyisochorismate C00251 Chorismate sgcD1; 2-amino-4-deoxychorismate synthase, glutamine amidotransferase component [EC:2.6.1.86] [RN:R08956] K21175 M00826 C-1027 benzoxazolinate moiety biosynthesis, chorismate => benzoxazolinyl-CoA 0,0 C18054 2-Amino-2-deoxyisochorismate C00251 Chorismate sgcG; 2-amino-4-deoxychorismate dehydrogenase [EC:1.3.99.24] [RN:R09559] K20156 M00826 C-1027 benzoxazolinate moiety biosynthesis, chorismate => benzoxazolinyl-CoA 1,0 C19686 3-(1-Carboxyvinyloxy)anthranilate C18054 2-Amino-2-deoxyisochorismate @@ -3025,7 +3025,7 @@ ncsB; neocarzinostatin naphthoate synthase [EC:2.3.1.237] [RN:R11125] K20422 M00 ncsB3; 2-hydroxy-5-methyl-1-naphthoate 7-hydroxylase [EC:1.14.15.31] [RN:R10796] K20420 M00830 Neocarzinostatin naphthoate moiety biosynthesis, malonyl-CoA => 2-hydroxy-5-methyl-1-naphthoate => 2-hydroxy-7-methoxy-5-methyl-1-naphthoyl-CoA 1,0 C20857 2,7-Dihydroxy-5-methyl-1-naphthoate C20856 2-Hydroxy-5-methyl-1-naphthoate ncsB1; 2,7-dihydroxy-5-methyl-1-naphthoate 7-O-methyltransferase [EC:2.1.1.303] [RN:R10963] K20421 M00830 Neocarzinostatin naphthoate moiety biosynthesis, malonyl-CoA => 2-hydroxy-5-methyl-1-naphthoate => 2-hydroxy-7-methoxy-5-methyl-1-naphthoyl-CoA 2,0 C20841 2-Hydroxy-7-methoxy-5-methyl-1-naphthoate C20857 2,7-Dihydroxy-5-methyl-1-naphthoate ncsB2; 2-hydroxy-7-methoxy-5-methyl-1-naphthoate---CoA ligase [EC:6.2.1.43] [RN:R10771] K20423 M00830 Neocarzinostatin naphthoate moiety biosynthesis, malonyl-CoA => 2-hydroxy-5-methyl-1-naphthoate => 2-hydroxy-7-methoxy-5-methyl-1-naphthoyl-CoA 3,0 C20842 2-Hydroxy-7-methoxy-5-methyl-1-naphthoyl-CoA C20841 2-Hydroxy-7-methoxy-5-methyl-1-naphthoate -kedU38 K21221 M00831 Kedarcidin 2-hydroxynaphthoate moiety biosynthesis, malonyl-CoA => 3,6,8-trihydroxy-2-naphthoate => 3-hydroxy-7,8-dimethoxy-6-isopropoxy-2-naphthoyl-CoA 0,0 +kedU38 K21221 M00831 Kedarcidin 2-hydroxynaphthoate moiety biosynthesis, malonyl-CoA => 3,6,8-trihydroxy-2-naphthoate => 3-hydroxy-7,8-dimethoxy-6-isopropoxy-2-naphthoyl-CoA 0,0 kedN3; cytochrome P450 monooxygenase [EC:1.14.-.-] [RN:R11387] K21222 M00831 Kedarcidin 2-hydroxynaphthoate moiety biosynthesis, malonyl-CoA => 3,6,8-trihydroxy-2-naphthoate => 3-hydroxy-7,8-dimethoxy-6-isopropoxy-2-naphthoyl-CoA 1,0 C21321 3,6,7,8-Tetrahydroxy-2-naphthoate C21320 3,6,8-Trihydroxy-2-naphthoate kedN1; O-methyltransferase [EC:2.1.1.-] [RN:R11388] K21223 M00831 Kedarcidin 2-hydroxynaphthoate moiety biosynthesis, malonyl-CoA => 3,6,8-trihydroxy-2-naphthoate => 3-hydroxy-7,8-dimethoxy-6-isopropoxy-2-naphthoyl-CoA 2,0 C21322 3-Hydroxy-6,7,8-trimethoxy-2-naphthoate C21321 3,6,7,8-Tetrahydroxy-2-naphthoate kedN5; radical SAM C-methyltransferase [RN:R11389] K21224 M00831 Kedarcidin 2-hydroxynaphthoate moiety biosynthesis, malonyl-CoA => 3,6,8-trihydroxy-2-naphthoate => 3-hydroxy-7,8-dimethoxy-6-isopropoxy-2-naphthoyl-CoA 3,0 C21323 3-Hydroxy-7,8-dimethoxy-6-isopropoxy-2-naphthoate C21322 3-Hydroxy-6,7,8-trimethoxy-2-naphthoate @@ -3129,53 +3129,53 @@ mevalonate-3-phosphate-5-kinase [EC:2.7.1.186] [RN:R10780] K18690 M00849 C5 isop bisphosphomevalonate decarboxylase [EC:4.1.1.110] [RN:R10781] K22813 M00849 C5 isoprenoid biosynthesis, mevalonate pathway, archaea 3,1,2,0 C20345 Isopentenyl phosphate C20848 (R)-Mevalonate 3,5-bisphosphate isopentenyl phosphate kinase [EC:2.7.4.26] [RN:R10093] K06981 M00849 C5 isoprenoid biosynthesis, mevalonate pathway, archaea 4,0 C00129 Isopentenyl diphosphate C20345 Isopentenyl phosphate isopentenyl-diphosphate Delta-isomerase [EC:5.3.3.2] [RN:R01123] K01823 M00849 C5 isoprenoid biosynthesis, mevalonate pathway, archaea 5,0 C00235 Dimethylallyl diphosphate C00129 Isopentenyl diphosphate -ctxA; cholera enterotoxin subunit A [EC:2.4.2.36] K10928 M00850 Vibrio cholerae pathogenicity signature, cholera toxins 0,0 -ctxB; cholera enterotoxin subunit B K10929 M00850 Vibrio cholerae pathogenicity signature, cholera toxins 0,0 -zot; zona occludens toxin K10954 M00850 Vibrio cholerae pathogenicity signature, cholera toxins 1,0 -ace; accessory cholera enterotoxin K10952 M00850 Vibrio cholerae pathogenicity signature, cholera toxins 2,0 -rtxA; RTX toxin RtxA K10953 M00850 Vibrio cholerae pathogenicity signature, cholera toxins 3,0 -hlyA; hemolysin K10948 M00850 Vibrio cholerae pathogenicity signature, cholera toxins 4,0 -tlh; thermolabile hemolysin K11018 M00850 Vibrio cholerae pathogenicity signature, cholera toxins 5,0 -blaKPC; beta-lactamase class A KPC [EC:3.5.2.6] K18768 M00851 Carbapenem resistance 0,0 -blaGES; beta-lactamase class A GES [EC:3.5.2.6] K18970 M00851 Carbapenem resistance 0,1 -blaIMI; beta-lactamase class A IMI [EC:3.5.2.6] K19316 M00851 Carbapenem resistance 0,2 -blaSME; beta-lactamase class A SME [EC:3.5.2.6] K22346 M00851 Carbapenem resistance 0,3 -blaOXA-51; beta-lactamase class D OXA-51 [EC:3.5.2.6] K18794 M00851 Carbapenem resistance 0,4 -blaOXA-213; beta-lactamase class D OXA-213 [EC:3.5.2.6] K19318 M00851 Carbapenem resistance 0,5 -blaOXA-24; beta-lactamase class D OXA-24 [EC:3.5.2.6] K18971 M00851 Carbapenem resistance 0,6 -blaOXA-23; beta-lactamase class D OXA-23 [EC:3.5.2.6] K18793 M00851 Carbapenem resistance 0,7 -blaOXA-134; beta-lactamase class D OXA-134 [EC:3.5.2.6] K19319 M00851 Carbapenem resistance 0,8 -blaOXA-211; beta-lactamase class D OXA-211 [EC:3.5.2.6] K19320 M00851 Carbapenem resistance 0,9 -blaOXA-214; beta-lactamase class D OXA-214 [EC:3.5.2.6] K19321 M00851 Carbapenem resistance 0,10 -blaOXA-229; beta-lactamase class D OXA-229 [EC:3.5.2.6] K19322 M00851 Carbapenem resistance 0,11 -blaOXA-58; beta-lactamase class D OXA-58 [EC:3.5.2.6] K18972 M00851 Carbapenem resistance 0,12 -blaOXA-62; beta-lactamase class D OXA-62 [EC:3.5.2.6] K19211 M00851 Carbapenem resistance 0,13 -blaOXA-48; beta-lactamase class D OXA-48 [EC:3.5.2.6] K18976 M00851 Carbapenem resistance 0,14 -blaOXA-60; beta-lactamase class D OXA-60 [EC:3.5.2.6] K21277 M00851 Carbapenem resistance 0,15 -blaIMP; metallo-beta-lactamase class B IMP [EC:3.5.2.6] K18782 M00851 Carbapenem resistance 0,16 -blaVIM; metallo-beta-lactamase class B VIM [EC:3.5.2.6] K18781 M00851 Carbapenem resistance 0,17 -blaNDM; metallo-beta-lactamase class B NDM [EC:3.5.2.6] K18780 M00851 Carbapenem resistance 0,18 -blaGIM; metallo-beta-lactamase class B GIM [EC:3.5.2.6] K19099 M00851 Carbapenem resistance 0,19 -blaIND; metallo-beta-lactamase class B IND [EC:3.5.2.6] K19216 M00851 Carbapenem resistance 0,20 -tcpI; toxin coregulated pilus biosynthesis protein I K10961 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 0,0 -tcpP; toxin coregulated pilus biosynthesis protein P K10920 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 1,0 -tcpH; toxin coregulated pilus biosynthesis protein H K10919 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 2,0 -tcpA; toxin coregulated pilin K10930 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 3,0 -tcpB; toxin coregulated pilus biosynthesis protein B K10931 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 4,0 -tcpQ; toxin coregulated pilus biosynthesis protein Q K10962 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 5,0 -tcpC; toxin coregulated pilus biosynthesis outer membrane protein C K10932 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 6,0 -tcpR; toxin coregulated pilus biosynthesis protein R K10963 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 7,0 -tcpD; toxin coregulated pilus biosynthesis protein D K10933 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 8,0 -tcpS; toxin coregulated pilus biosynthesis protein S K10964 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 9,0 -tcpT; toxin coregulated pilus biosynthesis protein T K10965 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 10,0 -tcpE; toxin coregulated pilus biosynthesis protein E K10934 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 11,0 -tcpF; toxin coregulated pilus biosynthesis protein F K10935 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 12,0 -tcpJ; toxin coregulated pilus biosynthesis protein J [EC:3.4.23.43 2.1.1.-] K10966 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 13,0 -cfaA; CFA/I fimbrial subunit A K22850 M00853 ETEC pathogenicity signature, colonization factors 0,0 -cfaB; CFA/I fimbrial subunit B K22851 M00853 ETEC pathogenicity signature, colonization factors 1,0 -cfaC; CFA/I fimbrial subunit C K22852 M00853 ETEC pathogenicity signature, colonization factors 2,0 -cfaE; CFA/I fimbrial subunit E K22853 M00853 ETEC pathogenicity signature, colonization factors 3,0 -cfaD; CFA/I fimbrial subunit D K22854 M00853 ETEC pathogenicity signature, colonization factors 4,0 +ctxA; cholera enterotoxin subunit A [EC:2.4.2.36] K10928 M00850 Vibrio cholerae pathogenicity signature, cholera toxins 0,0 +ctxB; cholera enterotoxin subunit B K10929 M00850 Vibrio cholerae pathogenicity signature, cholera toxins 0,0 +zot; zona occludens toxin K10954 M00850 Vibrio cholerae pathogenicity signature, cholera toxins 1,0 +ace; accessory cholera enterotoxin K10952 M00850 Vibrio cholerae pathogenicity signature, cholera toxins 2,0 +rtxA; RTX toxin RtxA K10953 M00850 Vibrio cholerae pathogenicity signature, cholera toxins 3,0 +hlyA; hemolysin K10948 M00850 Vibrio cholerae pathogenicity signature, cholera toxins 4,0 +tlh; thermolabile hemolysin K11018 M00850 Vibrio cholerae pathogenicity signature, cholera toxins 5,0 +blaKPC; beta-lactamase class A KPC [EC:3.5.2.6] K18768 M00851 Carbapenem resistance 0,0 +blaGES; beta-lactamase class A GES [EC:3.5.2.6] K18970 M00851 Carbapenem resistance 0,1 +blaIMI; beta-lactamase class A IMI [EC:3.5.2.6] K19316 M00851 Carbapenem resistance 0,2 +blaSME; beta-lactamase class A SME [EC:3.5.2.6] K22346 M00851 Carbapenem resistance 0,3 +blaOXA-51; beta-lactamase class D OXA-51 [EC:3.5.2.6] K18794 M00851 Carbapenem resistance 0,4 +blaOXA-213; beta-lactamase class D OXA-213 [EC:3.5.2.6] K19318 M00851 Carbapenem resistance 0,5 +blaOXA-24; beta-lactamase class D OXA-24 [EC:3.5.2.6] K18971 M00851 Carbapenem resistance 0,6 +blaOXA-23; beta-lactamase class D OXA-23 [EC:3.5.2.6] K18793 M00851 Carbapenem resistance 0,7 +blaOXA-134; beta-lactamase class D OXA-134 [EC:3.5.2.6] K19319 M00851 Carbapenem resistance 0,8 +blaOXA-211; beta-lactamase class D OXA-211 [EC:3.5.2.6] K19320 M00851 Carbapenem resistance 0,9 +blaOXA-214; beta-lactamase class D OXA-214 [EC:3.5.2.6] K19321 M00851 Carbapenem resistance 0,10 +blaOXA-229; beta-lactamase class D OXA-229 [EC:3.5.2.6] K19322 M00851 Carbapenem resistance 0,11 +blaOXA-58; beta-lactamase class D OXA-58 [EC:3.5.2.6] K18972 M00851 Carbapenem resistance 0,12 +blaOXA-62; beta-lactamase class D OXA-62 [EC:3.5.2.6] K19211 M00851 Carbapenem resistance 0,13 +blaOXA-48; beta-lactamase class D OXA-48 [EC:3.5.2.6] K18976 M00851 Carbapenem resistance 0,14 +blaOXA-60; beta-lactamase class D OXA-60 [EC:3.5.2.6] K21277 M00851 Carbapenem resistance 0,15 +blaIMP; metallo-beta-lactamase class B IMP [EC:3.5.2.6] K18782 M00851 Carbapenem resistance 0,16 +blaVIM; metallo-beta-lactamase class B VIM [EC:3.5.2.6] K18781 M00851 Carbapenem resistance 0,17 +blaNDM; metallo-beta-lactamase class B NDM [EC:3.5.2.6] K18780 M00851 Carbapenem resistance 0,18 +blaGIM; metallo-beta-lactamase class B GIM [EC:3.5.2.6] K19099 M00851 Carbapenem resistance 0,19 +blaIND; metallo-beta-lactamase class B IND [EC:3.5.2.6] K19216 M00851 Carbapenem resistance 0,20 +tcpI; toxin coregulated pilus biosynthesis protein I K10961 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 0,0 +tcpP; toxin coregulated pilus biosynthesis protein P K10920 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 1,0 +tcpH; toxin coregulated pilus biosynthesis protein H K10919 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 2,0 +tcpA; toxin coregulated pilin K10930 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 3,0 +tcpB; toxin coregulated pilus biosynthesis protein B K10931 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 4,0 +tcpQ; toxin coregulated pilus biosynthesis protein Q K10962 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 5,0 +tcpC; toxin coregulated pilus biosynthesis outer membrane protein C K10932 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 6,0 +tcpR; toxin coregulated pilus biosynthesis protein R K10963 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 7,0 +tcpD; toxin coregulated pilus biosynthesis protein D K10933 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 8,0 +tcpS; toxin coregulated pilus biosynthesis protein S K10964 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 9,0 +tcpT; toxin coregulated pilus biosynthesis protein T K10965 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 10,0 +tcpE; toxin coregulated pilus biosynthesis protein E K10934 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 11,0 +tcpF; toxin coregulated pilus biosynthesis protein F K10935 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 12,0 +tcpJ; toxin coregulated pilus biosynthesis protein J [EC:3.4.23.43 2.1.1.-] K10966 M00852 Vibrio cholerae pathogenicity signature, toxin coregulated pilus 13,0 +cfaA; CFA/I fimbrial subunit A K22850 M00853 ETEC pathogenicity signature, colonization factors 0,0 +cfaB; CFA/I fimbrial subunit B K22851 M00853 ETEC pathogenicity signature, colonization factors 1,0 +cfaC; CFA/I fimbrial subunit C K22852 M00853 ETEC pathogenicity signature, colonization factors 2,0 +cfaE; CFA/I fimbrial subunit E K22853 M00853 ETEC pathogenicity signature, colonization factors 3,0 +cfaD; CFA/I fimbrial subunit D K22854 M00853 ETEC pathogenicity signature, colonization factors 4,0 UTP--glucose-1-phosphate uridylyltransferase [EC:2.7.7.9] [RN:R00289] K00963 M00854 Glycogen biosynthesis, glucose-1P => glycogen/starch 0,0,0,0 C00029 UDP-glucose C00103 D-Glucose 1-phosphate glycogen synthase [EC:2.4.1.11] [RN:R00292] K00693 M00854 Glycogen biosynthesis, glucose-1P => glycogen/starch 0,0,1,0 C00718 Amylose C00029 UDP-glucose glycogen synthase [EC:2.4.1.11] [RN:R00292] K00750 M00854 Glycogen biosynthesis, glucose-1P => glycogen/starch 0,0,1,0 C00718 Amylose C00029 UDP-glucose @@ -3199,30 +3199,30 @@ pullulanase [EC:3.2.1.41] [COG:COG1523] [RN:R02111] K01200 M00855 Glycogen degra phosphoglucomutase [EC:5.4.2.2] [RN:R08639] K15779 M00855 Glycogen degradation, glycogen => glucose-6P 2,0 C00092 D-Glucose 6-phosphate C00103 D-Glucose 1-phosphate phosphoglucomutase [EC:5.4.2.2] [RN:R08639] K01835 M00855 Glycogen degradation, glycogen => glucose-6P 2,1 C00092 D-Glucose 6-phosphate C00103 D-Glucose 1-phosphate phosphoglucomutase [EC:5.4.2.2] [RN:R08639] K15778 M00855 Glycogen degradation, glycogen => glucose-6P 2,2 C00092 D-Glucose 6-phosphate C00103 D-Glucose 1-phosphate -cdtB; cytolethal distending toxin subunit B K11014 M00856 Salmonella enterica pathogenicity signature, typhoid toxin 0,0 -ptxA; pertussis toxin subunit 1 [EC:2.4.2.-] K11023 M00856 Salmonella enterica pathogenicity signature, typhoid toxin 1,0 -subB; subtilase cytotoxin, subunit B K19298 M00856 Salmonella enterica pathogenicity signature, typhoid toxin 2,0 -ttsA; typhoid toxin secretion A K22918 M00856 Salmonella enterica pathogenicity signature, typhoid toxin 3,0 -tviA; Vi polysaccharide biosynthesis protein TviA K22914 M00857 Salmonella enterica pathogenicity signature, Vi antigen 0,0 -tviB; UDP-N-acetylglucosamine 6-dehydrogenase [EC:1.1.1.136] K22926 M00857 Salmonella enterica pathogenicity signature, Vi antigen 1,0 -tviC; UDP-N-acetylglucosaminuronic acid 4-epimerase [EC:5.1.3.-] K22925 M00857 Salmonella enterica pathogenicity signature, Vi antigen 2,0 -tviD; Vi polysaccharide biosynthesis protein TviD K22915 M00857 Salmonella enterica pathogenicity signature, Vi antigen 3,0 -tviE; Vi polysaccharide biosynthesis protein TviE K22916 M00857 Salmonella enterica pathogenicity signature, Vi antigen 4,0 -vexE; Vi polysaccharide export protein VexE K22917 M00857 Salmonella enterica pathogenicity signature, Vi antigen 5,0 -vexA; Vi polysaccharide export protein VexA K22924 M00857 Salmonella enterica pathogenicity signature, Vi antigen 6,0 -vexB; Vi polysaccharide transport system permease protein K22921 M00857 Salmonella enterica pathogenicity signature, Vi antigen 6,0 -vexC; Vi polysaccharide transport system ATP-binding protein [EC:3.6.3.38] K22923 M00857 Salmonella enterica pathogenicity signature, Vi antigen 6,0 -vexD; Vi polysaccharide transport system permease protein K22922 M00857 Salmonella enterica pathogenicity signature, Vi antigen 6,0 -pagA; protective antigen K11030 M00859 Bacillus anthracis pathogenicity signature, anthrax toxin 0,0 -lef; anthrax lethal toxin endopeptidase [EC:3.4.24.83] K08645 M00859 Bacillus anthracis pathogenicity signature, anthrax toxin 1,0 -cyaA; anthrax edema toxin adenylate cyclase [EC:4.6.1.1] K11029 M00859 Bacillus anthracis pathogenicity signature, anthrax toxin 2,0 -atxA; anthrax toxin expression trans-acting positive regulator K22976 M00860 Bacillus anthracis pathogenicity signature, polyglutamic acid capsule biosynthesis 0,0 -acpA; capsule synthesis positive regulator AcpA K22977 M00860 Bacillus anthracis pathogenicity signature, polyglutamic acid capsule biosynthesis 1,0 -acpB; capsule synthesis positive regulator AcpB K22980 M00860 Bacillus anthracis pathogenicity signature, polyglutamic acid capsule biosynthesis 2,0 -capA; gamma-polyglutamate biosynthesis protein CapA K07282 M00860 Bacillus anthracis pathogenicity signature, polyglutamic acid capsule biosynthesis 3,0 -capC; gamma-polyglutamate biosynthesis protein CapC K22116 M00860 Bacillus anthracis pathogenicity signature, polyglutamic acid capsule biosynthesis 4,0 -capB; gamma-polyglutamate synthase [EC:6.3.2.-] K01932 M00860 Bacillus anthracis pathogenicity signature, polyglutamic acid capsule biosynthesis 5,0 -capE; gamma-polyglutamate biosynthesis protein CapE K22981 M00860 Bacillus anthracis pathogenicity signature, polyglutamic acid capsule biosynthesis 6,0 +cdtB; cytolethal distending toxin subunit B K11014 M00856 Salmonella enterica pathogenicity signature, typhoid toxin 0,0 +ptxA; pertussis toxin subunit 1 [EC:2.4.2.-] K11023 M00856 Salmonella enterica pathogenicity signature, typhoid toxin 1,0 +subB; subtilase cytotoxin, subunit B K19298 M00856 Salmonella enterica pathogenicity signature, typhoid toxin 2,0 +ttsA; typhoid toxin secretion A K22918 M00856 Salmonella enterica pathogenicity signature, typhoid toxin 3,0 +tviA; Vi polysaccharide biosynthesis protein TviA K22914 M00857 Salmonella enterica pathogenicity signature, Vi antigen 0,0 +tviB; UDP-N-acetylglucosamine 6-dehydrogenase [EC:1.1.1.136] K22926 M00857 Salmonella enterica pathogenicity signature, Vi antigen 1,0 +tviC; UDP-N-acetylglucosaminuronic acid 4-epimerase [EC:5.1.3.-] K22925 M00857 Salmonella enterica pathogenicity signature, Vi antigen 2,0 +tviD; Vi polysaccharide biosynthesis protein TviD K22915 M00857 Salmonella enterica pathogenicity signature, Vi antigen 3,0 +tviE; Vi polysaccharide biosynthesis protein TviE K22916 M00857 Salmonella enterica pathogenicity signature, Vi antigen 4,0 +vexE; Vi polysaccharide export protein VexE K22917 M00857 Salmonella enterica pathogenicity signature, Vi antigen 5,0 +vexA; Vi polysaccharide export protein VexA K22924 M00857 Salmonella enterica pathogenicity signature, Vi antigen 6,0 +vexB; Vi polysaccharide transport system permease protein K22921 M00857 Salmonella enterica pathogenicity signature, Vi antigen 6,0 +vexC; Vi polysaccharide transport system ATP-binding protein [EC:3.6.3.38] K22923 M00857 Salmonella enterica pathogenicity signature, Vi antigen 6,0 +vexD; Vi polysaccharide transport system permease protein K22922 M00857 Salmonella enterica pathogenicity signature, Vi antigen 6,0 +pagA; protective antigen K11030 M00859 Bacillus anthracis pathogenicity signature, anthrax toxin 0,0 +lef; anthrax lethal toxin endopeptidase [EC:3.4.24.83] K08645 M00859 Bacillus anthracis pathogenicity signature, anthrax toxin 1,0 +cyaA; anthrax edema toxin adenylate cyclase [EC:4.6.1.1] K11029 M00859 Bacillus anthracis pathogenicity signature, anthrax toxin 2,0 +atxA; anthrax toxin expression trans-acting positive regulator K22976 M00860 Bacillus anthracis pathogenicity signature, polyglutamic acid capsule biosynthesis 0,0 +acpA; capsule synthesis positive regulator AcpA K22977 M00860 Bacillus anthracis pathogenicity signature, polyglutamic acid capsule biosynthesis 1,0 +acpB; capsule synthesis positive regulator AcpB K22980 M00860 Bacillus anthracis pathogenicity signature, polyglutamic acid capsule biosynthesis 2,0 +capA; gamma-polyglutamate biosynthesis protein CapA K07282 M00860 Bacillus anthracis pathogenicity signature, polyglutamic acid capsule biosynthesis 3,0 +capC; gamma-polyglutamate biosynthesis protein CapC K22116 M00860 Bacillus anthracis pathogenicity signature, polyglutamic acid capsule biosynthesis 4,0 +capB; gamma-polyglutamate synthase [EC:6.3.2.-] K01932 M00860 Bacillus anthracis pathogenicity signature, polyglutamic acid capsule biosynthesis 5,0 +capE; gamma-polyglutamate biosynthesis protein CapE K22981 M00860 Bacillus anthracis pathogenicity signature, polyglutamic acid capsule biosynthesis 6,0 acyl-CoA oxidase [EC:1.3.3.6] [RN:R07934 R07950] K00232 M00861 beta-Oxidation, peroxisome, VLCFA 0,0 C16387 (2E,6Z,9Z,12Z,15Z,18Z)-Tetracosahexaenoyl-CoA C16172 (6Z,9Z,12Z,15Z,18Z)-Tetracosapentaenoyl-CoA (3R)-3-hydroxyacyl-CoA dehydrogenase / enoyl-CoA hydratase 2 [EC:1.1.1.- 4.2.1.119] [RN:R07935 R07936 R07951 R07952] K12405 M00861 beta-Oxidation, peroxisome, VLCFA 1,0 C16389 (6Z,9Z,12Z,15Z,18Z)-3-Oxotetracosapentaenoyl-CoA C16388 (3R,6Z,9Z,12Z,15Z,18Z)-3-Hydroxytetracosapentaenoyl-CoA acetyl-CoA acyltransferase 1 [EC:2.3.1.16] [RN:R07937 R07953] K07513 M00861 beta-Oxidation, peroxisome, VLCFA 2,0 C16173 (4Z,7Z,10Z,13Z,16Z)-Docosapentaenoyl-CoA C16389 (6Z,9Z,12Z,15Z,18Z)-3-Oxotetracosapentaenoyl-CoA @@ -3230,16 +3230,16 @@ sterol carrier protein 2 [EC:2.3.1.176] [RN:R07937 R07953] K08764 M00861 beta-Ox 3alpha,7alpha,12alpha-trihydroxy-5beta-cholestanoyl-CoA 24-hydroxylase [EC:1.17.99.3] [RN:R08735 R08740] K10214 M00862 beta-Oxidation, peroxisome, tri/dihydroxycholestanoyl-CoA => choloyl/chenodeoxycholoyl-CoA 0,0 C05447 (24E)-3alpha,7alpha-Dihydroxy-5beta-cholest-24-enoyl-CoA C17346 (25S)-3alpha,7alpha-Dihydroxy-5beta-cholestanoyl-CoA (3R)-3-hydroxyacyl-CoA dehydrogenase / 3a,7a,12a-trihydroxy-5b-cholest-24-enoyl-CoA hydratase [EC:1.1.1.- 4.2.1.107] [RN:R04813 R04812 R04809 R04810] K12405 M00862 beta-Oxidation, peroxisome, tri/dihydroxycholestanoyl-CoA => choloyl/chenodeoxycholoyl-CoA 1,0 C05449 3alpha,7alpha-Dihydroxy-5beta-24-oxocholestanoyl-CoA C05448 (24R,25R)-3alpha,7alpha,24-Trihydroxy-5beta-cholestanoyl-CoA sterol carrier protein 2 [EC:2.3.1.176] [RN:R03719 R04811] K08764 M00862 beta-Oxidation, peroxisome, tri/dihydroxycholestanoyl-CoA => choloyl/chenodeoxycholoyl-CoA 2,0 C05337 Chenodeoxycholoyl-CoA C05449 3alpha,7alpha-Dihydroxy-5beta-24-oxocholestanoyl-CoA -lpxA; UDP-N-acetylglucosamine acyltransferase [EC:2.3.1.129] K00677 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 0,0 -lpxC; UDP-3-O-[3-hydroxymyristoyl] N-acetylglucosamine deacetylase [EC:3.5.1.108] K02535 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 1,0 -lpxC-fabZ; UDP-3-O-[3-hydroxymyristoyl] N-acetylglucosamine deacetylase / 3-hydroxyacyl-[acyl-carrier-protein] dehydratase [EC:3.5.1.108 4.2.1.59] K16363 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 1,1 -lpxD; UDP-3-O-[3-hydroxymyristoyl] glucosamine N-acyltransferase [EC:2.3.1.191] K02536 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 2,0 -lpxH; UDP-2,3-diacylglucosamine hydrolase [EC:3.6.1.54] K03269 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 3,0 -lpxB; lipid-A-disaccharide synthase [EC:2.4.1.182] K00748 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 4,0 -lpxK; tetraacyldisaccharide 4'-kinase [EC:2.7.1.130] K00912 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 5,0 -kdtA; 3-deoxy-D-manno-octulosonic-acid transferase [EC:2.4.99.12 2.4.99.13 2.4.99.14 2.4.99.15] K02527 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 6,0 -lpxL, htrB; Kdo2-lipid IVA lauroyltransferase/acyltransferase [EC:2.3.1.241 2.3.1.-] K02517 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 7,0 -lpxJ; Kdo2-lipid IVA 3' secondary acyltransferase [EC:2.3.1.-] K09778 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 8,0 +lpxA; UDP-N-acetylglucosamine acyltransferase [EC:2.3.1.129] K00677 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 0,0 +lpxC; UDP-3-O-[3-hydroxymyristoyl] N-acetylglucosamine deacetylase [EC:3.5.1.108] K02535 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 1,0 +lpxC-fabZ; UDP-3-O-[3-hydroxymyristoyl] N-acetylglucosamine deacetylase / 3-hydroxyacyl-[acyl-carrier-protein] dehydratase [EC:3.5.1.108 4.2.1.59] K16363 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 1,1 +lpxD; UDP-3-O-[3-hydroxymyristoyl] glucosamine N-acyltransferase [EC:2.3.1.191] K02536 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 2,0 +lpxH; UDP-2,3-diacylglucosamine hydrolase [EC:3.6.1.54] K03269 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 3,0 +lpxB; lipid-A-disaccharide synthase [EC:2.4.1.182] K00748 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 4,0 +lpxK; tetraacyldisaccharide 4'-kinase [EC:2.7.1.130] K00912 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 5,0 +kdtA; 3-deoxy-D-manno-octulosonic-acid transferase [EC:2.4.99.12 2.4.99.13 2.4.99.14 2.4.99.15] K02527 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 6,0 +lpxL, htrB; Kdo2-lipid IVA lauroyltransferase/acyltransferase [EC:2.3.1.241 2.3.1.-] K02517 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 7,0 +lpxJ; Kdo2-lipid IVA 3' secondary acyltransferase [EC:2.3.1.-] K09778 M00866 KDO2-lipid A biosynthesis, Raetz pathway, non-LpxL-LpxM type 8,0 lpxE; lipid A 1-phosphatase [EC:3.1.3.-] [RN:R12201] K12977 M00867 KDO2-lipid A modification pathway 0,0 C21994 1-Dephospho-KDO2-lipid A C21988 H. pylori KDO2-lipid A eptA; lipid A ethanolaminephosphotransferase [EC:2.7.8.43] [RN:R12202] K03760 M00867 KDO2-lipid A modification pathway 1,0 C21995 1-PEtN-KDO2-lipid A C21994 1-Dephospho-KDO2-lipid A kdoH1; 3-deoxy-D-manno-octulosonic acid-hydrolase [EC:3.2.1.144] [RN:R12219] K23082 M00867 KDO2-lipid A modification pathway 2,0 C21996,C01187 1-PEtN-KDO-lipid A,3-Deoxy-D-manno-octulosonate C21995 1-PEtN-KDO2-lipid A @@ -3255,25 +3255,25 @@ coproporphyrinogen III oxidase [EC:1.3.3.3] [RN:R03220] K00228 M00868 Heme biosy protoporphyrinogen/coproporphyrinogen III oxidase [EC:1.3.3.4] [RN:R03222] K00231 M00868 Heme biosynthesis, animals and fungi, glycine => heme 6,0 C02191 Protoporphyrin C01079 Protoporphyrinogen IX protoporphyrin/coproporphyrin ferrochelatase [EC:4.99.1.1] [RN:R00310] K01772 M00868 Heme biosynthesis, animals and fungi, glycine => heme 7,0 C00032 Heme C02191 Protoporphyrin FKTN; fukutin [EC:2.7.8.-] [RN:R12294] K19872 M00872 O-glycan biosynthesis, mannose type (core M3) 0,0 G13093 C00789,G13092 CDP-ribitol,Phospho-core M3 -FKRP; fukutin-related protein [EC:2.7.8.-] [RN:R12295] K19873 M00872 O-glycan biosynthesis, mannose type (core M3) 1,0 G13094 G13093 -TMEM5; alpha-dystroglycan beta1,4-xylosyltransferase [EC:2.4.2.61] [RN:R12244] K21052 M00872 O-glycan biosynthesis, mannose type (core M3) 2,0 G13095 G13094 -B4GAT1; beta-1,4-glucuronyltransferase 1 [EC:2.4.1.-] [RN:R12296] K21032 M00872 O-glycan biosynthesis, mannose type (core M3) 3,0 G13096 G13095 -LARGE; glycosyltransferase-like protein LARGE [EC:2.4.2.- 2.4.1.-] [RN:R12297 R12298] K09668 M00872 O-glycan biosynthesis, mannose type (core M3) 4,0 G13098 G13097 -malonyl-CoA/methylmalonyl-CoA synthetase [EC:6.2.1.-] K18660 M00873 Fatty acid biosynthesis in mitochondria, animals 0,0 -NADH dehydrogenase (ubiquinone) 1 alpha/beta subcomplex 1, acyl-carrier protein K03955 M00873 Fatty acid biosynthesis in mitochondria, animals 1,0 -[acyl-carrier-protein] S-malonyltransferase [EC:2.3.1.39] K00645 M00873 Fatty acid biosynthesis in mitochondria, animals 1,0 -3-oxoacyl-[acyl-carrier-protein] synthase II [EC:2.3.1.179] K09458 M00873 Fatty acid biosynthesis in mitochondria, animals 2,0 -3-oxoacyl-[acyl-carrier protein] reductase [EC:1.1.1.-] K11539 M00873 Fatty acid biosynthesis in mitochondria, animals 3,0 -3-oxoacyl-[acyl-carrier protein] reductase [EC:1.1.1.-] K13370 M00873 Fatty acid biosynthesis in mitochondria, animals 3,0 -3-hydroxyacyl-thioester dehydratase, animal type [EC:4.2.1.-] K22540 M00873 Fatty acid biosynthesis in mitochondria, animals 4,0 -mitochondrial enoyl-[acyl-carrier protein] reductase [EC:1.3.1.-] K07512 M00873 Fatty acid biosynthesis in mitochondria, animals 5,0 -acetyl-CoA carboxylase / biotin carboxylase 1 [EC:6.4.1.2] K11262 M00874 Fatty acid biosynthesis in mitochondria, fungi 0,0 -NADH dehydrogenase (ubiquinone) 1 alpha/beta subcomplex 1, acyl-carrier protein K03955 M00874 Fatty acid biosynthesis in mitochondria, fungi 1,0 -[acyl-carrier-protein] S-malonyltransferase [EC:2.3.1.39] K00645 M00874 Fatty acid biosynthesis in mitochondria, fungi 1,0 -3-oxoacyl-[acyl-carrier-protein] synthase II [EC:2.3.1.179] K09458 M00874 Fatty acid biosynthesis in mitochondria, fungi 2,0 -3-oxoacyl-[acyl-carrier protein] reductase [EC:1.1.1.100] K00059 M00874 Fatty acid biosynthesis in mitochondria, fungi 3,0 -3-hydroxyacyl-thioester dehydratase, fungi type [EC:4.2.1.-] K22541 M00874 Fatty acid biosynthesis in mitochondria, fungi 4,0 -mitochondrial enoyl-[acyl-carrier protein] reductase [EC:1.3.1.-] K07512 M00874 Fatty acid biosynthesis in mitochondria, fungi 5,0 +FKRP; fukutin-related protein [EC:2.7.8.-] [RN:R12295] K19873 M00872 O-glycan biosynthesis, mannose type (core M3) 1,0 G13094 G13093 +TMEM5; alpha-dystroglycan beta1,4-xylosyltransferase [EC:2.4.2.61] [RN:R12244] K21052 M00872 O-glycan biosynthesis, mannose type (core M3) 2,0 G13095 G13094 +B4GAT1; beta-1,4-glucuronyltransferase 1 [EC:2.4.1.-] [RN:R12296] K21032 M00872 O-glycan biosynthesis, mannose type (core M3) 3,0 G13096 G13095 +LARGE; glycosyltransferase-like protein LARGE [EC:2.4.2.- 2.4.1.-] [RN:R12297 R12298] K09668 M00872 O-glycan biosynthesis, mannose type (core M3) 4,0 G13098 G13097 +malonyl-CoA/methylmalonyl-CoA synthetase [EC:6.2.1.-] K18660 M00873 Fatty acid biosynthesis in mitochondria, animals 0,0 +NADH dehydrogenase (ubiquinone) 1 alpha/beta subcomplex 1, acyl-carrier protein K03955 M00873 Fatty acid biosynthesis in mitochondria, animals 1,0 +[acyl-carrier-protein] S-malonyltransferase [EC:2.3.1.39] K00645 M00873 Fatty acid biosynthesis in mitochondria, animals 1,0 +3-oxoacyl-[acyl-carrier-protein] synthase II [EC:2.3.1.179] K09458 M00873 Fatty acid biosynthesis in mitochondria, animals 2,0 +3-oxoacyl-[acyl-carrier protein] reductase [EC:1.1.1.-] K11539 M00873 Fatty acid biosynthesis in mitochondria, animals 3,0 +3-oxoacyl-[acyl-carrier protein] reductase [EC:1.1.1.-] K13370 M00873 Fatty acid biosynthesis in mitochondria, animals 3,0 +3-hydroxyacyl-thioester dehydratase, animal type [EC:4.2.1.-] K22540 M00873 Fatty acid biosynthesis in mitochondria, animals 4,0 +mitochondrial enoyl-[acyl-carrier protein] reductase [EC:1.3.1.-] K07512 M00873 Fatty acid biosynthesis in mitochondria, animals 5,0 +acetyl-CoA carboxylase / biotin carboxylase 1 [EC:6.4.1.2] K11262 M00874 Fatty acid biosynthesis in mitochondria, fungi 0,0 +NADH dehydrogenase (ubiquinone) 1 alpha/beta subcomplex 1, acyl-carrier protein K03955 M00874 Fatty acid biosynthesis in mitochondria, fungi 1,0 +[acyl-carrier-protein] S-malonyltransferase [EC:2.3.1.39] K00645 M00874 Fatty acid biosynthesis in mitochondria, fungi 1,0 +3-oxoacyl-[acyl-carrier-protein] synthase II [EC:2.3.1.179] K09458 M00874 Fatty acid biosynthesis in mitochondria, fungi 2,0 +3-oxoacyl-[acyl-carrier protein] reductase [EC:1.1.1.100] K00059 M00874 Fatty acid biosynthesis in mitochondria, fungi 3,0 +3-hydroxyacyl-thioester dehydratase, fungi type [EC:4.2.1.-] K22541 M00874 Fatty acid biosynthesis in mitochondria, fungi 4,0 +mitochondrial enoyl-[acyl-carrier protein] reductase [EC:1.3.1.-] K07512 M00874 Fatty acid biosynthesis in mitochondria, fungi 5,0 sbnI; L-serine kinase (ATP) / ParB family transcriptional regulator, heme-responsive regulator [EC:2.7.1.225] [RN:R12344] K23371 M00875 Staphyloferrin B biosynthesis, L-serine => staphyloferrin B 0,0 C01005 O-Phospho-L-serine C00065 L-Serine sbnA; N-(2-amino-2-carboxyethyl)-L-glutamate synthase [EC:2.5.1.140] [RN:R11705] K21949 M00875 Staphyloferrin B biosynthesis, L-serine => staphyloferrin B 1,0 C21559 N-[(2S)-2-Amino-2-carboxyethyl]-L-glutamate C01005 O-Phospho-L-serine sbnB; N-[(2S)-2-amino-2-carboxyethyl]-L-glutamate dehydrogenase [EC:1.5.1.51] [RN:11655] K21721 M00875 Staphyloferrin B biosynthesis, L-serine => staphyloferrin B 2,0 C03401 L-2,3-Diaminopropanoate C21559 N-[(2S)-2-Amino-2-carboxyethyl]-L-glutamate diff --git a/bin/assets/traits_rules.tsv b/bin/assets/traits_rules.tsv old mode 100755 new mode 100644 index 1c2a47c7..48b79167 --- a/bin/assets/traits_rules.tsv +++ b/bin/assets/traits_rules.tsv @@ -1,80 +1,80 @@ name alias rule topic_ecosystem notes -Methanogen methanogen mcr & notOtherMethanogen energy - mcr K00399 | K00400 | K00401 | K00402 | K03421 | K03422 energy - notOtherMethanogen not(OtherAjMethanogen) energy - OtherAjMethanogen sulfatereducer | Denitrifier | AerobicAmmoniaOxidizer | comammox | annamox | Phototroph | ETC60 energy -Aerobic Ammonia Oxidizer AerobicAmmoniaOxidizer AmmoniaMonooxygenase | [AmmoniaMonooxygenase & HydroxylamineDehydrogenase] energy - AmmoniaMonooxygenase EC1.14.99.39 | K10944 | K10945 | K10946 energy - HydroxylamineDehydrogenase EC1.7.2.6 | K10535 energy -Comammox comammox AmmoniaMonooxygenase & NitriteOxidoreductase & HydrazineDeydrogenase energy - NitriteOxidoreductase K00370 | K00371 energy - HydrazineDeydrogenase EC1.7.2.8 | K20935 energy -annamox annamox HydrazineDeydrogenase & HydrazineSynthase energy - HydrazineSynthase EC1.7.2.7 | K20932 | K20933 | K20934 energy -Nitrogen fixer NitrogenFixer Nitrogenase energy - Nitrogenase EC1.18.6.1 | EC1.18.6.2 | K02591 | K02586 | K02588 | K00531 | K22897 | K22896 | K22898 | K22899 energy -Phototroph Phototroph PhotosystemI | PhotosystemII energy - PhotosystemI K02689 | K02690 | K026901 | K02692 | K02693 | K02694 | K08940 | K08941 | K08942 | K08943 energy - PhotosystemII K02703 | K02704 | K02705 | K02706 | K02707 | K02708 | K08928 | K08929 energy - ETC60 percent60ComplexIA | percent60ComplexIB | percent60ComplexIC energy - ETC50 percent50ComplexIA | percent50ComplexIB | percent50ComplexIC energy - percent50ComplexIA percent(50,ComplexIA) energy - percent50ComplexIB percent(50,ComplexIB) energy - percent50ComplexIC percent(50,ComplexIC) energy - percent60ComplexIA percent(60,ComplexIA) energy - percent60ComplexIB percent(60,ComplexIB) energy - percent60ComplexIC percent(60,ComplexIC) energy - ComplexIA K00330,[K00331 & K00332 & [K00333 | K00331] & [K13378 | K13380]],K00334,K00335,K00336,K00337,K00338,K00339,K00340,[[K00341 & K00342] | K15863],K00343 energy - ComplexIB K05574,K05582,K05581,K05579,K05572,K05580,K05578,K05576,K05577,K05575,K05573,K05583,K05584,K05585 energy - ComplexIC K03945,K03946,K03947,K03948,K03949,K03950,K03951,K03952,K03953,K03954,K03955,K03956,K11352,K11353 energy -Fermenter Fermenter not(NegativeForFermenter) energy - NegativeForFermenter ETC50 | methanogen | Denitrifier | sulfatereducer | AerobicAmmoniaOxidizer | Aerobe | Microaerophillic | Phototroph energy - Denitrifier ETC50 & [NitrateReductase | NitriteReductase | NitricOxideReductase | NitrousOxideReductase] energy - NitrousOxideReductase K00376 | EC1.7.2.4 energy - NitricOxideReductase K04561 | K02305 | EC1.7.2.5 energy - NitriteReductase K00368 | K15864 | EC1.7.2.1 energy -Aerobe Aerobe [CytochromeCOxidase | CytochromeAa3600MenaquinolOxidase | CytochromeOUbiquinolOxidase] & ETC50 energy - CytochromeCOxidase K02275 | K02274 | K02276 | K15408 | K02277 energy - CytochromeAa3600MenaquinolOxidase K02827 | K02826 | K02828 | K02829 energy - CytochromeOUbiquinolOxidase K02297 | K02298 | K02299 | K02300 energy -Microaerophillic Microaerophillic [percent50CytochromeBDUbiquinolOxidase | percent50CytochromeCOxidaseCBB3] & ETC50 energy - percent50CytochromeBDUbiquinolOxidase percent(50,CytochromeBDUbiquinolOxidase) energy - percent50CytochromeCOxidaseCBB3 percent(50,CytochromeCOxidaseCBB3) energy - CytochromeBDUbiquinolOxidase K00425,K00426,K00424 | K22501 energy - CytochromeCOxidaseCBB3 K00404 | K00405 | K15862,K00407,K00406 energy - NotNarNapNrf not(NarNapNrf) energy - NarNapNrf NitrateReductase | NRF energy - NitrateReductase K00370 | K00371 | K00374 | K02567 | K02568 | EC1.7.5.1 | EC1.9.6.1 energy -Iron Oxidation IronOxidation [Cyc2 | PioA | Fe:sulfocyanin | foxEYZ | foxABC] & [Microaerophillic | Aerobe | sulfatereducer | Denitrifier | Phototroph] energy - Cyc2 Fe:Cyc2_repCluster1 energy - PioA PlaceHolder energy - foxEYZ Fe:FoxE | Fe:FoxY | Fe:FoxZ energy - foxABC Fe:FoxA | Fe:FoxB | Fe:FoxC energy - PlaceHolder FALSE energy -Probable Iron Reduction ProbIronReduction [notIronReductionGenes | hemeCount] & ETC50 energy - notIronReductionGenes not(IronReductionGenes) energy - hemeCount NotUnironDescription -> column_count_values(heme_regulatory_motif_count,ge,4,ge,3) energy - NotUnironDescription not(UnironDescription) energy - UnironDescription filter_contains(kegg_description,"nitrate reductase") energy -Iron Reduction IronReduction IronReductionGenes & ETC50 energy - IronReductionGenes mtrCAB | Fe:omcF | Fe:omcS | Fe:omcZ | Fe:DFE_operons | Fe:FmnA energy - mtrCAB Fe:MtrA & Fe:MtrB_TIGR03509 & Fe:MtrC_TIGR03507 energy - DFE_operons Fe:DFE_0448 | Fe:DFE_0449 | Fe:DFE_0450 | Fe:DFE_0451 | Fe:DFE_0461 | Fe:DFE_0462 | Fe:DFE_0463 | Fe:DFE_0464 | Fe:DFE_0465 energy -N reducer Nreducer ETC50 & [NitrateReductase | NitriteReductase | NitricOxideReductase | NitrousOxideReductase] energy -Fumarate Reduction FumarateReduction at_least(1,FumarateReductionParts) energy - FumarateReductionParts K00244,K00245,K00246,K00247 energy -Tetrathionate Reduction TetrathionateReduction [1ofttrrs & 1ofttrabc] | 2ofttrabc energy - 1ofttrrs K13040 | K13041 energy - 2ofttrabc at_least(2,ttrabc) energy - 1ofttrabc at_least(1,ttrabc) energy - ttrabc K08359,K08358,K08357 energy -DNRA DNRA nirBD | nrfAH energy - nirBD K00362 | K00363 energy - nrfAH K03385 | K15876 energy -Methanotroph Methanotroph pmoA | mmoX energy - pmoA K10944 | EC1.14.18.3 energy - mmoX K16157 energy -S oxidizer sulfateoxidizer [DsrABtypeo | SoeABC | SorAB | Sqr | FccAB | SoxXA | SoxYZ | SoxB | SoxCD] & percent50NADH energy +Methanogen methanogen mcr & notOtherMethanogen energy + mcr K00399 | K00400 | K00401 | K00402 | K03421 | K03422 energy + notOtherMethanogen not(OtherAjMethanogen) energy + OtherAjMethanogen sulfatereducer | Denitrifier | AerobicAmmoniaOxidizer | comammox | annamox | Phototroph | ETC60 energy +Aerobic Ammonia Oxidizer AerobicAmmoniaOxidizer AmmoniaMonooxygenase | [AmmoniaMonooxygenase & HydroxylamineDehydrogenase] energy + AmmoniaMonooxygenase EC1.14.99.39 | K10944 | K10945 | K10946 energy + HydroxylamineDehydrogenase EC1.7.2.6 | K10535 energy +Comammox comammox AmmoniaMonooxygenase & NitriteOxidoreductase & HydrazineDeydrogenase energy + NitriteOxidoreductase K00370 | K00371 energy + HydrazineDeydrogenase EC1.7.2.8 | K20935 energy +annamox annamox HydrazineDeydrogenase & HydrazineSynthase energy + HydrazineSynthase EC1.7.2.7 | K20932 | K20933 | K20934 energy +Nitrogen fixer NitrogenFixer Nitrogenase energy + Nitrogenase EC1.18.6.1 | EC1.18.6.2 | K02591 | K02586 | K02588 | K00531 | K22897 | K22896 | K22898 | K22899 energy +Phototroph Phototroph PhotosystemI | PhotosystemII energy + PhotosystemI K02689 | K02690 | K026901 | K02692 | K02693 | K02694 | K08940 | K08941 | K08942 | K08943 energy + PhotosystemII K02703 | K02704 | K02705 | K02706 | K02707 | K02708 | K08928 | K08929 energy + ETC60 percent60ComplexIA | percent60ComplexIB | percent60ComplexIC energy + ETC50 percent50ComplexIA | percent50ComplexIB | percent50ComplexIC energy + percent50ComplexIA percent(50,ComplexIA) energy + percent50ComplexIB percent(50,ComplexIB) energy + percent50ComplexIC percent(50,ComplexIC) energy + percent60ComplexIA percent(60,ComplexIA) energy + percent60ComplexIB percent(60,ComplexIB) energy + percent60ComplexIC percent(60,ComplexIC) energy + ComplexIA K00330,[K00331 & K00332 & [K00333 | K00331] & [K13378 | K13380]],K00334,K00335,K00336,K00337,K00338,K00339,K00340,[[K00341 & K00342] | K15863],K00343 energy + ComplexIB K05574,K05582,K05581,K05579,K05572,K05580,K05578,K05576,K05577,K05575,K05573,K05583,K05584,K05585 energy + ComplexIC K03945,K03946,K03947,K03948,K03949,K03950,K03951,K03952,K03953,K03954,K03955,K03956,K11352,K11353 energy +Fermenter Fermenter not(NegativeForFermenter) energy + NegativeForFermenter ETC50 | methanogen | Denitrifier | sulfatereducer | AerobicAmmoniaOxidizer | Aerobe | Microaerophillic | Phototroph energy + Denitrifier ETC50 & [NitrateReductase | NitriteReductase | NitricOxideReductase | NitrousOxideReductase] energy + NitrousOxideReductase K00376 | EC1.7.2.4 energy + NitricOxideReductase K04561 | K02305 | EC1.7.2.5 energy + NitriteReductase K00368 | K15864 | EC1.7.2.1 energy +Aerobe Aerobe [CytochromeCOxidase | CytochromeAa3600MenaquinolOxidase | CytochromeOUbiquinolOxidase] & ETC50 energy + CytochromeCOxidase K02275 | K02274 | K02276 | K15408 | K02277 energy + CytochromeAa3600MenaquinolOxidase K02827 | K02826 | K02828 | K02829 energy + CytochromeOUbiquinolOxidase K02297 | K02298 | K02299 | K02300 energy +Microaerophillic Microaerophillic [percent50CytochromeBDUbiquinolOxidase | percent50CytochromeCOxidaseCBB3] & ETC50 energy + percent50CytochromeBDUbiquinolOxidase percent(50,CytochromeBDUbiquinolOxidase) energy + percent50CytochromeCOxidaseCBB3 percent(50,CytochromeCOxidaseCBB3) energy + CytochromeBDUbiquinolOxidase K00425,K00426,K00424 | K22501 energy + CytochromeCOxidaseCBB3 K00404 | K00405 | K15862,K00407,K00406 energy + NotNarNapNrf not(NarNapNrf) energy + NarNapNrf NitrateReductase | NRF energy + NitrateReductase K00370 | K00371 | K00374 | K02567 | K02568 | EC1.7.5.1 | EC1.9.6.1 energy +Iron Oxidation IronOxidation [Cyc2 | PioA | Fe:sulfocyanin | foxEYZ | foxABC] & [Microaerophillic | Aerobe | sulfatereducer | Denitrifier | Phototroph] energy + Cyc2 Fe:Cyc2_repCluster1 energy + PioA PlaceHolder energy + foxEYZ Fe:FoxE | Fe:FoxY | Fe:FoxZ energy + foxABC Fe:FoxA | Fe:FoxB | Fe:FoxC energy + PlaceHolder FALSE energy +Probable Iron Reduction ProbIronReduction [notIronReductionGenes | hemeCount] & ETC50 energy + notIronReductionGenes not(IronReductionGenes) energy + hemeCount NotUnironDescription -> column_count_values(heme_regulatory_motif_count,ge,4,ge,3) energy + NotUnironDescription not(UnironDescription) energy + UnironDescription filter_contains(kegg_description,"nitrate reductase") energy +Iron Reduction IronReduction IronReductionGenes & ETC50 energy + IronReductionGenes mtrCAB | Fe:omcF | Fe:omcS | Fe:omcZ | Fe:DFE_operons | Fe:FmnA energy + mtrCAB Fe:MtrA & Fe:MtrB_TIGR03509 & Fe:MtrC_TIGR03507 energy + DFE_operons Fe:DFE_0448 | Fe:DFE_0449 | Fe:DFE_0450 | Fe:DFE_0451 | Fe:DFE_0461 | Fe:DFE_0462 | Fe:DFE_0463 | Fe:DFE_0464 | Fe:DFE_0465 energy +N reducer Nreducer ETC50 & [NitrateReductase | NitriteReductase | NitricOxideReductase | NitrousOxideReductase] energy +Fumarate Reduction FumarateReduction at_least(1,FumarateReductionParts) energy + FumarateReductionParts K00244,K00245,K00246,K00247 energy +Tetrathionate Reduction TetrathionateReduction [1ofttrrs & 1ofttrabc] | 2ofttrabc energy + 1ofttrrs K13040 | K13041 energy + 2ofttrabc at_least(2,ttrabc) energy + 1ofttrabc at_least(1,ttrabc) energy + ttrabc K08359,K08358,K08357 energy +DNRA DNRA nirBD | nrfAH energy + nirBD K00362 | K00363 energy + nrfAH K03385 | K15876 energy +Methanotroph Methanotroph pmoA | mmoX energy + pmoA K10944 | EC1.14.18.3 energy + mmoX K16157 energy +S oxidizer sulfateoxidizer [DsrABtypeo | SoeABC | SorAB | Sqr | FccAB | SoxXA | SoxYZ | SoxB | SoxCD] & percent50NADH energy DsrABtypeo K11180 | S:dsrA | S:dsrB | K11181 energy BAD dsrAB (oxidizing type) [ --BAD dissimilatory-type sulfite reductase] SoeABC K21307 | K21308 | K21309 energy GOOD soeABC SorAB K05301 | K00386 energy MAYBE sorAB PF07682.11 S:SOR or just the kos I used @@ -86,50 +86,50 @@ S oxidizer sulfateoxidizer [DsrABtypeo | SoeABC | SorAB | Sqr | FccAB | SoxXA | SoxCD K17225 | K22622 energy GOOD soxCD Selected the KO that was SUlpher related percent50NADH percent(50,NADH) energy MAYBE 50% of NADH dehydrogenase with electron acceptor [--BAD is this 2 things] NADH K03934,K03935,K03936,K03937,K03938,K03939,K03940,K03941,K03942,K03943,K03944 energy I am going to include the optional extra K03934+K03935+K03936+K03937+K03938+K03939+K03940+K03941+K03942+K03943-K03944 -S reducer sulfatereducer DsrABtyper | PhsA | TtrA energy +S reducer sulfatereducer DsrABtyper | PhsA | TtrA energy DsrABtyper K11180 | S:dsrA | S:dsrB | K11181 energy BAD dsrAB (reducing type) [dissimilatory-type sulfite reductase in sulpher] PhsA K08352 energy MAYBE phsA [S:thiosulfate_reductase_phsA_alignment] TtrA K08357 energy GOOD ttrA -Simple Sugars Glucose Glucose K02777 | K02779 | K02791 | K20118 | K18124 | K18125 | K00115 | K00117 | K19813 | K18851 | K00844 | K12407 | K00845 | K25026 carbon -Simple Sugars Sucrose Sucrose K01182 | K01203 | K12047 | K01187 | K12316 | K12317 | K06617 | K01193 | K00695 | K02810 | K00690 | K05341 | K00689 | K00692 carbon -Simple Sugars Mannose Mannose [K01809 | K02793 | K02794 | K02795] | K02796 carbon -Simple Sugars Galactose Galactose [K00849 | K00965 | K01784] | K01785 carbon -Simple Sugars Fucose Fucose [K00879 | K01628] | K01818 carbon -Simple Sugars Xylose Xylose [K00854 | K01805 | K00008 | K00011 | K00854 | K05351 | K17743 | K00078 | K14273 | K14274] | K14275 carbon -Simple Sugars Fructose Fructose K00008 | K00045 | K27924 | K00007 | K00844 | K00847 | K01805 | K00846 | K27475 | K02768 | K02769 | K02770 | K02771 | K11194 | K11195 | K11196 carbon -Simple Sugars Arabinose Arabinose K01804 | K00011 | K26066 | K13873 | K19660 | K12446 carbon -Simple Sugars Ribose Ribose K00852 carbon -Simple Sugars Rhamnose Rhamnose K01813 | K01820 | K18337 carbon -Simple Sugars Maltose Maltose K05343 | K00691 | K06896 | K16146 | K00705 | K22451 | K12047 | K01187 | K12316 | K12317 carbon -Simple Sugars Raffinose Raffinose K006611 | K01193 | K01189 | K07406 | K07407 carbon -Simple Sugars Sorbose Sorbose K02812 | K02813 | K02814 | K02815 carbon -Simple Sugars Trehalose Trehalose K12437 | K02777 | K02819 | K01194 | K22934 | K05342 | K05343 carbon -Simple Sugars Lactose Lactose [K01190 | K12111 | K12112] | K12309 carbon -Complex Polysaccharide Amorphous Cellulose Amorphous Cellulose [[GH94 | GH1 | GH2 | GH3 | GH5 | GH9 | GH16] | GH116] & [[GH5 | GH6 | GH7 | GH8 | GH9 | GH10 | GH124 | GH12 | GH44] | GH45] carbon -Complex Polysaccharide Crystalline Cellulose Crystalline Cellulose [GH7 | GH48 | AA10 | AA15 | AA16 | AA9 | AA10 | AA11] | AA13 carbon -Complex Polysaccharide Starch Starch [[AA13 | GH13 | GH14 | GH57 | GH119] | GH126] & [[GH133 | GH15] | GH97] carbon -Complex Polysaccharide Pectin Pectin [[GH28 | PL1 | PL2 | PL9 | PL10 | PL11 | PL22 | PL26 | PL3] | PL4] & [[GH78 | GH106 | GH138 | GH139 | GH143 | CE8 | GH105 | GH4 | CE12] | GH2] carbon -Complex Polysaccharide Beta-mannan Beta-mannan [[GH113 | GH134 | GH26] | GH5] & [[GH26 | GH130 | GH113 | CE2 | CE17] | GH2] carbon -Complex Polysaccharide Alpha-mannan Alpha-mannan [[GH99 | GH76] & [GH76 | GH92 | GH38 | GH63 | GH47 | GH125]] | GH130 carbon -Complex Polysaccharide Xyloglucan Xyloglucan [[GH5 | GH9 | GH12 | GH16 | GH44 | GH45 | GH48 | GH74] | AA9] & [[GH31 | GH43 | GH10] | GH2] carbon -Complex Polysaccharide Xylan Xylan [[AA13 | GH13 | GH14 | GH57 | GH119] | GH126] & [[GH133 | GH15] | GH97] carbon -Short-Chain Fatty Acids (SCFA) Acetate Acetate-Final Acetate-1 | Acetate-2 | Acetate-3 carbon - Acetate-1 [[Acetate-sub1 & [K00163 | K00161 | K00162] & K00627] | [K00174 | K00175] | [K00169 | K00170 | K00172 | K00189 | K00171 | K03737]] & [K01905 | K22224 | K24012] carbon - Acetate-2 Acetate-sub1 & K01568 & [K00138 | K00128 | K14085 | K00149 | K00129] carbon - Acetate-3 K001895 | K01913 carbon - Acetate-sub1 [K00163 | K00161 | K00162 | K01568] carbon -Short-Chain Fatty Acids (SCFA) Propionate Propionate-Final Propionate-1 | Propionate-2 | Propionate-3 carbon +Simple Sugars Glucose Glucose K02777 | K02779 | K02791 | K20118 | K18124 | K18125 | K00115 | K00117 | K19813 | K18851 | K00844 | K12407 | K00845 | K25026 carbon +Simple Sugars Sucrose Sucrose K01182 | K01203 | K12047 | K01187 | K12316 | K12317 | K06617 | K01193 | K00695 | K02810 | K00690 | K05341 | K00689 | K00692 carbon +Simple Sugars Mannose Mannose [K01809 | K02793 | K02794 | K02795] | K02796 carbon +Simple Sugars Galactose Galactose [K00849 | K00965 | K01784] | K01785 carbon +Simple Sugars Fucose Fucose [K00879 | K01628] | K01818 carbon +Simple Sugars Xylose Xylose [K00854 | K01805 | K00008 | K00011 | K00854 | K05351 | K17743 | K00078 | K14273 | K14274] | K14275 carbon +Simple Sugars Fructose Fructose K00008 | K00045 | K27924 | K00007 | K00844 | K00847 | K01805 | K00846 | K27475 | K02768 | K02769 | K02770 | K02771 | K11194 | K11195 | K11196 carbon +Simple Sugars Arabinose Arabinose K01804 | K00011 | K26066 | K13873 | K19660 | K12446 carbon +Simple Sugars Ribose Ribose K00852 carbon +Simple Sugars Rhamnose Rhamnose K01813 | K01820 | K18337 carbon +Simple Sugars Maltose Maltose K05343 | K00691 | K06896 | K16146 | K00705 | K22451 | K12047 | K01187 | K12316 | K12317 carbon +Simple Sugars Raffinose Raffinose K006611 | K01193 | K01189 | K07406 | K07407 carbon +Simple Sugars Sorbose Sorbose K02812 | K02813 | K02814 | K02815 carbon +Simple Sugars Trehalose Trehalose K12437 | K02777 | K02819 | K01194 | K22934 | K05342 | K05343 carbon +Simple Sugars Lactose Lactose [K01190 | K12111 | K12112] | K12309 carbon +Complex Polysaccharide Amorphous Cellulose Amorphous Cellulose [[GH94 | GH1 | GH2 | GH3 | GH5 | GH9 | GH16] | GH116] & [[GH5 | GH6 | GH7 | GH8 | GH9 | GH10 | GH124 | GH12 | GH44] | GH45] carbon +Complex Polysaccharide Crystalline Cellulose Crystalline Cellulose [GH7 | GH48 | AA10 | AA15 | AA16 | AA9 | AA10 | AA11] | AA13 carbon +Complex Polysaccharide Starch Starch [[AA13 | GH13 | GH14 | GH57 | GH119] | GH126] & [[GH133 | GH15] | GH97] carbon +Complex Polysaccharide Pectin Pectin [[GH28 | PL1 | PL2 | PL9 | PL10 | PL11 | PL22 | PL26 | PL3] | PL4] & [[GH78 | GH106 | GH138 | GH139 | GH143 | CE8 | GH105 | GH4 | CE12] | GH2] carbon +Complex Polysaccharide Beta-mannan Beta-mannan [[GH113 | GH134 | GH26] | GH5] & [[GH26 | GH130 | GH113 | CE2 | CE17] | GH2] carbon +Complex Polysaccharide Alpha-mannan Alpha-mannan [[GH99 | GH76] & [GH76 | GH92 | GH38 | GH63 | GH47 | GH125]] | GH130 carbon +Complex Polysaccharide Xyloglucan Xyloglucan [[GH5 | GH9 | GH12 | GH16 | GH44 | GH45 | GH48 | GH74] | AA9] & [[GH31 | GH43 | GH10] | GH2] carbon +Complex Polysaccharide Xylan Xylan [[AA13 | GH13 | GH14 | GH57 | GH119] | GH126] & [[GH133 | GH15] | GH97] carbon +Short-Chain Fatty Acids (SCFA) Acetate Acetate-Final Acetate-1 | Acetate-2 | Acetate-3 carbon + Acetate-1 [[Acetate-sub1 & [K00163 | K00161 | K00162] & K00627] | [K00174 | K00175] | [K00169 | K00170 | K00172 | K00189 | K00171 | K03737]] & [K01905 | K22224 | K24012] carbon + Acetate-2 Acetate-sub1 & K01568 & [K00138 | K00128 | K14085 | K00149 | K00129] carbon + Acetate-3 K001895 | K01913 carbon + Acetate-sub1 [K00163 | K00161 | K00162 | K01568] carbon +Short-Chain Fatty Acids (SCFA) Propionate Propionate-Final Propionate-1 | Propionate-2 | Propionate-3 carbon Propionate-1 "[ [K01899 | K01900 | K01902 | K01903 | K01899] & [K01847 | K01849 | K01848] & [K00140 | [K05606 & [K11264 | K03416 | K18426]]] & Propionate-sub2 ] - | Propionate-sub1" carbon - Propionate-2 [K01026 & [K20626 | K20627] & [K00248 | K00232] & Propionate-sub2] | Propionate-sub1 carbon - Propionate-3 [[K01699 | K13919 | K13920] & K13922 & Propionate-sub2] | Propionate-sub1 carbon + | Propionate-sub1" carbon + Propionate-2 [K01026 & [K20626 | K20627] & [K00248 | K00232] & Propionate-sub2] | Propionate-sub1 carbon + Propionate-3 [[K01699 | K13919 | K13920] & K13922 & Propionate-sub2] | Propionate-sub1 carbon Propionate-sub1 "[ - [K01206 | K01905 | K22224 | K24012] + [K01206 | K01905 | K22224 | K24012] | [ [ [K13788 | K00625 | K15024 | K13923] @@ -138,12 +138,12 @@ Short-Chain Fatty Acids (SCFA) Propionate Propionate-Final Propionate-1 | Propio ] & [K00925 | K00932 | K19697] ] - ]" carbon - Propionate-sub2 [K01895 | K01908] carbon -Short-Chain Fatty Acids (SCFA) Butyrate Butyrate-Final Butyrate-1 | Butyrate-2 | Butyrate-3 | Butyrate-4 carbon - Butyrate-1 K00626 & [K00074 | K00022 | K07516 | K01825 | K01782 | K07514] & [K01692 | K01825 | K01782 | K07515 | K07514 | K07511 | K01715] & Butyrate-sub1 carbon - Butyrate-2 [K00135 | K08324 | K00135 | K00139 | K17761 | K08324] & Butyrate-sub2 & Butyrate-sub1 carbon - Butyrate-3 K01580 & [K13524 | K07250 | K14268 | K00823 | K16871] & Butyrate-sub2 & Butyrate-sub1 carbon + ]" carbon + Propionate-sub2 [K01895 | K01908] carbon +Short-Chain Fatty Acids (SCFA) Butyrate Butyrate-Final Butyrate-1 | Butyrate-2 | Butyrate-3 | Butyrate-4 carbon + Butyrate-1 K00626 & [K00074 | K00022 | K07516 | K01825 | K01782 | K07514] & [K01692 | K01825 | K01782 | K07515 | K07514 | K07511 | K01715] & Butyrate-sub1 carbon + Butyrate-2 [K00135 | K08324 | K00135 | K00139 | K17761 | K08324] & Butyrate-sub2 & Butyrate-sub1 carbon + Butyrate-3 K01580 & [K13524 | K07250 | K14268 | K00823 | K16871] & Butyrate-sub2 & Butyrate-sub1 carbon Butyrate-4 "K01843 & [K01844 | K18011] & K18012 @@ -157,8 +157,8 @@ Short-Chain Fatty Acids (SCFA) Butyrate Butyrate-Final Butyrate-1 | Butyrate-2 | ] ] & Butyrate-1" carbon - Butyrate-sub1 [K00209 | K17829] & [K01034 | K01035 | K19709] carbon - Butyrate-sub2 [K00043 | K08318 | K18120 | K18121] & K18122 & K14534 carbon + Butyrate-sub1 [K00209 | K17829] & [K01034 | K01035 | K19709] carbon + Butyrate-sub2 [K00043 | K08318 | K18120 | K18121] & K18122 & K14534 carbon Short-Chain Fatty Acids (SCFA) Lactate Lactate-Final Lactate-1 | Lactate-2 | Lactate-3 carbon Lactate-1 "Lactate-sub1 & [ @@ -177,21 +177,21 @@ Short-Chain Fatty Acids (SCFA) Lactate Lactate-Final Lactate-1 | Lactate-2 | Lac ] ] & [K01689 | K27394 | K00873 | K12406] - & K00016" carbon - Lactate-2 K00016 carbon - Lactate-3 [K18124 | K18125 | K00115 | K19813 | K00117] & K01053 & K05308 & [K11395 | K18127] & K00016 carbon + & K00016" carbon + Lactate-2 K00016 carbon + Lactate-3 [K18124 | K18125 | K00115 | K19813 | K00117] & K01053 & K05308 & [K11395 | K18127] & K00016 carbon Lactate-sub1 "[K00844 | K00886 | K08074 | K00918 | K12407 | K00845 | K25026] & [K01810 | K06859 | K13810 | K15916] & [K24182 | K00850 | K16370 | K21071 | K00918 | K00895 | K21071] - & [K01623 | K01624 | K01622 | K11645 | K16305 | K16306]" carbon -Short-Chain Fatty Acids (SCFA) Formate Formate K00656 carbon -Amino Acids Glutamate Glutamate K11067 | K00618 | K00619 | K14681 | K14682 | K00620 | K22476 | K22477 | K22478 | K19412 | K25032 | K00260 | K00261 | K00262 | K01915 | K00931 | K18538 | K18539 | K00603 | K01776 | K11204 | K11205 | K01909 | K06048 | K13559 | K01915 | K14272 | K05825 | K28204 | K19268 | K01846 | K01885 | K14163 | K09698 | K14223 | K01886 carbon -Amino Acids Glycine Glycine K00659 | K00273 | K14272 | K00827 | K00830 | K14272 | K00281 | K00282 | K00283 | K00643 | K01620 | K20801 | K00639 | K18896 | K24071 | K00552 | K00613 | K00830 | K00600 | K10814 | K10815 | K10816 | K19967 | K21456 | K01920 | K00605 | K00382 | K02437 | K03153 | K01878 | K01879 | K01880 | K14164 carbon -Amino Acids Alanine Alanine K00814 | K14260 | K14272 | K00827 | K00830 | K14272 | K00259 | K19244 | K03851 | K01775 | K01798 | K01872 | K23665 carbon -Amino Acids Serine Serine K17989 | K01754 | K10752 | K25316 | K25317 | K12235 | K01695 | K01696 | K06001 | K01694 | K00600 | K00830 | K01697 | K10150 | K13290 | K17989 | K01752 | K00640 | K23304 | K23370 | K25193 | K00654 | K00640 | K23304 | K01875 | K23371 carbon -Organic Acids Oxalate Oxalate K01569 | K22133 carbon -Organic Acids Citrate Citrate K01681 | K27802 | K01682 | K05942 | K01648 | K01647 | K01659 | K15230 | K15231 | K27797 | K18310 | K27802 | K01682 | K15232 | K15233 carbon -Organic Acids Malate Malate K00025 | K00026 | K00024 | K00116 | K01676 | K01677 | K01678 | K01679 | K01675 | K01774 | K00051 | K22212 | K01638 | K08692 | K14067 | K00029 | K00028 | K14471 | K14472 carbon -Aromatics/Phenolics Vanillin Vanillin K21802 | K24276 carbon -Lipids Glycerol Glycerol K01189 | K07406 | K07407 | K00005 | K22251 | K18097 | K00864 | K06120 | K06121 | K06122 | K00011 | K00002 | K13979 carbon -Microbial Compounds Chitin Chitin K01183 | K20547 | K13381 | K01452 carbon + & [K01623 | K01624 | K01622 | K11645 | K16305 | K16306]" carbon +Short-Chain Fatty Acids (SCFA) Formate Formate K00656 carbon +Amino Acids Glutamate Glutamate K11067 | K00618 | K00619 | K14681 | K14682 | K00620 | K22476 | K22477 | K22478 | K19412 | K25032 | K00260 | K00261 | K00262 | K01915 | K00931 | K18538 | K18539 | K00603 | K01776 | K11204 | K11205 | K01909 | K06048 | K13559 | K01915 | K14272 | K05825 | K28204 | K19268 | K01846 | K01885 | K14163 | K09698 | K14223 | K01886 carbon +Amino Acids Glycine Glycine K00659 | K00273 | K14272 | K00827 | K00830 | K14272 | K00281 | K00282 | K00283 | K00643 | K01620 | K20801 | K00639 | K18896 | K24071 | K00552 | K00613 | K00830 | K00600 | K10814 | K10815 | K10816 | K19967 | K21456 | K01920 | K00605 | K00382 | K02437 | K03153 | K01878 | K01879 | K01880 | K14164 carbon +Amino Acids Alanine Alanine K00814 | K14260 | K14272 | K00827 | K00830 | K14272 | K00259 | K19244 | K03851 | K01775 | K01798 | K01872 | K23665 carbon +Amino Acids Serine Serine K17989 | K01754 | K10752 | K25316 | K25317 | K12235 | K01695 | K01696 | K06001 | K01694 | K00600 | K00830 | K01697 | K10150 | K13290 | K17989 | K01752 | K00640 | K23304 | K23370 | K25193 | K00654 | K00640 | K23304 | K01875 | K23371 carbon +Organic Acids Oxalate Oxalate K01569 | K22133 carbon +Organic Acids Citrate Citrate K01681 | K27802 | K01682 | K05942 | K01648 | K01647 | K01659 | K15230 | K15231 | K27797 | K18310 | K27802 | K01682 | K15232 | K15233 carbon +Organic Acids Malate Malate K00025 | K00026 | K00024 | K00116 | K01676 | K01677 | K01678 | K01679 | K01675 | K01774 | K00051 | K22212 | K01638 | K08692 | K14067 | K00029 | K00028 | K14471 | K14472 carbon +Aromatics/Phenolics Vanillin Vanillin K21802 | K24276 carbon +Lipids Glycerol Glycerol K01189 | K07406 | K07407 | K00005 | K22251 | K18097 | K00864 | K06120 | K06121 | K06122 | K00011 | K00002 | K13979 carbon +Microbial Compounds Chitin Chitin K01183 | K20547 | K13381 | K01452 carbon diff --git a/bin/color_labels.R b/bin/color_labels.R deleted file mode 100755 index a6db0332..00000000 --- a/bin/color_labels.R +++ /dev/null @@ -1,49 +0,0 @@ -#!/usr/bin/env Rscript -# Load necessary libraries -library(ape) - -# Define the input files -newick_file <- commandArgs(trailingOnly = TRUE)[1] -labels_file <- commandArgs(trailingOnly = TRUE)[2] -output_pdf <- commandArgs(trailingOnly = TRUE)[3] - -# Read the Newick tree -tree <- read.tree(newick_file) - -# Read the labels to be colored -labels_to_color_raw <- readLines(labels_file) -labels_to_color <- sapply(strsplit(labels_to_color_raw, "\t"), `[`, 2) # Extract the second column - -# Print the labels to be colored for debugging -cat("Labels to be colored:\n") -print(labels_to_color) - -# Print the valid labels found in the tree for debugging -cat("Valid labels found in the tree:\n") -print(tree$tip.label) - -# Prepare the color vector -tip_colors <- rep("black", length(tree$tip.label)) - -# Apply red color to the specified labels -for (i in seq_along(tree$tip.label)) { - if (tree$tip.label[i] %in% labels_to_color) { - tip_colors[i] <- "red" - } -} - -# Debug statement to check which labels are set to red -cat("Tip colors set to red:\n") -print(tree$tip.label[tip_colors == "red"]) - -# Set plot size -pdf(output_pdf, width = 20, height = 20) - -# Plot the tree without tip labels to adjust spacing -plot(tree, type = "unrooted", show.tip.label = FALSE, no.margin = TRUE) - -# Add tip labels with custom colors and larger font size -tiplabels(tree$tip.label, frame = "none", adj = c(1, 1), col = tip_colors, cex = 0.7) - -# Close the PDF device -dev.off() diff --git a/bin/combine_annotations.py b/bin/combine_annotations.py index cef2f2da..0fed20c2 100755 --- a/bin/combine_annotations.py +++ b/bin/combine_annotations.py @@ -1,5 +1,4 @@ #!/usr/bin/env python -import argparse import pandas as pd from concurrent.futures import ThreadPoolExecutor, as_completed from skbio.io import read as read_sequence @@ -7,12 +6,12 @@ from pathlib import Path from utils.logger import get_logger import click -from utils.click_utils import validate_comma_separated -FASTA_COLUMN = os.getenv('FASTA_COLUMN', 'input_fasta') +FASTA_COLUMN = os.getenv("FASTA_COLUMN", "input_fasta") logger = get_logger(filename=Path(__file__).stem) + def read_and_preprocess(path: Path): # We design input fastas from intermediate steps to be named like: "input_fasta___some_information_annotation_file.tsv" input_fasta = input_fasta_from_filepath(path) @@ -24,37 +23,44 @@ def read_and_preprocess(path: Path): logger.error(f"Error loading DataFrame for input_fasta {input_fasta}: {str(e)}") return pd.DataFrame() # Return an empty DataFrame in case of error + def input_fasta_from_filepath(file_path: Path): return file_path.stem.split("___")[0] + def assign_rank(row): - rank = 'E' - if row.get('kegg_bitScore', 0) > 350: - rank = 'A' - elif row.get('uniref_bitScore', 0) > 350: - rank = 'B' - elif row.get('kegg_bitScore', 0) > 60 or row.get('uniref_bitScore', 0) > 60: - rank = 'C' - elif any(row.get(f"{db}_bitScore", 0) > 60 for db in ['pfam', 'dbcan', 'merops']): - rank = 'D' + rank = "E" + if row.get("kegg_bitScore", 0) > 350: + rank = "A" + elif row.get("uniref_bitScore", 0) > 350: + rank = "B" + elif row.get("kegg_bitScore", 0) > 60 or row.get("uniref_bitScore", 0) > 60: + rank = "C" + elif any(row.get(f"{db}_bitScore", 0) > 60 for db in ["pfam", "dbcan", "merops"]): + rank = "D" return rank + def convert_bit_scores_to_numeric(df): for col in df.columns: if "_bitScore" in col: - df[col] = pd.to_numeric(df[col], errors='coerce') + df[col] = pd.to_numeric(df[col], errors="coerce") return df + def count_motifs(gene_faa, motif="(C..CH)", genes_faa_dict=None): if genes_faa_dict is None: genes_faa_dict = dict() for seq in read_sequence(gene_faa, format="fasta"): if seq.metadata["id"] not in genes_faa_dict: genes_faa_dict[seq.metadata["id"]] = {} - - genes_faa_dict[seq.metadata["id"]]["heme_regulatory_motif_count"] = len(list(seq.find_with_regex(motif))) + + genes_faa_dict[seq.metadata["id"]]["heme_regulatory_motif_count"] = len( + list(seq.find_with_regex(motif)) + ) return genes_faa_dict + def set_gene_data(gene_faa, genes_faa_dict=None): if genes_faa_dict is None: genes_faa_dict = dict() @@ -64,53 +70,85 @@ def set_gene_data(gene_faa, genes_faa_dict=None): split_label = seq.metadata["id"].split("_") gene_position = split_label[-1] - start_position, end_position, strandedness = seq.metadata["description"].split("#")[1:4] + start_position, end_position, strandedness = seq.metadata["description"].split( + "#" + )[1:4] - input_fasta_name = Path(gene_faa).stem.split('_called_genes')[0] + input_fasta_name = Path(gene_faa).stem.split("_called_genes")[0] genes_faa_dict[seq.metadata["id"]][FASTA_COLUMN] = input_fasta_name genes_faa_dict[seq.metadata["id"]]["scaffold"] = ( seq.metadata["id"] .removeprefix(genes_faa_dict[seq.metadata["id"]][FASTA_COLUMN]) .removeprefix("_") - .removesuffix(f"_{gene_position}")) + .removesuffix(f"_{gene_position}") + ) genes_faa_dict[seq.metadata["id"]]["gene_number"] = int(gene_position) genes_faa_dict[seq.metadata["id"]]["start_position"] = int(start_position) genes_faa_dict[seq.metadata["id"]]["stop_position"] = int(end_position) genes_faa_dict[seq.metadata["id"]]["strandedness"] = int(strandedness) return genes_faa_dict + def organize_columns(df, special_columns=None): if special_columns is None: special_columns = [] - base_columns = ['query_id', FASTA_COLUMN, "scaffold", 'gene_number', 'start_position', 'stop_position', 'strandedness', 'rank'] + base_columns = [ + "query_id", + FASTA_COLUMN, + "scaffold", + "gene_number", + "start_position", + "stop_position", + "strandedness", + "rank", + ] base_columns = [col for col in base_columns if col in df.columns] - - kegg_columns = sorted([col for col in df.columns if col.startswith('kegg_')], key=lambda x: (x != 'kegg_id', x)) - other_columns = [col for col in df.columns if col not in base_columns + kegg_columns + special_columns] - - db_prefixes = set(col.split('_')[0] for col in other_columns) + + kegg_columns = sorted( + [col for col in df.columns if col.startswith("kegg_")], + key=lambda x: (x != "kegg_id", x), + ) + other_columns = [ + col + for col in df.columns + if col not in base_columns + kegg_columns + special_columns + ] + + db_prefixes = set(col.split("_")[0] for col in other_columns) sorted_other_columns = [] for prefix in db_prefixes: - prefixed_columns = sorted([col for col in other_columns if col.startswith(prefix + '_')], key=lambda x: (x != f"{prefix}_id", x)) + prefixed_columns = sorted( + [col for col in other_columns if col.startswith(prefix + "_")], + key=lambda x: (x != f"{prefix}_id", x), + ) sorted_other_columns.extend(prefixed_columns) - - final_columns_order = base_columns + kegg_columns + sorted_other_columns + special_columns + + final_columns_order = ( + base_columns + kegg_columns + sorted_other_columns + special_columns + ) return df[final_columns_order] + @click.command() @click.option("--annotations_dir", required=True, help="Directory of annotation files") -@click.option("--genes_dir", required=True, help="Directory genes faa file paths from prodigal") +@click.option( + "--genes_dir", required=True, help="Directory genes faa file paths from prodigal" +) @click.option("--output", help="Output file path for the combined annotations.") -@click.option("--threads", help="Number of threads for parallel processing", type=int, default=4) +@click.option( + "--threads", help="Number of threads for parallel processing", type=int, default=4 +) def combine_annotations(annotations_dir, genes_dir, output, threads): """Combine annotation files with ranks and avoid duplicating specific columns.""" annotations = Path(annotations_dir).glob("*") genes_faa = Path(genes_dir).glob("*") with ThreadPoolExecutor(max_workers=threads) as executor: # futures = [executor.submit(read_and_preprocess, input_fasta, path) for input_fasta, path in input_fastas_and_paths] - futures = [executor.submit(read_and_preprocess, Path(path)) for path in annotations] + futures = [ + executor.submit(read_and_preprocess, Path(path)) for path in annotations + ] data_frames = [future.result() for future in as_completed(futures)] - + combined_data = pd.concat(data_frames, ignore_index=True) if genes_faa: genes_faa_dict = dict() @@ -119,36 +157,47 @@ def combine_annotations(annotations_dir, genes_dir, output, threads): genes_faa_dict count_motifs(gene_path, "(C..CH)", genes_faa_dict=genes_faa_dict) set_gene_data(gene_path, genes_faa_dict) - df = pd.DataFrame.from_dict(genes_faa_dict, orient='index') + df = pd.DataFrame.from_dict(genes_faa_dict, orient="index") columns = [col for col in df.columns.tolist() if col != FASTA_COLUMN] - combined_data = combined_data.drop(columns=columns, errors='ignore') - df.index.name = 'query_id' - df = df.rename(columns={FASTA_COLUMN: FASTA_COLUMN+"2"}) - + combined_data = combined_data.drop(columns=columns, errors="ignore") + df.index.name = "query_id" + df = df.rename(columns={FASTA_COLUMN: FASTA_COLUMN + "2"}) + # we use outer to get any genes that don't have hits combined_data = pd.merge(combined_data, df, how="outer", on="query_id") combined_data[FASTA_COLUMN] = combined_data[FASTA_COLUMN].fillna("") mask = combined_data[FASTA_COLUMN] != "" - combined_data[FASTA_COLUMN] = combined_data[FASTA_COLUMN].where(mask, other=combined_data[FASTA_COLUMN+"2"]) - + combined_data[FASTA_COLUMN] = combined_data[FASTA_COLUMN].where( + mask, other=combined_data[FASTA_COLUMN + "2"] + ) + combined_data = convert_bit_scores_to_numeric(combined_data) - aggregation_functions = {col: 'first' for col in combined_data.columns if col not in ['query_id', FASTA_COLUMN]} - for col in ['Completeness', 'Contamination', 'taxonomy']: + aggregation_functions = { + col: "first" + for col in combined_data.columns + if col not in ["query_id", FASTA_COLUMN] + } + for col in ["Completeness", "Contamination", "taxonomy"]: if col in combined_data.columns: - aggregation_functions[col] = 'max' - combined_data = combined_data.groupby(['query_id', FASTA_COLUMN], as_index=False).agg(aggregation_functions) + aggregation_functions[col] = "max" + combined_data = combined_data.groupby( + ["query_id", FASTA_COLUMN], as_index=False + ).agg(aggregation_functions) # After aggregating data - combined_data['rank'] = combined_data.apply(assign_rank, axis=1) + combined_data["rank"] = combined_data.apply(assign_rank, axis=1) # Continue with organizing columns and saving the DataFrame - special_columns = ['Completeness', 'Contamination', 'taxonomy'] + special_columns = ["Completeness", "Contamination", "taxonomy"] special_columns = [col for col in special_columns if col in combined_data.columns] combined_data = organize_columns(combined_data, special_columns=special_columns) - combined_data = combined_data.sort_values(by=[FASTA_COLUMN, 'scaffold', 'gene_number']) + combined_data = combined_data.sort_values( + by=[FASTA_COLUMN, "scaffold", "gene_number"] + ) - combined_data.to_csv(output, index=False, sep='\t') + combined_data.to_csv(output, index=False, sep="\t") logger.info(f"Combined annotations saved to {output}, with corrected gene numbers.") + if __name__ == "__main__": combine_annotations() diff --git a/bin/distill.py b/bin/distill.py index 90c95ee6..14f5e8be 100755 --- a/bin/distill.py +++ b/bin/distill.py @@ -1,43 +1,71 @@ #!/usr/bin/env python """This is the script that distills the genomes""" + import click import os from pathlib import Path import polars as pl -from xlsxwriter import Workbook from utils.logger import get_logger from utils.click_utils import validate_comma_separated -from utils.click_utils import validate_comma_separated from utils.excel import write_summarized_genomes_to_xlsx from utils.pl_utils import read_csv from rule_parser.src.rules import evaluate_rules_on_anno, ID_EXPR_DICT logger = get_logger(filename=Path(__file__).stem) -COL_GENE_ID, COL_GENE_DESCRIPTION, COL_MODULE, COL_SHEET, COL_HEADER, COL_SUBHEADER, COL_ALIAS, COL_RULE = 'gene_id', 'gene_description', 'pathway', 'topic_ecosystem','category', 'subcategory', 'alias', 'rule' +( + COL_GENE_ID, + COL_GENE_DESCRIPTION, + COL_MODULE, + COL_SHEET, + COL_HEADER, + COL_SUBHEADER, + COL_ALIAS, + COL_RULE, +) = ( + "gene_id", + "gene_description", + "pathway", + "topic_ecosystem", + "category", + "subcategory", + "alias", + "rule", +) OPTIONAL_COLUMNS = [COL_ALIAS, COL_RULE] RRNA_COLUMNS = [COL_GENE_ID, COL_GENE_DESCRIPTION, COL_SHEET, COL_HEADER, COL_SUBHEADER] -TRNA_COLUMNS = RRNA_COLUMNS + ['AA_type'] +TRNA_COLUMNS = RRNA_COLUMNS + ["AA_type"] CORE_COLUMNS = RRNA_COLUMNS + [COL_MODULE] FRAME_COLUMNS = CORE_COLUMNS + OPTIONAL_COLUMNS -RRNA_TYPES = ['5S rRNA', '16S rRNA', '23S rRNA'] -TAXONOMY_LEVELS = ['d', 'p', 'c', 'o', 'f', 'g', 's'] -CONSTANT_DISTILLATE_COLUMNS = [COL_GENE_ID, COL_GENE_DESCRIPTION, COL_MODULE, COL_HEADER, COL_SUBHEADER] +RRNA_TYPES = ["5S rRNA", "16S rRNA", "23S rRNA"] +TAXONOMY_LEVELS = ["d", "p", "c", "o", "f", "g", "s"] +CONSTANT_DISTILLATE_COLUMNS = [ + COL_GENE_ID, + COL_GENE_DESCRIPTION, + COL_MODULE, + COL_HEADER, + COL_SUBHEADER, +] DISTILATE_SORT_ORDER_COLUMNS = [COL_HEADER, COL_SUBHEADER, COL_MODULE, COL_GENE_ID] EXCEL_MAX_CELL_SIZE = 32767 -FASTA_COLUMN = os.getenv('FASTA_COLUMN', 'input_fasta') +FASTA_COLUMN = os.getenv("FASTA_COLUMN", "input_fasta") DISTILL_DIR = Path(__file__).parent / "assets/forms/distill_sheets" - + def check_columns(data, logger): functions = [i for i in ID_EXPR_DICT if i in data.columns] missing = [i for i in ID_EXPR_DICT if i not in data.columns] - logger.info("Note: the following id fields " - f"were not in the annotations file and are not being used: {missing}," - f" but these are {functions}") + logger.info( + "Note: the following id fields " + f"were not in the annotations file and are not being used: {missing}," + f" but these are {functions}" + ) + -def make_genome_summary(annotations, genome_summary_frame: pl.LazyFrame, logger, groupby_column=FASTA_COLUMN): +def make_genome_summary( + annotations, genome_summary_frame: pl.LazyFrame, logger, groupby_column=FASTA_COLUMN +): if COL_RULE not in genome_summary_frame.collect_schema().names(): genome_summary_frame = genome_summary_frame.with_columns( pl.lit(None).cast(pl.String).alias(COL_RULE) @@ -57,12 +85,16 @@ def make_genome_summary(annotations, genome_summary_frame: pl.LazyFrame, logger, sample_col="query_id", label_col="gene_id", parent_col=None, - rules_col=COL_RULE - ) - df = df.join(annotations.select([pl.col("query_id"), pl.col("input_fasta")]), on="query_id").drop("query_id") + rules_col=COL_RULE, + ) + df = df.join( + annotations.select([pl.col("query_id"), pl.col("input_fasta")]), on="query_id" + ).drop("query_id") df = df.group_by("input_fasta").agg(pl.exclude("input_fasta").sum()) - df = df.select(pl.exclude("input_fasta")).transpose(include_header=True, header_name="gene_id", column_names=df["input_fasta"]) + df = df.select(pl.exclude("input_fasta")).transpose( + include_header=True, header_name="gene_id", column_names=df["input_fasta"] + ) df = genome_summary_frame.collect().join(df, on="gene_id", how="left") @@ -70,76 +102,84 @@ def make_genome_summary(annotations, genome_summary_frame: pl.LazyFrame, logger, return df + # TODO: add assembly stats like N50, longest contig, total assembled length etc -def make_genome_stats(annotations: pl.DataFrame, rrna_frame: pl.DataFrame = None, trna_frame: pl.DataFrame = None, quast_frame: pl.DataFrame = None, groupby_column: str = FASTA_COLUMN): +def make_genome_stats( + annotations: pl.DataFrame, + rrna_frame: pl.DataFrame = None, + trna_frame: pl.DataFrame = None, + quast_frame: pl.DataFrame = None, + groupby_column: str = FASTA_COLUMN, +): rows = list() - columns = ['genome'] - if 'scaffold' in annotations.columns: - columns.append('number of scaffolds') - if 'bin_taxonomy' in annotations.columns: - columns.append('taxonomy') - if 'bin_completeness' in annotations.columns: - columns.append('completeness score') - if 'bin_contamination' in annotations.columns: - columns.append('contamination score') + columns = ["genome"] + if "scaffold" in annotations.columns: + columns.append("number of scaffolds") + if "bin_taxonomy" in annotations.columns: + columns.append("taxonomy") + if "bin_completeness" in annotations.columns: + columns.append("completeness score") + if "bin_contamination" in annotations.columns: + columns.append("contamination score") for genome, frame in annotations.group_by(groupby_column): row = [genome[0]] - if 'scaffold' in frame.columns: - row.append(len(set(frame['scaffold']))) - if 'bin_taxonomy' in frame.columns: - row.append(frame['bin_taxonomy'][0]) - if 'bin_completeness' in frame.columns: - row.append(frame['bin_completeness'][0]) - if 'bin_contamination' in frame.columns: - row.append(frame['bin_contamination'][0]) + if "scaffold" in frame.columns: + row.append(len(set(frame["scaffold"]))) + if "bin_taxonomy" in frame.columns: + row.append(frame["bin_taxonomy"][0]) + if "bin_completeness" in frame.columns: + row.append(frame["bin_completeness"][0]) + if "bin_contamination" in frame.columns: + row.append(frame["bin_contamination"][0]) rows.append(row) - genome_stats = pl.DataFrame(rows, schema=columns, orient='row') + genome_stats = pl.DataFrame(rows, schema=columns, orient="row") if rrna_frame is not None: # Identify the "sample" columns (everything that's not metadata) meta_cols = RRNA_COLUMNS sample_cols = [c for c in rrna_frame.columns if c not in meta_cols] # group_by gene_id, sum sample columns - df_rrna = ( - rrna_frame - .group_by("gene_id") - .agg([pl.col(c).sum().alias(c) for c in sample_cols]) + df_rrna = rrna_frame.group_by("gene_id").agg( + [pl.col(c).sum().alias(c) for c in sample_cols] ) # transpose: rows -> genomes (samples), columns -> gene_id # This creates a "genome" column from original sample column names df_rrna = df_rrna.transpose( include_header=True, - header_name="genome", # new first column name - column_names="gene_id", # column headers come from gene_id values + header_name="genome", # new first column name + column_names="gene_id", # column headers come from gene_id values ) genome_stats = genome_stats.join(df_rrna, on="genome", how="inner") - assert genome_stats.shape[0] == df_rrna.shape[0], "genomes from annotation file don't map to rrna file" + assert genome_stats.shape[0] == df_rrna.shape[0], ( + "genomes from annotation file don't map to rrna file" + ) if trna_frame is not None: meta_cols = TRNA_COLUMNS sample_cols = [c for c in trna_frame.columns if c not in meta_cols] df_trna = ( - trna_frame - .filter(~pl.col("AA_type").is_in(["Undet", "Sup"])) + trna_frame.filter(~pl.col("AA_type").is_in(["Undet", "Sup"])) .group_by("AA_type") .agg([pl.col(c).sum().alias(c) for c in sample_cols]) - .select([(pl.col(c) != 0).cast(pl.Int64).sum().alias(c) for c in sample_cols]) - .transpose(include_header=True, header_name="genome", column_names=["tRNA count"]) + .select( + [(pl.col(c) != 0).cast(pl.Int64).sum().alias(c) for c in sample_cols] + ) + .transpose( + include_header=True, header_name="genome", column_names=["tRNA count"] + ) ) genome_stats = genome_stats.join(df_trna, on="genome", how="inner") - + if quast_frame is not None: - quast_frame = ( - quast_frame - .rename({groupby_column: "genome"}) - .drop("no. contigs") - ) + quast_frame = quast_frame.rename({groupby_column: "genome"}).drop("no. contigs") genome_stats = genome_stats.join(quast_frame, on="genome", how="inner") - assert genome_stats.shape[0] == quast_frame.shape[0], "genomes from annotation file don't map to quast file" + assert genome_stats.shape[0] == quast_frame.shape[0], ( + "genomes from annotation file don't map to quast file" + ) return genome_stats @@ -150,22 +190,46 @@ def make_genome_stats(annotations: pl.DataFrame, rrna_frame: pl.DataFrame = None @click.option("--rrna_path", help="rRNA output from annotation") @click.option("--trna_path", help="tRNA output from annotation") @click.option("--quast_path", help="Quast summary TSV from the quast step") -@click.option("--groupby_column", help="Column from annotations to group as organism units", - default=FASTA_COLUMN) -@click.option("--distil_topics", default="default", help="Default distillates topics to run.") -@click.option("--distil_ecosystem", default="eng_sys,ag", help="Default distillates ecosystems to run.") -@click.option("--custom_distillate", default=[], callback=validate_comma_separated, help="Custom distillate forms to add your own modules, comma separated. ") -def distill(input_file, rrna_path=None, trna_path=None, quast_path=None, groupby_column=FASTA_COLUMN, distil_topics=None, distil_ecosystem=None, - custom_distillate=None): +@click.option( + "--groupby_column", + help="Column from annotations to group as organism units", + default=FASTA_COLUMN, +) +@click.option( + "--distil_topics", default="default", help="Default distillates topics to run." +) +@click.option( + "--distil_ecosystem", + default="eng_sys,ag", + help="Default distillates ecosystems to run.", +) +@click.option( + "--custom_distillate", + default=[], + callback=validate_comma_separated, + help="Custom distillate forms to add your own modules, comma separated. ", +) +def distill( + input_file, + rrna_path=None, + trna_path=None, + quast_path=None, + groupby_column=FASTA_COLUMN, + distil_topics=None, + distil_ecosystem=None, + custom_distillate=None, +): """Summarize metabolic content of annotated genomes""" # read in data try: - annotations = pl.read_csv(input_file, separator="\t", infer_schema_length=10_000) - except Exception as e: + annotations = pl.read_csv( + input_file, separator="\t", infer_schema_length=10_000 + ) + except Exception: annotations = pl.read_csv(input_file, separator="\t", infer_schema_length=None) - if 'bin_taxnomy' in annotations: - annotations = annotations.sort_values('bin_taxonomy') + if "bin_taxnomy" in annotations: + annotations = annotations.sort_values("bin_taxonomy") # Check the columns are present check_columns(annotations, logger) @@ -182,58 +246,72 @@ def distill(input_file, rrna_path=None, trna_path=None, quast_path=None, groupby DISTILL_DIR / "distill_misc.tsv", DISTILL_DIR / "distill_nitrogen.tsv", DISTILL_DIR / "distill_transport.tsv", - DISTILL_DIR / "distill_metals.tsv" + DISTILL_DIR / "distill_metals.tsv", ] else: - if 'carbon' in distil_topics: + if "carbon" in distil_topics: distil_sheets_names.append(DISTILL_DIR / "distill_carbon.tsv") - if 'energy' in distil_topics: + if "energy" in distil_topics: distil_sheets_names.append(DISTILL_DIR / "distill_energy.tsv") - if 'misc' in distil_topics: + if "misc" in distil_topics: distil_sheets_names.append(DISTILL_DIR / "distill_misc.tsv") - if 'nitrogen' in distil_topics: + if "nitrogen" in distil_topics: distil_sheets_names.append(DISTILL_DIR / "distill_nitrogen.tsv") - if 'transport' in distil_topics: + if "transport" in distil_topics: distil_sheets_names.append(DISTILL_DIR / "distill_transport.tsv") if "metals" in distil_topics: distil_sheets_names.append(DISTILL_DIR / "distill_metals.tsv") - - + if "ag" in distil_ecosystem: distil_sheets_names.append(DISTILL_DIR / "distill_ag.tsv") if "eng_sys" in distil_ecosystem: distil_sheets_names.append(DISTILL_DIR / "distill_eng_sys.tsv") - - if "camper_id" in annotations and ("default" in distil_topics or "camper" in distil_topics): + + if "camper_id" in annotations and ( + "default" in distil_topics or "camper" in distil_topics + ): distil_sheets_names.append(DISTILL_DIR / "distill_camper.tsv") - + logger.info(f"Distillate dir: {DISTILL_DIR}") logger.info(f"Distillate sheets to be used: {distil_sheets_names}") if custom_distillate: for custom_sheet in custom_distillate: distil_sheets_names.append(custom_sheet) - + genome_summary_form = pl.concat( [ - pl.scan_csv(s, separator="\t") - .select([c for c in FRAME_COLUMNS if c in pl.scan_csv(s, separator="\t", n_rows=0).columns]) + pl.scan_csv(s, separator="\t").select( + [ + c + for c in FRAME_COLUMNS + if c in pl.scan_csv(s, separator="\t", n_rows=0).columns + ] + ) for s in distil_sheets_names ], how="diagonal", ) - - logger.info('Retrieved distillate genome summary form') + + logger.info("Retrieved distillate genome summary form") # make genome stats - genome_stats = make_genome_stats(annotations, rrna_frame, trna_frame, quast_frame=quast_frame, groupby_column=groupby_column) - genome_stats.write_csv('genome_stats.tsv', separator='\t') - logger.info('Calculated genome statistics') + genome_stats = make_genome_stats( + annotations, + rrna_frame, + trna_frame, + quast_frame=quast_frame, + groupby_column=groupby_column, + ) + genome_stats.write_csv("genome_stats.tsv", separator="\t") + logger.info("Calculated genome statistics") # make genome metabolism summary - genome_summary = 'metabolism_summary.xlsx' - logger.info(f'Giving counts for genome metabolism summary') - summarized_genomes = make_genome_summary(annotations, genome_summary_form, logger, groupby_column) - summarized_genomes.write_csv('summarized_genomes.tsv', separator='\t') + genome_summary = "metabolism_summary.xlsx" + logger.info("Giving counts for genome metabolism summary") + summarized_genomes = make_genome_summary( + annotations, genome_summary_form, logger, groupby_column + ) + summarized_genomes.write_csv("summarized_genomes.tsv", separator="\t") kw = {"extra_frames": []} if rrna_frame is not None: kw["extra_frames"].append(rrna_frame) @@ -244,10 +322,10 @@ def distill(input_file, rrna_path=None, trna_path=None, quast_path=None, groupby output_file=genome_summary, group_by=COL_SHEET, sort_order_columns=DISTILATE_SORT_ORDER_COLUMNS, - **kw + **kw, ) - logger.info('Generated genome metabolism summary') + logger.info("Generated genome metabolism summary") + - if __name__ == "__main__": distill() diff --git a/bin/format_kegg_database.py b/bin/format_kegg_database.py index 9df6830e..5287c994 100755 --- a/bin/format_kegg_database.py +++ b/bin/format_kegg_database.py @@ -1,5 +1,5 @@ #!/usr/bin/env python -from os import path, mkdir +from os import path from datetime import datetime from shutil import move, rmtree from glob import glob @@ -77,7 +77,7 @@ def process_kegg( create_mmseqs( kegg_mod_loc, kegg_mmseqs_db, - #create_index=True, + # create_index=True, threads=threads, ) LOGGER.info("KEGG database processed") @@ -149,17 +149,32 @@ def main(): "--gene_ko_link_loc", type=str, help="Path to the gene KO link file" ) parser.add_argument( - "--skip_gene_ko_link", type=bool, help="Skip gene KO link processing. If not passed in, `--gene_ko_link_loc` is required", default=False + "--skip_gene_ko_link", + type=bool, + help="Skip gene KO link processing. If not passed in, `--gene_ko_link_loc` is required", + default=False, + ) + parser.add_argument( + "--output_dir", type=str, help="Path to the output directory", default="kegg" + ) + parser.add_argument( + "--download_date", + type=str, + help="Date of the KEGG download, if not included, will use today's date", + ) + parser.add_argument( + "--threads", type=int, help="Number of threads to use", default=10 ) - parser.add_argument("--output_dir", type=str, help="Path to the output directory", default="kegg") - parser.add_argument("--download_date", type=str, help="Date of the KEGG download, if not included, will use today's date") - parser.add_argument("--threads", type=int, help="Number of threads to use", default=10) args = parser.parse_args() - + if not args.skip_gene_ko_link and not args.gene_ko_link_loc: - parser.error("If `--skip_gene_ko_link` is not passed in, `--gene_ko_link_loc` is required") + parser.error( + "If `--skip_gene_ko_link` is not passed in, `--gene_ko_link_loc` is required" + ) if args.skip_gene_ko_link and args.gene_ko_link_loc: - parser.error("If `--skip_gene_ko_link` is passed in, `--gene_ko_link_loc` is not allowed") + parser.error( + "If `--skip_gene_ko_link` is passed in, `--gene_ko_link_loc` is not allowed" + ) prepare_databases( kegg_loc=args.kegg_loc, diff --git a/bin/generate_gff_genbank.py b/bin/generate_gff_genbank.py index 33ef4552..a23f0702 100755 --- a/bin/generate_gff_genbank.py +++ b/bin/generate_gff_genbank.py @@ -3,8 +3,6 @@ import csv from collections import defaultdict import os -import glob -from datetime import datetime from Bio import SeqIO from Bio.SeqRecord import SeqRecord from Bio.SeqFeature import SeqFeature, FeatureLocation @@ -12,22 +10,43 @@ import logging import urllib.parse # For escaping characters in accordance with RFC 3986 -logging.basicConfig(level=logging.DEBUG, format='%(asctime)s - %(levelname)s - %(message)s') +logging.basicConfig( + level=logging.DEBUG, format="%(asctime)s - %(levelname)s - %(message)s" +) + +FASTA_COLUMN = os.getenv("FASTA_COLUMN", "input_fasta") -FASTA_COLUMN = os.getenv('FASTA_COLUMN', 'input_fasta') def parse_arguments(): """Parse command line arguments.""" - parser = argparse.ArgumentParser(description="Generate GFF and/or GBK files from raw annotations, with specified databases formatting.") - parser.add_argument("--gff", action='store_true', help="Generate GFF file") - parser.add_argument("--gbk", action='store_true', help="Generate GBK file") - parser.add_argument("--input_fastas_paths", nargs='+', help="Alternating list of input_fasta names and paths to their .fna files.") - parser.add_argument("--database_list", type=str, help="Comma-separated list of databases to include in the annotations. Use 'empty' for all.", default="empty") - parser.add_argument("--annotations", required=True, help="Path to the raw annotations file") + parser = argparse.ArgumentParser( + description="Generate GFF and/or GBK files from raw annotations, with specified databases formatting." + ) + parser.add_argument("--gff", action="store_true", help="Generate GFF file") + parser.add_argument("--gbk", action="store_true", help="Generate GBK file") + parser.add_argument( + "--input_fastas_paths", + nargs="+", + help="Alternating list of input_fasta names and paths to their .fna files.", + ) + parser.add_argument( + "--database_list", + type=str, + help="Comma-separated list of databases to include in the annotations. Use 'empty' for all.", + default="empty", + ) + parser.add_argument( + "--annotations", required=True, help="Path to the raw annotations file" + ) args = parser.parse_args() - args.database_list = None if (args.database_list == "empty" or args.database_list == "all") else args.database_list.split(',') + args.database_list = ( + None + if (args.database_list == "empty" or args.database_list == "all") + else args.database_list.split(",") + ) return args + def parse_input_fastas_and_paths(input_fastas_paths): """ Parses the provided list of input_fasta names and .fna file paths into a structured dictionary. @@ -36,19 +55,22 @@ def parse_input_fastas_and_paths(input_fastas_paths): iterator = iter(cleaned_input_fastas_paths) return dict(zip(iterator, iterator)) + def sanitize_taxonomy(taxonomy): """ Sanitizes the taxonomy string for safe inclusion in GFF comments. Replaces semicolons with commas or another safe delimiter to avoid parsing issues. """ - return taxonomy.replace(';', ',') # Replace semicolons with commas + return taxonomy.replace(";", ",") # Replace semicolons with commas + def escape_gff3_value(value): """ Escapes characters in a string for GFF3 compliance, using URL encoding. """ # RFC 3986 percent-encoding, excluding reserved characters used in GFF3 format - return urllib.parse.quote(value, safe=':/,=.-') + return urllib.parse.quote(value, safe=":/,=.-") + def format_attributes(annotation, database_list): """ @@ -57,16 +79,17 @@ def format_attributes(annotation, database_list): """ attributes = [] for key, value in sorted(annotation.items()): - if (key.endswith('_id') or key.endswith('_description')) and value: - db_name = key.split('_')[0] + if (key.endswith("_id") or key.endswith("_description")) and value: + db_name = key.split("_")[0] if database_list is None or db_name in database_list: # Ensure value is URL-encoded encoded_value = escape_gff3_value(value) attributes.append(f"{db_name.upper()}_{key.upper()}={encoded_value}") - + # Join attributes with semicolons, avoiding spaces for GFF3 compliance return ";".join(attributes) + def generate_gff(input_fastas_annotations, database_list): """ Generate GFF files for each input_fasta, filtered by specified databases, @@ -76,34 +99,37 @@ def generate_gff(input_fastas_annotations, database_list): for input_fasta, annotations in input_fastas_annotations.items(): with open(f"GFF/{input_fasta}.gff", "w") as gff_file: gff_file.write("##gff-version 3\n") - + # Extract metadata from the first annotation (assuming it's consistent across annotations) metadata = annotations[0] - completeness = metadata.get('Completeness', 'NA') - contamination = metadata.get('Contamination', 'NA') - taxonomy = escape_gff3_value(metadata.get('taxonomy', 'NA').replace(';', ',')) - + completeness = metadata.get("Completeness", "NA") + contamination = metadata.get("Contamination", "NA") + taxonomy = escape_gff3_value( + metadata.get("taxonomy", "NA").replace(";", ",") + ) + gff_file.write(f"# Completeness: {completeness}\n") gff_file.write(f"# Contamination: {contamination}\n") gff_file.write(f"# Taxonomy: {taxonomy}\n") - + for annotation in annotations: try: - seqid = escape_gff3_value(annotation['query_id']) - source = '.' + seqid = escape_gff3_value(annotation["query_id"]) + source = "." type = "gene" - start = annotation['start_position'] - end = annotation['stop_position'] - score = '.' - strand = '+' if annotation['strandedness'] == '+1' else '-' - phase = '.' + start = annotation["start_position"] + end = annotation["stop_position"] + score = "." + strand = "+" if annotation["strandedness"] == "+1" else "-" + phase = "." attributes_str = format_attributes(annotation, database_list) - + gff_line = f"{seqid}\t{source}\t{type}\t{start}\t{end}\t{score}\t{strand}\t{phase}\t{attributes_str}\n" gff_file.write(gff_line) except KeyError as e: - logging.warning(f"Missing key in annotation: {e}. Skipping annotation: {annotation}") - + logging.warning( + f"Missing key in annotation: {e}. Skipping annotation: {annotation}" + ) def parse_fna_sequence(fna_file_path): @@ -114,6 +140,7 @@ def parse_fna_sequence(fna_file_path): sequences[header_name] = seq_record.seq return sequences + def aggregate_input_fasta_sequences(input_fastas_and_paths): """ Aggregate sequences from .fna files, ensuring correct matching with input_fasta names. @@ -123,11 +150,14 @@ def aggregate_input_fasta_sequences(input_fastas_and_paths): for input_fasta, file_path in input_fastas_and_paths.items(): if os.path.exists(file_path): # Assuming we're collecting all sequences for a input_fasta in a list - sequences[input_fasta] = [seq_record.seq for seq_record in SeqIO.parse(file_path, "fasta")] + sequences[input_fasta] = [ + seq_record.seq for seq_record in SeqIO.parse(file_path, "fasta") + ] else: print(f"File does not exist: {file_path}") return sequences + def format_qualifiers(annotation, database_list=None): """ Formats qualifiers for a GenBank feature, ensuring correct syntax and inclusion of essential information. @@ -135,38 +165,53 @@ def format_qualifiers(annotation, database_list=None): """ qualifiers = {} for key, value in annotation.items(): - if key in ['gene', 'product', 'note', 'function', 'locus_tag']: # Add 'locus_tag' if relevant + if key in [ + "gene", + "product", + "note", + "function", + "locus_tag", + ]: # Add 'locus_tag' if relevant qualifiers[key] = value else: # Check if the key is database-specific and whether it should be included - db_name = key.split('_')[0] + db_name = key.split("_")[0] if database_list is None or db_name in database_list: qualifiers[key] = value return qualifiers + def generate_gbk_feature(annotation): """Generate a SeqFeature for a GenBank file based on annotation data.""" - start = int(annotation['start_position']) - 1 # Convert to 0-based indexing - end = int(annotation['stop_position']) # End is inclusive, no adjustment needed - strand = 1 if annotation['strandedness'] == '+1' else -1 # Convert strandedness + start = int(annotation["start_position"]) - 1 # Convert to 0-based indexing + end = int(annotation["stop_position"]) # End is inclusive, no adjustment needed + strand = 1 if annotation["strandedness"] == "+1" else -1 # Convert strandedness location = FeatureLocation(start, end, strand=strand) qualifiers = { - 'locus_tag': annotation.get('query_id', 'unknown_locus'), + "locus_tag": annotation.get("query_id", "unknown_locus"), # Assuming 'product' or a general description can be derived from the data - 'product': next((annotation.get(k) for k in annotation.keys() if k.endswith('_description') and annotation[k]), 'unknown product') + "product": next( + ( + annotation.get(k) + for k in annotation.keys() + if k.endswith("_description") and annotation[k] + ), + "unknown product", + ), } # Dynamically add database-specific information as qualifiers for key, value in annotation.items(): - if key.endswith(('_id', '_description', '_EC')) and value: + if key.endswith(("_id", "_description", "_EC")) and value: # Simple heuristic to extract database prefix and adjust it if necessary - db_prefix = key.split('_')[0] + db_prefix = key.split("_")[0] qualifier_key = f"db_{db_prefix}" qualifiers[qualifier_key] = value return SeqFeature(location=location, type="CDS", qualifiers=qualifiers) + def generate_gbk(input_fastas_annotations, database_list, input_fastas_and_paths): os.makedirs("GBK", exist_ok=True) # Ensure the output directory exists @@ -182,15 +227,24 @@ def generate_gbk(input_fastas_annotations, database_list, input_fastas_and_paths sequence_index = SeqIO.index(fna_file_path, "fasta") # Initialize a SeqRecord for the input_fasta - input_fasta_seq_record = SeqRecord(Seq(""), id=input_fasta, name="", description=f"Annotations for {input_fasta}") - + input_fasta_seq_record = SeqRecord( + Seq(""), + id=input_fasta, + name="", + description=f"Annotations for {input_fasta}", + ) + # Extract metadata from one of the annotations (assuming consistency) metadata = annotations[0] if annotations else {} input_fasta_seq_record.annotations["source"] = "Your Source" input_fasta_seq_record.annotations["molecule_type"] = "DNA" - input_fasta_seq_record.annotations["organism"] = metadata.get('taxonomy', 'Not Available') - input_fasta_seq_record.annotations["comment"] = f"Completeness: {metadata.get('Completeness', 'NA')}; Contamination: {metadata.get('Contamination', 'NA')}; Taxonomy: {metadata.get('taxonomy', 'Not Available')}" - + input_fasta_seq_record.annotations["organism"] = metadata.get( + "taxonomy", "Not Available" + ) + input_fasta_seq_record.annotations["comment"] = ( + f"Completeness: {metadata.get('Completeness', 'NA')}; Contamination: {metadata.get('Contamination', 'NA')}; Taxonomy: {metadata.get('taxonomy', 'Not Available')}" + ) + # Iterate through annotations, creating features for each for annotation in annotations: query_id = annotation["query_id"] @@ -198,25 +252,26 @@ def generate_gbk(input_fastas_annotations, database_list, input_fastas_and_paths feature = generate_gbk_feature(annotation) input_fasta_seq_record.features.append(feature) else: - print(f"Warning: Query ID {query_id} not found in .fna file for input_fasta {input_fasta}.") + print( + f"Warning: Query ID {query_id} not found in .fna file for input_fasta {input_fasta}." + ) # Determine the output file path output_filename = os.path.join("GBK", f"{input_fasta}.gbk") - + # Write the SeqRecord to a GBK file with open(output_filename, "w") as output_handle: SeqIO.write([input_fasta_seq_record], output_handle, "genbank") print(f"GBK file generated for input_fasta {input_fasta}: {output_filename}") - def main(): args = parse_arguments() # Load annotations and organize by input_fasta input_fastas_annotations = defaultdict(list) - with open(args.annotations, 'r') as file: - reader = csv.DictReader(file, delimiter='\t') + with open(args.annotations, "r") as file: + reader = csv.DictReader(file, delimiter="\t") for row in reader: input_fastas_annotations[row[FASTA_COLUMN]].append(row) @@ -229,7 +284,10 @@ def main(): # Check if GBK generation is requested and call generate_gbk if args.gbk: - generate_gbk(input_fastas_annotations, args.database_list, input_fastas_and_paths) + generate_gbk( + input_fastas_annotations, args.database_list, input_fastas_and_paths + ) + if __name__ == "__main__": main() diff --git a/bin/hmm_parser.py b/bin/hmm_parser.py index 45cbce7b..73490b43 100755 --- a/bin/hmm_parser.py +++ b/bin/hmm_parser.py @@ -5,35 +5,98 @@ import numpy as np # query_id is targey name, but this matches our query_name later for merging -# In DRAM1 we had query and target swapped compared to usual HMMER terminology +# In DRAM1 we had query and target swapped compared to usual HMMER terminology # (so query_name here was target_id in DRAM1, model_start model_end were target_start target_end in DRAM1, etc.) -HMMSCAN_ALL_COLUMNS = ['query_id', 'target_ascession', 'target_length', 'query_name', 'query_ascession', 'query_length', 'full_evalue', 'full_bitScore', 'full_bias', 'domain_number', 'domain_count', 'domain_cevalue', 'domain_ievalue', 'domain_bitScore', 'domain_bias', 'model_start', 'model_end', 'alignment_start', 'alignment_end', 'env_start', 'env_end', 'accuracy', 'description'] -HMMSCAN_COLUMN_TYPES = [str, str, int, str, str, int, float, float, float, int, int, float, float, float, float, int, int, int, int, int, int, float, str] +HMMSCAN_ALL_COLUMNS = [ + "query_id", + "target_ascession", + "target_length", + "query_name", + "query_ascession", + "query_length", + "full_evalue", + "full_bitScore", + "full_bias", + "domain_number", + "domain_count", + "domain_cevalue", + "domain_ievalue", + "domain_bitScore", + "domain_bias", + "model_start", + "model_end", + "alignment_start", + "alignment_end", + "env_start", + "env_end", + "accuracy", + "description", +] +HMMSCAN_COLUMN_TYPES = [ + str, + str, + int, + str, + str, + int, + float, + float, + float, + int, + int, + float, + float, + float, + float, + int, + int, + int, + int, + int, + int, + float, + str, +] # Potential Columns to include in the final output if they are in the DataFrame (depends on the HMM info file provided and how things are process) -OUTPUT_COLUMNS = ['query_id', 'start_position', 'stop_position', 'strandedness', '{db_name}_id', '{db_name}_ids', "{db_name}_full_bitScore", "{db_name}_domain_bitScore", 'description', '{db_name}_EC', "{db_name}_score_rank"] +OUTPUT_COLUMNS = [ + "query_id", + "start_position", + "stop_position", + "strandedness", + "{db_name}_id", + "{db_name}_ids", + "{db_name}_full_bitScore", + "{db_name}_domain_bitScore", + "description", + "{db_name}_EC", + "{db_name}_score_rank", +] def parse_hmmsearch_domtblout(file): print(file) df_lines = [] for line in open(file): - if not line.startswith('#'): + if not line.startswith("#"): line = line.split() - line = line[:22] + [' '.join(line[22:])] + line = line[:22] + [" ".join(line[22:])] df_lines.append(line) column_data = {col: [] for col in HMMSCAN_ALL_COLUMNS} for line in df_lines: for i, col in enumerate(HMMSCAN_ALL_COLUMNS): - column_data[col].append(HMMSCAN_COLUMN_TYPES[i](line[i])) + column_data[col].append(HMMSCAN_COLUMN_TYPES[i](line[i])) hmmsearch_frame = pd.DataFrame(column_data) - + # Extract the sign part from the description column to determine strandedness - hmmsearch_frame['strandedness'] = hmmsearch_frame['description'].apply(lambda x: 1 if x.endswith('+') else -1) + hmmsearch_frame["strandedness"] = hmmsearch_frame["description"].apply( + lambda x: 1 if x.endswith("+") else -1 + ) return hmmsearch_frame - + + def sig_scores_row_by_row(df, db_name) -> pd.DataFrame: df = df.loc[df["score_type"].isin(["full", "domain"])] score = df["full_bitScore"].copy() @@ -54,15 +117,18 @@ def sig_scores_row_by_row(df, db_name) -> pd.DataFrame: conditions = [ (score >= s_a), - (score >= s_b) + (score >= s_b), # The default covers all other cases ] choices = ["A", "B"] df[f"{db_name}_score_rank"] = np.select(conditions, choices, default=pd.NA) df = df.dropna(subset=[f"{db_name}_score_rank"]) else: - raise ValueError(f"No threshold or A_rank columns found in provided info sheet to determine significant hits for {db_name} hmm DB.") - return df + raise ValueError( + f"No threshold or A_rank columns found in provided info sheet to determine significant hits for {db_name} hmm DB." + ) + return df + def get_all_hits(hits, db_name): return ( @@ -71,23 +137,43 @@ def get_all_hits(hits, db_name): .agg("; ".join) ) + def extract_ec_numbers(definition): """ Extract EC numbers from the definition string and format them into a semi-colon separated list. Each EC number is prefixed with 'EC:'. """ # This regex pattern looks for EC numbers within square brackets and captures the numbers following "EC:" - ec_numbers = re.findall(r'\[EC:(.*?)\]', definition) + ec_numbers = re.findall(r"\[EC:(.*?)\]", definition) # Join the EC numbers with semi-colon separator and prepend 'EC:' to each number - formatted_ec_numbers = '; '.join([f"EC:{ec.strip()}" for ec_block in ec_numbers for ec in ec_block.split()]) + formatted_ec_numbers = "; ".join( + [f"EC:{ec.strip()}" for ec_block in ec_numbers for ec in ec_block.split()] + ) return formatted_ec_numbers + @click.command() -@click.option("--hmm_domtbl", type=click.Path(exists=True), help="Path to the HMM search results domtblout file.") -@click.option("--hmm_info_path", type=click.Path(exists=True), help="Path to the hmm_info_path file.") -@click.option("--ec_from_info", is_flag=True, help="Extract EC numbers from definitions in info sheet. Can only be used if hmm_info_path is provided.") -@click.option("--gene_locs", type=click.Path(exists=True), help="Path to the gene locations TSV file.") -@click.option('--db_name', type=str, help='Name of the HMM database.') +@click.option( + "--hmm_domtbl", + type=click.Path(exists=True), + help="Path to the HMM search results domtblout file.", +) +@click.option( + "--hmm_info_path", + type=click.Path(exists=True), + help="Path to the hmm_info_path file.", +) +@click.option( + "--ec_from_info", + is_flag=True, + help="Extract EC numbers from definitions in info sheet. Can only be used if hmm_info_path is provided.", +) +@click.option( + "--gene_locs", + type=click.Path(exists=True), + help="Path to the gene locations TSV file.", +) +@click.option("--db_name", type=str, help="Name of the HMM database.") @click.option("--output", type=click.Path(), help="Path to the formatted output file.") def main(hmm_domtbl, hmm_info_path, ec_from_info, gene_locs, db_name, output): hits = parse_hmmsearch_domtblout(hmm_domtbl) @@ -100,16 +186,20 @@ def main(hmm_domtbl, hmm_info_path, ec_from_info, gene_locs, db_name, output): return # Load gene locations TSV file print("Loading gene locations TSV file...") - gene_locs_df = pd.read_csv(gene_locs, sep='\t', usecols=['query_id', 'start_position', 'stop_position']) + gene_locs_df = pd.read_csv( + gene_locs, sep="\t", usecols=["query_id", "start_position", "stop_position"] + ) # Merge hits_df with gene_locs_df - hits = pd.merge(hits, gene_locs_df, on='query_id', how='left') + hits = pd.merge(hits, gene_locs_df, on="query_id", how="left") - hits['perc_cov'] = (hits['model_end'] - hits['model_start'] + 1) / hits['query_length'] - hits[f'{db_name}_id'] = hits['query_name'].str.replace(r'.hmm', '', regex=True) + hits["perc_cov"] = (hits["model_end"] - hits["model_start"] + 1) / hits[ + "query_length" + ] + hits[f"{db_name}_id"] = hits["query_name"].str.replace(r".hmm", "", regex=True) all_hits = get_all_hits(hits, db_name) all_hits.name = f"{db_name}_ids" - hits = hits.merge(all_hits, how='left', left_on='query_id', right_index=True) + hits = hits.merge(all_hits, how="left", left_on="query_id", right_index=True) hmm_sheet = False if hmm_info_path is not None: @@ -118,12 +208,21 @@ def main(hmm_domtbl, hmm_info_path, ec_from_info, gene_locs, db_name, output): hmm_info = pd.read_csv(hmm_info_path, sep="\t", index_col=0) except Exception as e: try: - hmm_info = pd.read_csv(hmm_info_path, sep="\t", index_col=0, on_bad_lines='skip') + hmm_info = pd.read_csv( + hmm_info_path, sep="\t", index_col=0, on_bad_lines="skip" + ) except Exception as e2: print(f"Error reading HMM info file: {e}\n{e2}") hmm_sheet = False if hmm_sheet and not hmm_info.empty: - merge_cols = ['score_type', 'threshold', f"{db_name}_EC", "description", "A_rank", "B_rank"] + merge_cols = [ + "score_type", + "threshold", + f"{db_name}_EC", + "description", + "A_rank", + "B_rank", + ] raise_on_ec = False if "description" in hmm_info.columns: pass @@ -136,18 +235,33 @@ def main(hmm_domtbl, hmm_info_path, ec_from_info, gene_locs, db_name, output): if ec_from_info: if raise_on_ec: - raise ValueError("No suitable column found for descriptions in hmm_info_path.") - hmm_info[f"{db_name}_EC"] = hmm_info["description"].apply(extract_ec_numbers) + raise ValueError( + "No suitable column found for descriptions in hmm_info_path." + ) + hmm_info[f"{db_name}_EC"] = hmm_info["description"].apply( + extract_ec_numbers + ) merge_cols = [col for col in merge_cols if col in hmm_info.columns] - hits = hits.merge(hmm_info[merge_cols], how='left', left_on="query_name", right_index=True) + hits = hits.merge( + hmm_info[merge_cols], how="left", left_on="query_name", right_index=True + ) hits_sig = sig_scores_row_by_row(hits, db_name=db_name) - drop_cols = [col for col in merge_cols if col in hits_sig.columns and col not in [f"{db_name}_EC", "description",]] + drop_cols = [ + col + for col in merge_cols + if col in hits_sig.columns + and col + not in [ + f"{db_name}_EC", + "description", + ] + ] hits_sig = hits_sig.drop(columns=drop_cols) else: hits_sig = hits[hits["perc_cov"] >= 0.35] - + if len(hits_sig) == 0: # if nothing significant then return nothing, don't get descriptions # df = pd.DataFrame(columns=OUTPUT_COLUMNS) @@ -156,14 +270,26 @@ def main(hmm_domtbl, hmm_info_path, ec_from_info, gene_locs, db_name, output): # Get the best hit # hits_sig = hits_sig.sort_values(['full_evalue', "domain_ievalue", "perc_cov"], ascending=[True, True, False]).drop_duplicates(subset=["query_id"]) - hits_sig = hits_sig.sort_values(['full_evalue', "perc_cov"], ascending=[True, False]).drop_duplicates(subset=["query_id"]) - hits_sig = hits_sig.rename(columns={"full_bitScore": f"{db_name}_full_bitScore", "domain_bitScore": f"{db_name}_domain_bitScore"}) - - final_cols = [col for col in [col.format(db_name=db_name) for col in OUTPUT_COLUMNS] if col in hits_sig.columns] + hits_sig = hits_sig.sort_values( + ["full_evalue", "perc_cov"], ascending=[True, False] + ).drop_duplicates(subset=["query_id"]) + hits_sig = hits_sig.rename( + columns={ + "full_bitScore": f"{db_name}_full_bitScore", + "domain_bitScore": f"{db_name}_domain_bitScore", + } + ) + + final_cols = [ + col + for col in [col.format(db_name=db_name) for col in OUTPUT_COLUMNS] + if col in hits_sig.columns + ] hits_sig = hits_sig[final_cols] # Save the modified DataFrame to CSV hits_sig.to_csv(output, index=False) -if __name__ == '__main__': + +if __name__ == "__main__": main() diff --git a/bin/mmseqs_add_descriptions.py b/bin/mmseqs_add_descriptions.py index 794d5506..50f0bea6 100755 --- a/bin/mmseqs_add_descriptions.py +++ b/bin/mmseqs_add_descriptions.py @@ -2,71 +2,118 @@ import sys import pandas as pd + def assign_rank(row, a_rank, b_rank, db_name_bit_score): """Assign rank based on bit score and provided thresholds.""" if pd.isna(row[db_name_bit_score]): return None elif row[db_name_bit_score] >= a_rank: - return 'A' + return "A" elif row[db_name_bit_score] >= b_rank: - return 'B' + return "B" else: return None -def main(input_fasta, db_name, descriptions_path, bit_score_threshold, gene_locs_path, raw_mmseqs_path , output_path): + +def main( + input_fasta, + db_name, + descriptions_path, + bit_score_threshold, + gene_locs_path, + raw_mmseqs_path, + output_path, +): print(f"Starting processing for input_fasta: {input_fasta}, database: {db_name}") print(f"Loading MMseqs output from {raw_mmseqs_path}") - - df_gene_locs = pd.read_csv(gene_locs_path, sep='\t', usecols=['query_id', 'start_position', 'stop_position']) + + df_gene_locs = pd.read_csv( + gene_locs_path, + sep="\t", + usecols=["query_id", "start_position", "stop_position"], + ) print("Gene locations loaded. Sample rows:") print(df_gene_locs.head()) - - df_mmseqs = pd.read_csv(raw_mmseqs_path, sep='\t', header=None, usecols=[0, 1, 11]) - df_mmseqs.columns = ['query_id', f'{db_name}_id', f'{db_name}_bitScore'] + + df_mmseqs = pd.read_csv(raw_mmseqs_path, sep="\t", header=None, usecols=[0, 1, 11]) + df_mmseqs.columns = ["query_id", f"{db_name}_id", f"{db_name}_bitScore"] print("MMseqs data loaded and columns renamed. Sample rows:") print(df_mmseqs.head()) - - df_merged = pd.merge(df_mmseqs, df_gene_locs, on='query_id', how='left') + + df_merged = pd.merge(df_mmseqs, df_gene_locs, on="query_id", how="left") print("Merged MMseqs output with gene locations. Sample rows:") print(df_merged.head()) if descriptions_path != "NULL": - df_descriptions = pd.read_csv(descriptions_path, sep='\t') + df_descriptions = pd.read_csv(descriptions_path, sep="\t") first_column = df_descriptions.columns[0] - df_descriptions.rename(columns={first_column: f'{db_name}_id'}, inplace=True) - + df_descriptions.rename(columns={first_column: f"{db_name}_id"}, inplace=True) + # Rename 'definition' to 'description', and prefix it with db_name if it exists - if 'definition' in df_descriptions.columns: - df_descriptions.rename(columns={'definition': f'{db_name}_description'}, inplace=True) - elif 'description' in df_descriptions.columns: + if "definition" in df_descriptions.columns: + df_descriptions.rename( + columns={"definition": f"{db_name}_description"}, inplace=True + ) + elif "description" in df_descriptions.columns: # If 'description' already exists, just prefix it with db_name - df_descriptions.rename(columns={'description': f'{db_name}_description'}, inplace=True) - + df_descriptions.rename( + columns={"description": f"{db_name}_description"}, inplace=True + ) + # Prefix other columns except 'A_rank', 'B_rank', and the first column (already handled) - df_descriptions = df_descriptions.rename(columns={col: f"{db_name}_{col}" for col in df_descriptions.columns if col not in ['A_rank', 'B_rank', f'{db_name}_id', f'{db_name}_description']}) + df_descriptions = df_descriptions.rename( + columns={ + col: f"{db_name}_{col}" + for col in df_descriptions.columns + if col + not in ["A_rank", "B_rank", f"{db_name}_id", f"{db_name}_description"] + } + ) # Merge descriptions DataFrame - df_merged = pd.merge(df_merged, df_descriptions, on=f'{db_name}_id', how='left') - + df_merged = pd.merge(df_merged, df_descriptions, on=f"{db_name}_id", how="left") + # Assign ranks based on A_rank and B_rank thresholds, directly using them without db_name prefix - if 'A_rank' in df_descriptions.columns and 'B_rank' in df_descriptions.columns: + if "A_rank" in df_descriptions.columns and "B_rank" in df_descriptions.columns: db_name_bit_score = f"{db_name}_bitScore" - df_merged[f'{db_name}_rank'] = df_merged.apply(lambda row: assign_rank(row, row['A_rank'], row['B_rank'], db_name_bit_score), axis=1) - + df_merged[f"{db_name}_rank"] = df_merged.apply( + lambda row: assign_rank( + row, row["A_rank"], row["B_rank"], db_name_bit_score + ), + axis=1, + ) + # Drop A_rank and B_rank columns as they should not be output - df_merged.drop(columns=['A_rank', 'B_rank'], inplace=True, errors='ignore') + df_merged.drop(columns=["A_rank", "B_rank"], inplace=True, errors="ignore") df_merged.to_csv(output_path, index=False) print("Merged DataFrame saved to", output_path) + if __name__ == "__main__": input_fasta = sys.argv[1] db_name = sys.argv[2] descriptions_path = sys.argv[3] bit_score_threshold = float(sys.argv[4]) gene_locs_path = sys.argv[5] - raw_mmseqs_path = sys.argv[6] if len(sys.argv) > 6 else f"mmseqs_out/{input_fasta}___mmseqs_{db_name}.tsv" - output_path = sys.argv[7] if len(sys.argv) > 7 else f"mmseqs_out/{input_fasta}___mmseqs_{db_name}_formatted.csv" + raw_mmseqs_path = ( + sys.argv[6] + if len(sys.argv) > 6 + else f"mmseqs_out/{input_fasta}___mmseqs_{db_name}.tsv" + ) + output_path = ( + sys.argv[7] + if len(sys.argv) > 7 + else f"mmseqs_out/{input_fasta}___mmseqs_{db_name}_formatted.csv" + ) - main(input_fasta, db_name, descriptions_path, bit_score_threshold, gene_locs_path, raw_mmseqs_path, output_path) + main( + input_fasta, + db_name, + descriptions_path, + bit_score_threshold, + gene_locs_path, + raw_mmseqs_path, + output_path, + ) diff --git a/bin/parse_annotations.py b/bin/parse_annotations.py index 7326864c..26f73db2 100755 --- a/bin/parse_annotations.py +++ b/bin/parse_annotations.py @@ -3,28 +3,43 @@ import sys import os -FASTA_COLUMN = os.getenv('FASTA_COLUMN', 'input_fasta') +FASTA_COLUMN = os.getenv("FASTA_COLUMN", "input_fasta") + def extract_query_ids(tsv_path, ko_terms): - df = pd.read_csv(tsv_path, sep='\t') - + df = pd.read_csv(tsv_path, sep="\t") + # Split KO terms on newline to handle multiple entries correctly - ko_terms = ko_terms.strip().split('\n') + ko_terms = ko_terms.strip().split("\n") print(f"Searching for KOs: {ko_terms}") # Define columns to search for KO terms, excluding 'query_id' - search_columns = [col for col in df.columns if (col.endswith('_id') or col.endswith('_description') or col.endswith('_EC')) and col != 'query_id'] - + search_columns = [ + col + for col in df.columns + if (col.endswith("_id") or col.endswith("_description") or col.endswith("_EC")) + and col != "query_id" + ] + # Debugging: Output the columns being searched print(f"Searching in columns: {search_columns}") # Create a filter mask for any row containing any of the KO terms in the specified columns - mask = df[search_columns].apply(lambda x: x.astype(str).str.contains('|'.join(ko_terms), case=False, na=False)).any(axis=1) + mask = ( + df[search_columns] + .apply( + lambda x: x.astype(str).str.contains( + "|".join(ko_terms), case=False, na=False + ) + ) + .any(axis=1) + ) filtered_df = df[mask] print(f"Found {len(filtered_df)} matching entries.") - return filtered_df[[FASTA_COLUMN, 'query_id']] + return filtered_df[[FASTA_COLUMN, "query_id"]] + def main(): if len(sys.argv) != 4: @@ -32,15 +47,16 @@ def main(): sys.exit(1) tsv_path, ko_list_path, output_file = sys.argv[1:] - with open(ko_list_path, 'r') as f: + with open(ko_list_path, "r") as f: ko_list = f.read() results_df = extract_query_ids(tsv_path, ko_list) # Write results to output file - results_df.to_csv(output_file, sep='\t', index=False, header=False) + results_df.to_csv(output_file, sep="\t", index=False, header=False) print(f"Extracted {len(results_df)} entries written to {output_file}") -if __name__ == '__main__': + +if __name__ == "__main__": main() diff --git a/bin/parse_faa.sh b/bin/parse_faa.sh index 341067a4..b871775a 100755 --- a/bin/parse_faa.sh +++ b/bin/parse_faa.sh @@ -19,4 +19,4 @@ BEGIN { OFS="\t"; print "query_id","start_position","stop_position","strandednes }' "$INPUT_FILE" > "$OUTPUT_FILE" -trap 'echo "parsing input faa files failed. Check they have all the same metadata information in the header files as Prodigal outputs. Example header line: >OWC_0000_k121_3157_1 # 2 # 580 # -1 # ID=1_1;partial=10;start_type=ATG;rbs_motif=AATAA;rbs_spacer=15bp;gc_cont=0.439"; exit 1' ERR \ No newline at end of file +trap 'echo "parsing input faa files failed. Check they have all the same metadata information in the header files as Prodigal outputs. Example header line: >OWC_0000_k121_3157_1 # 2 # 580 # -1 # ID=1_1;partial=10;start_type=ATG;rbs_motif=AATAA;rbs_spacer=15bp;gc_cont=0.439"; exit 1' ERR diff --git a/bin/parse_gff.sh b/bin/parse_gff.sh deleted file mode 100755 index ecc92a65..00000000 --- a/bin/parse_gff.sh +++ /dev/null @@ -1,17 +0,0 @@ -#!/usr/bin/env bash -set -euo pipefail - -INPUT_FILE=$1 -OUTPUT_FILE=$2 - -awk -F'\t' ' -BEGIN { - OFS = "\t"; - print "query_id","start_position","stop_position","strandedness","gene_number" -} -# skip comments; keep CDS only -$0 !~ /^#/ && $3=="CDS" { - cnt[$1]++; # per-sequence gene counter - strand = ($7=="+") ? 1 : -1; # map strand to {+1,-1} - printf "%s_%d\t%d\t%d\t%d\t%d\n", $1, cnt[$1], $4, $5, strand, cnt[$1] -}' "$INPUT_FILE" > "$OUTPUT_FILE" \ No newline at end of file diff --git a/bin/process_quast.py b/bin/process_quast.py index 6a5f2bd0..c326574d 100755 --- a/bin/process_quast.py +++ b/bin/process_quast.py @@ -5,31 +5,32 @@ from utils.logger import get_logger from pathlib import Path -FASTA_COLUMN = os.getenv('FASTA_COLUMN', 'input_fasta') +FASTA_COLUMN = os.getenv("FASTA_COLUMN", "input_fasta") logger = get_logger(filename=Path(__file__).stem) # Function to count predicted genes in a GFF file def count_genes_in_gff(gff_file): - with open(gff_file, 'r') as file: - return sum(1 for line in file if '\\tCDS\\t' in line) + with open(gff_file, "r") as file: + return sum(1 for line in file if "\\tCDS\\t" in line) + # Find all FASTA and GFF files -gff_file_paths = glob('*.gff') +gff_file_paths = glob("*.gff") # Read the QUAST report generated for all input_fastas -quast_report_path = 'quast_results/report.tsv' -report_df = pd.read_csv(quast_report_path, sep='\t', index_col='Assembly') +quast_report_path = "quast_results/report.tsv" +report_df = pd.read_csv(quast_report_path, sep="\t", index_col="Assembly") logger.info(f"Number of gff files to process: {len(gff_file_paths)}") # Dynamically identify input_fasta names based on FASTA filenames and match with QUAST report collected_data = [] for i, gff_file in enumerate(gff_file_paths): - try: + try: base_name = os.path.splitext(os.path.basename(gff_file))[0] - input_fasta_name = base_name.split('_called_genes')[0] + input_fasta_name = base_name.split("_called_genes")[0] num_genes = count_genes_in_gff(gff_file) # Extract metrics from the QUAST report for this input_fasta @@ -37,22 +38,22 @@ def count_genes_in_gff(gff_file): if input_fasta_name in column: metrics = { FASTA_COLUMN: input_fasta_name, - 'assembly size': report_df.loc['Total length', column], - 'no. contigs': report_df.loc['# contigs', column], - 'largest contig': report_df.loc['Largest contig', column], - 'N50': report_df.loc['N50', column], - 'L50': report_df.loc['L50', column], - 'GC (%)': report_df.loc['GC (%)', column], - 'no. pred. genes': num_genes + "assembly size": report_df.loc["Total length", column], + "no. contigs": report_df.loc["# contigs", column], + "largest contig": report_df.loc["Largest contig", column], + "N50": report_df.loc["N50", column], + "L50": report_df.loc["L50", column], + "GC (%)": report_df.loc["GC (%)", column], + "no. pred. genes": num_genes, } collected_data.append(metrics) break except Exception as e: - logger.error(f"Error processing the {i+1}-th GFF file {gff_file}: {str(e)}") + logger.error(f"Error processing the {i + 1}-th GFF file {gff_file}: {str(e)}") continue # Convert the list of dictionaries into a DataFrame combined_df = pd.DataFrame(collected_data) # Save the DataFrame to a TSV file -combined_df.to_csv('collected_quast.tsv', sep='\t', index=False) \ No newline at end of file +combined_df.to_csv("collected_quast.tsv", sep="\t", index=False) diff --git a/bin/rbh_mmseqs_filter.py b/bin/rbh_mmseqs_filter.py index 95436164..419c3499 100755 --- a/bin/rbh_mmseqs_filter.py +++ b/bin/rbh_mmseqs_filter.py @@ -2,11 +2,12 @@ import pandas as pd import argparse + def find_rbh(forward_file, reverse_file, output_file): # Load the forward and reverse search results - forward_df = pd.read_csv(forward_file, sep='\t', header=None) - reverse_df = pd.read_csv(reverse_file, sep='\t', header=None) - + forward_df = pd.read_csv(forward_file, sep="\t", header=None) + reverse_df = pd.read_csv(reverse_file, sep="\t", header=None) + # Assuming the columns are [query, target, bitscore,...], adjust if your format is different # Map reverse hits for easy lookup reverse_hits = {row[1]: row[0] for index, row in reverse_df.iterrows()} @@ -23,15 +24,33 @@ def find_rbh(forward_file, reverse_file, output_file): rbh_df = pd.DataFrame(rbh) if not rbh_df.empty: # Save the RBH to an output file - rbh_df.to_csv(output_file, sep='\t', header=False, index=False) + rbh_df.to_csv(output_file, sep="\t", header=False, index=False) else: print("No reciprocal best hits found.") + if __name__ == "__main__": - parser = argparse.ArgumentParser(description="Filter Reciprocal Best Hits (RBH) from forward and reverse MMseqs2 search results.") - parser.add_argument('--forward', type=str, required=True, help='File path to forward search results.') - parser.add_argument('--reverse', type=str, required=True, help='File path to reverse search results.') - parser.add_argument('--output', type=str, required=True, help='Output file path for combined RBH results.') + parser = argparse.ArgumentParser( + description="Filter Reciprocal Best Hits (RBH) from forward and reverse MMseqs2 search results." + ) + parser.add_argument( + "--forward", + type=str, + required=True, + help="File path to forward search results.", + ) + parser.add_argument( + "--reverse", + type=str, + required=True, + help="File path to reverse search results.", + ) + parser.add_argument( + "--output", + type=str, + required=True, + help="Output file path for combined RBH results.", + ) args = parser.parse_args() find_rbh(args.forward, args.reverse, args.output) diff --git a/bin/rename_headers.py b/bin/rename_headers.py index e14432ae..736a1b2c 100755 --- a/bin/rename_headers.py +++ b/bin/rename_headers.py @@ -10,4 +10,4 @@ if line.startswith(">"): fout.write(f">{prefix}_{line[1:]}") else: - fout.write(line) \ No newline at end of file + fout.write(line) diff --git a/bin/sql_add_descriptions.py b/bin/sql_add_descriptions.py index 48f811ab..6c568fde 100755 --- a/bin/sql_add_descriptions.py +++ b/bin/sql_add_descriptions.py @@ -5,64 +5,83 @@ from concurrent.futures import ThreadPoolExecutor import argparse + def fetch_descriptions(chunk, db_name, db_file): # Function to fetch descriptions based on IDs from the specified table table_name = f"{db_name}_description" ids_column = "id" descriptions_column = "description" - + # Establish connection to SQLite database conn = sqlite3.connect(db_file) - + # Adjust the column name to match the hits CSV file and process dbcan_id values if needed hits_ids_column = f"{db_name}_id" if db_name == "dbcan": chunk[hits_ids_column] = chunk[hits_ids_column].str.replace(".hmm", "") ids = chunk[hits_ids_column].unique() - + # Construct the query based on the database name query = f"SELECT {ids_column}, {descriptions_column} FROM {table_name} WHERE {ids_column} IN ({','.join(['?'] * len(ids))})" if db_name == "dbcan": query = f"SELECT {ids_column}, {descriptions_column}, ec FROM {table_name} WHERE {ids_column} IN ({','.join(['?'] * len(ids))})" - + cursor = conn.cursor() cursor.execute(query, ids) results = cursor.fetchall() - + # Update chunk with descriptions and process according to the database type if db_name == "dbcan": # For dbcan, also fetch and format EC numbers descriptions_dict = {row[0]: (row[1], row[2]) for row in results} - chunk[f"{db_name}_description"] = chunk[hits_ids_column].map(lambda x: descriptions_dict.get(x, ("", ""))[0]) - chunk["dbcan_EC"] = chunk[hits_ids_column].map(lambda x: format_dbcan_EC(descriptions_dict.get(x, ("", ""))[1])) + chunk[f"{db_name}_description"] = chunk[hits_ids_column].map( + lambda x: descriptions_dict.get(x, ("", ""))[0] + ) + chunk["dbcan_EC"] = chunk[hits_ids_column].map( + lambda x: format_dbcan_EC(descriptions_dict.get(x, ("", ""))[1]) + ) elif db_name == "kegg": # For other databases, just update with descriptions descriptions_dict = {row[0]: row[1] for row in results} - chunk[f"{db_name}_description"] = chunk[hits_ids_column].map(lambda x: descriptions_dict.get(x, "")) - chunk["kegg_orthology"] = chunk[f"{db_name}_description"].apply(extract_kegg_orthology) + chunk[f"{db_name}_description"] = chunk[hits_ids_column].map( + lambda x: descriptions_dict.get(x, "") + ) + chunk["kegg_orthology"] = chunk[f"{db_name}_description"].apply( + extract_kegg_orthology + ) chunk["kegg_EC"] = chunk[f"{db_name}_description"].apply(extract_kegg_EC) - + # Ensure the 'kegg_id' column exists if your logic does not create it earlier - if 'kegg_id' not in chunk.columns: - chunk['kegg_id'] = '' # or any default logic you have for generating 'kegg_id' + if "kegg_id" not in chunk.columns: + chunk["kegg_id"] = ( + "" # or any default logic you have for generating 'kegg_id' + ) # Rename 'kegg_id' to 'kegg_gene_name' chunk.rename(columns={"kegg_id": "kegg_gene_name"}, inplace=True) - + # After extracting for kegg, rename "kegg_orthology" to "kegg_id" chunk.rename(columns={"kegg_orthology": "kegg_id"}, inplace=True) elif db_name == "merops": descriptions_dict = {row[0]: row[1] for row in results} - chunk[f"{db_name}_description"] = chunk[hits_ids_column].map(lambda x: descriptions_dict.get(x, "")) - chunk[f"{db_name}_family"] = chunk[f"{db_name}_description"].str.findall(r"#(\w*.)#").apply(lambda x: ';'.join(x)) + chunk[f"{db_name}_description"] = chunk[hits_ids_column].map( + lambda x: descriptions_dict.get(x, "") + ) + chunk[f"{db_name}_family"] = ( + chunk[f"{db_name}_description"] + .str.findall(r"#(\w*.)#") + .apply(lambda x: ";".join(x)) + ) else: descriptions_dict = {row[0]: row[1] for row in results} - chunk[f"{db_name}_description"] = chunk[hits_ids_column].map(lambda x: descriptions_dict.get(x, "")) + chunk[f"{db_name}_description"] = chunk[hits_ids_column].map( + lambda x: descriptions_dict.get(x, "") + ) - conn.close() return chunk + def extract_kegg_orthology(description): # Extract KO from the description if "(K" in description: @@ -73,33 +92,50 @@ def extract_kegg_orthology(description): else: return None + def format_dbcan_EC(ec_string): # Format EC numbers from the dbcan ec column with "EC:" prefix and semicolon separation if ec_string: - ec_numbers = ec_string.split(',') # Split the EC numbers string - formatted_ec_numbers = '; '.join([f"EC:{ec}" for ec in ec_numbers if ec]) # Add "EC:" prefix and join with semicolon + ec_numbers = ec_string.split(",") # Split the EC numbers string + formatted_ec_numbers = "; ".join( + [f"EC:{ec}" for ec in ec_numbers if ec] + ) # Add "EC:" prefix and join with semicolon return formatted_ec_numbers else: return "" + def extract_kegg_EC(description): # TODO this could be optimized into one regex with groups I am pretty sure # Extract and format EC numbers from the description with "EC:" prefix and semicolon separation ec_start = description.find("[EC:") if ec_start != -1: ec_end = description.find("]", ec_start) - ec_text = description[ec_start + 4:ec_end] # Skip the "[EC:" part - ec_numbers = re.findall(r'\b\d+\.\d+\.\d+\.\d+\b', ec_text) # Extract EC numbers using regex - formatted_ec_numbers = '; '.join([f"EC:{ec}" for ec in ec_numbers]) # Add "EC:" prefix and join with semicolon + ec_text = description[ec_start + 4 : ec_end] # Skip the "[EC:" part + ec_numbers = re.findall( + r"\b\d+\.\d+\.\d+\.\d+\b", ec_text + ) # Extract EC numbers using regex + formatted_ec_numbers = "; ".join( + [f"EC:{ec}" for ec in ec_numbers] + ) # Add "EC:" prefix and join with semicolon return formatted_ec_numbers else: return None + def main(): - parser = argparse.ArgumentParser(description="Add descriptions from SQL database to hits file") + parser = argparse.ArgumentParser( + description="Add descriptions from SQL database to hits file" + ) parser.add_argument("--hits_csv", type=str, help="Path to the hits CSV file") - parser.add_argument("--db_name", type=str, help="Name of the database table to fetch descriptions from") - parser.add_argument("--output", type=str, help="Path to the output formatted CSV file") + parser.add_argument( + "--db_name", + type=str, + help="Name of the database table to fetch descriptions from", + ) + parser.add_argument( + "--output", type=str, help="Path to the output formatted CSV file" + ) parser.add_argument("--db_file", type=str, help="Path to the SQLite database file") args = parser.parse_args() @@ -110,12 +146,15 @@ def main(): chunksize = max(1, min(10000, num_lines // 10)) # Adjust as needed, minimum 1 chunk # Read CSV file in chunks - reader = pd.read_csv(args.hits_csv, delimiter=',', chunksize=chunksize) + reader = pd.read_csv(args.hits_csv, delimiter=",", chunksize=chunksize) # Process chunks with ThreadPoolExecutor() as executor: # Convert reader to list before passing to executor.map - processed_chunks = executor.map(lambda chunk: fetch_descriptions(chunk, args.db_name, args.db_file), list(reader)) + processed_chunks = executor.map( + lambda chunk: fetch_descriptions(chunk, args.db_name, args.db_file), + list(reader), + ) # Concatenate processed chunks into a single DataFrame df = pd.concat(processed_chunks, ignore_index=True) @@ -123,5 +162,6 @@ def main(): # Write updated DataFrame to new CSV file df.to_csv(args.output, index=False) + if __name__ == "__main__": - main() \ No newline at end of file + main() diff --git a/bin/trna_collect.py b/bin/trna_collect.py index 23f3cf58..ee83e554 100755 --- a/bin/trna_collect.py +++ b/bin/trna_collect.py @@ -4,11 +4,11 @@ import pandas as pd from pathlib import Path -FASTA_COLUMN = os.getenv('FASTA_COLUMN', 'input_fasta') +FASTA_COLUMN = os.getenv("FASTA_COLUMN", "input_fasta") -df = pd.read_csv(Path("raw_trna_scan.tsv").resolve(), sep='\t') +df = pd.read_csv(Path("raw_trna_scan.tsv").resolve(), sep="\t") -gene_col="gene_id" +gene_col = "gene_id" df = df[[FASTA_COLUMN, gene_col]].copy() counts = pd.crosstab(df[gene_col], df[FASTA_COLUMN], dropna=False).astype("int64") counts.columns.name = None diff --git a/bin/update_annots_trees.py b/bin/update_annots_trees.py index 6ebff2ad..62618e75 100755 --- a/bin/update_annots_trees.py +++ b/bin/update_annots_trees.py @@ -6,17 +6,20 @@ from Bio import Phylo from io import StringIO + def load_jplace_file(jplace_path): - with open(jplace_path, 'r') as file: + with open(jplace_path, "r") as file: jplace_data = json.load(file) return jplace_data + def load_and_parse_tree(tree_data): - tree_data = re.sub(r'\{(\d+)\}', r'[&edge=\g<1>]', tree_data) + tree_data = re.sub(r"\{(\d+)\}", r"[&edge=\g<1>]", tree_data) handle = StringIO(tree_data) tree = Phylo.read(handle, "newick") return tree + def find_closest_labeled_ancestor(clade, tree): if clade.is_terminal() and clade.name: return clade.name @@ -24,7 +27,7 @@ def find_closest_labeled_ancestor(clade, tree): for ancestor in reversed(path): if ancestor.is_terminal() and ancestor.name: return ancestor.name - min_distance = float('inf') + min_distance = float("inf") closest_leaf = None for leaf in tree.get_terminals(): distance = tree.distance(clade, leaf) @@ -33,15 +36,17 @@ def find_closest_labeled_ancestor(clade, tree): closest_leaf = leaf.name return closest_leaf if closest_leaf else "" + def load_tree_mapping(mapping_tsv): - df = pd.read_csv(mapping_tsv, sep='\t') - return dict(zip(df['gene'], df['call'])) + df = pd.read_csv(mapping_tsv, sep="\t") + return dict(zip(df["gene"], df["call"])) + def extract_placement_details(jplace_data, tree, tree_mapping): - placements = jplace_data['placements'] + placements = jplace_data["placements"] placement_map = {} for placement in placements: - for placement_detail in placement['p']: + for placement_detail in placement["p"]: edge_num = placement_detail[1] clades = list(tree.find_clades({"comment": f"&edge={edge_num}"})) if clades: @@ -53,32 +58,39 @@ def extract_placement_details(jplace_data, tree, tree_mapping): closest_leaf = f"No mapping found;{closest_leaf}" else: closest_leaf = f"Clade not found;{edge_num}" - for name, _ in placement['nm']: + for name, _ in placement["nm"]: placement_map[name] = closest_leaf return placement_map + def update_tsv(tsv_path, output_tsv_path, placement_map): - df = pd.read_csv(tsv_path, sep='\t') - df['tree_verified'] = df['query_id'].map(placement_map).fillna('') + df = pd.read_csv(tsv_path, sep="\t") + df["tree_verified"] = df["query_id"].map(placement_map).fillna("") # Reorder columns to place 'tree_verified' after 'gene_number' - col_order_start = df.columns.tolist()[:df.columns.get_loc('gene_number')+1] + ['tree_verified'] + col_order_start = df.columns.tolist()[: df.columns.get_loc("gene_number") + 1] + [ + "tree_verified" + ] col_order_end = [col for col in df.columns if col not in col_order_start] df = df[col_order_start + col_order_end] - df.to_csv(output_tsv_path, sep='\t', index=False) + df.to_csv(output_tsv_path, sep="\t", index=False) + def main(): if len(sys.argv) != 5: - print("Usage: python update_annots_trees.py ") + print( + "Usage: python update_annots_trees.py " + ) sys.exit(1) jplace_path, tsv_path, mapping_tsv, output_tsv_path = sys.argv[1:] jplace_data = load_jplace_file(jplace_path) - tree = load_and_parse_tree(jplace_data['tree']) + tree = load_and_parse_tree(jplace_data["tree"]) tree_mapping = load_tree_mapping(mapping_tsv) placement_map = extract_placement_details(jplace_data, tree, tree_mapping) update_tsv(tsv_path, output_tsv_path, placement_map) + if __name__ == "__main__": main() diff --git a/bin/update_tree.py b/bin/update_tree.py index 9bc228ef..c0852a48 100755 --- a/bin/update_tree.py +++ b/bin/update_tree.py @@ -1,40 +1,44 @@ #!/usr/bin/env python import json -import xml.etree.ElementTree as ET -import re -from collections import defaultdict -import sys -from ete3 import Tree, Phyloxml +from ete3 import Tree + def parse_jplace(jplace_path): - with open(jplace_path, 'r') as file: + with open(jplace_path, "r") as file: jplace_data = json.load(file) - return jplace_data['tree'], jplace_data['placements'] + return jplace_data["tree"], jplace_data["placements"] + def add_placements_to_tree(tree_newick, placements): # Load the tree tree = Tree(tree_newick, format=1) - + # Add placements for placement in placements: - for p in placement['p']: + for p in placement["p"]: edge_num = p[1] - name = placement['nm'][0][0] + name = placement["nm"][0][0] edge = tree.search_nodes(name=str(edge_num)) if edge: new_clade = Tree(name=name, dist=0.0) edge[0].add_child(new_clade) - + return tree + def save_tree_as_phyloxml(tree, output_path): phyloxml = tree.write(format=5) - with open(output_path, 'w') as file: + with open(output_path, "w") as file: file.write(phyloxml) + def main(): - jplace_path = 'aligned_sequences.jplace' # Replace with the actual path if different - output_xml_path = 'aligned_sequences_updated.xml' # Replace with the actual path if different + jplace_path = ( + "aligned_sequences.jplace" # Replace with the actual path if different + ) + output_xml_path = ( + "aligned_sequences_updated.xml" # Replace with the actual path if different + ) # Parse the jplace file tree_newick, placements = parse_jplace(jplace_path) @@ -45,5 +49,6 @@ def main(): # Save the tree in phyloXML format save_tree_as_phyloxml(tree, output_xml_path) + if __name__ == "__main__": main() diff --git a/bin/utils/__init__.py b/bin/utils/__init__.py index e69de29b..4265cc3e 100755 --- a/bin/utils/__init__.py +++ b/bin/utils/__init__.py @@ -0,0 +1 @@ +#!/usr/bin/env python diff --git a/bin/utils/click_utils.py b/bin/utils/click_utils.py index d23835bc..e563647e 100755 --- a/bin/utils/click_utils.py +++ b/bin/utils/click_utils.py @@ -1,3 +1,4 @@ +#!/usr/bin/env python def validate_comma_separated(ctx, param, value, split=(",", " ")): if not value: return [] @@ -10,4 +11,3 @@ def validate_comma_separated(ctx, param, value, split=(",", " ")): for s in split: value = value.replace(s, ",") return [val.strip() for val in value.split(",")] - \ No newline at end of file diff --git a/bin/utils/excel.py b/bin/utils/excel.py index b7b3a73e..5faf4017 100755 --- a/bin/utils/excel.py +++ b/bin/utils/excel.py @@ -1,3 +1,4 @@ +#!/usr/bin/env python from typing import Iterable, TypeAlias import polars as pl @@ -14,22 +15,18 @@ def write_summarized_genomes_to_xlsx( output_file: PathLike, group_by: Columns, sort_order_columns: Columns, - extra_frames: Iterable|dict = tuple(), + extra_frames: Iterable | dict = tuple(), ): format_kw = { "autofit": True, - } + } # turn all this into an xlsx with Workbook(output_file) as wb: if df is not None and not df.is_empty(): for sheet, frame in df.group_by(group_by): frame = frame.sort(sort_order_columns) frame = frame.drop(group_by) - frame.write_excel( - workbook=wb, - worksheet=sheet[0], - **format_kw - ) + frame.write_excel(workbook=wb, worksheet=sheet[0], **format_kw) for extra_frame in extra_frames: if extra_frame is None: continue @@ -41,8 +38,4 @@ def write_summarized_genomes_to_xlsx( else: name = str(extra_frame[group_by][0]) if extra_frame is not None and not extra_frame.is_empty(): - extra_frame.write_excel( - workbook=wb, - worksheet=name, - **format_kw - ) + extra_frame.write_excel(workbook=wb, worksheet=name, **format_kw) diff --git a/bin/utils/logger.py b/bin/utils/logger.py index 5fe0b50f..36dce803 100755 --- a/bin/utils/logger.py +++ b/bin/utils/logger.py @@ -1,14 +1,15 @@ #!/usr/bin/env python import logging import os -from pathlib import Path DEFAULT_LOG_LEVEL: int = logging.INFO ROOT_LOGGER_NAME = "dram" -def get_logger(name: str = ROOT_LOGGER_NAME, level: int = DEFAULT_LOG_LEVEL, filename="dram.log") -> logging.Logger: +def get_logger( + name: str = ROOT_LOGGER_NAME, level: int = DEFAULT_LOG_LEVEL, filename="dram.log" +) -> logging.Logger: """Get a logger. To set a human-readable "output_name" that appears in logger outputs, @@ -71,9 +72,11 @@ def build_stream_handler(level: int = DEFAULT_LOG_LEVEL) -> logging.StreamHandle return handler -def build_file_handler(filename: os.PathLike, level: int = DEFAULT_LOG_LEVEL) -> logging.FileHandler: +def build_file_handler( + filename: os.PathLike, level: int = DEFAULT_LOG_LEVEL +) -> logging.FileHandler: handler = logging.FileHandler(filename) handler.setLevel(level=level) formatter = get_formatter() handler.setFormatter(formatter) - return handler \ No newline at end of file + return handler diff --git a/bin/utils/pl_utils.py b/bin/utils/pl_utils.py index 8ac943f2..31d15a60 100755 --- a/bin/utils/pl_utils.py +++ b/bin/utils/pl_utils.py @@ -1,6 +1,10 @@ +#!/usr/bin/env python import polars as pl -def read_csv(path, check_for_null_file=True, seperator="\t", *args, **kwargs) -> pl.DataFrame | None: + +def read_csv( + path, check_for_null_file=True, seperator="\t", *args, **kwargs +) -> pl.DataFrame | None: if path is None: return None df = pl.read_csv(path, separator=seperator, *args, **kwargs) @@ -10,4 +14,3 @@ def read_csv(path, check_for_null_file=True, seperator="\t", *args, **kwargs) -> if df.is_empty(): return None return df - \ No newline at end of file diff --git a/cliff.toml b/cliff.toml index 756ea7cd..b0b6b804 100644 --- a/cliff.toml +++ b/cliff.toml @@ -26,13 +26,17 @@ body = """ ### {{ group | upper_first }} {% for commit in commits %} - {{ commit.message | split(pat="\n") | first | upper_first | trim }} ([{{ commit.id | truncate(length=7, end="") }}](https://github.com/WrightonLabCSU/DRAM/commit/{{ commit.id }}))\ + {% if commit.body %}\ \n - {{ commit.body }}\ + {{ commit.body | indent(prefix=" ", first=true) }}\ + {% endif %}\ {% if commit.footers %}\ {% for footer in commit.footers -%} + \n , {{ footer.token }}{{ footer.separator }}{{ footer.value }}\ {% endfor %}\ {% endif %}\ + \n {% endfor %} {% endfor %}\n """ diff --git a/conf/constants.config b/conf/constants.config index 9207d255..95ae6baa 100644 --- a/conf/constants.config +++ b/conf/constants.config @@ -2,4 +2,4 @@ params { CONSTANTS { FASTA_COLUMN = "input_fasta" } -} \ No newline at end of file +} diff --git a/conf/modules.config b/conf/modules.config index 470e029c..69e7a8dd 100644 --- a/conf/modules.config +++ b/conf/modules.config @@ -221,10 +221,4 @@ process { mode: 'copy', ] } - withName: TREES { - publishDir = [ - path: "${params.outdir}/VISUALIZE", - mode: 'copy', - ] - } } diff --git a/containers/DRAM2-Nextflow-Main-Container-Aug162024-V1 b/containers/DRAM2-Nextflow-Main-Container-Aug162024-V1 deleted file mode 100644 index 48aea61f..00000000 --- a/containers/DRAM2-Nextflow-Main-Container-Aug162024-V1 +++ /dev/null @@ -1,85 +0,0 @@ -Bootstrap: docker -From: ubuntu:22.04 - -%labels - Maintainer Your Name reedwoyda@gmail.com - -%environment - # Set environment variables, if needed - export KMP_DUPLICATE_LIB_OK=TRUE - export PATH="/opt/miniconda/bin:$PATH" - -%files - ../assets/bbmap /opt - ../assets/conda/environment.yml /opt - -%post - chmod 777 /opt - chmod 777 /opt/* - export TZ='America/Denver' - export DEBIAN_FRONTEND=noninteractive - - # Update the package index and install required dependencies - apt-get update && apt-get install -y \ - wget \ - bzip2 \ - python3-pip \ - git \ - pigz \ - openjdk-11-jre \ - r-base-core \ - build-essential - - # Export filetype - export LC_CTYPE=en_US.UTF-8 - export LC_ALL=en_US.UTF-8 - - # Install required R packages - R --slave -e 'install.packages("tidyverse", repos="https://cloud.r-project.org/")' - - # Download and install Miniconda - wget https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh - bash Miniconda3-latest-Linux-x86_64.sh -b -p /opt/miniconda - export PATH="/opt/miniconda/bin:$PATH" - - # Add conda channels - conda config --add channels anaconda - conda config --add channels conda-forge - conda config --add channels defaults - conda config --add channels bioconda - conda config --add channels agbiome - conda config --add channels r - conda update -n base -c defaults conda - - # Install conda packages - conda install -c bioconda prodigal=2.6.3 - conda install python=3.10 - conda install pandas=1.5.2 - conda install pytest=7.2.0 - conda install scikit-bio=0.5.7 - conda install mmseqs2==15.6f452 - conda install hmmer=3.3.2 - conda install scipy=1.8.1 - conda install sqlalchemy=1.4.46 - conda install barrnap=0.9 - conda install altair=4.2.0 - conda install openpyxl=3.0.10 - conda install networkx=2.8.8 - conda install ruby=3.1.2 - conda install parallel=20221122 - conda install trnascan-se=2.0.12 - conda install -c conda-forge biopython=1.83 - conda install numpy=1.26.4 - conda install samtools=1.17 -y - conda install bowtie2=2.5.1 -y - conda install -c conda-forge ncurses - conda install -c bioconda quast=5.2.0 - python -m pip install -U matplotlib - conda install matplotlib - conda install bbtools - - # Export miniconda bin just to be safe - export PATH="/opt/miniconda/bin:$PATH" - - # Clean up - apt-get clean diff --git a/containers/DRAM2-Nextflow-Main-Container-June282024-V5 b/containers/DRAM2-Nextflow-Main-Container-June282024-V5 deleted file mode 100644 index f1a8eaee..00000000 --- a/containers/DRAM2-Nextflow-Main-Container-June282024-V5 +++ /dev/null @@ -1,87 +0,0 @@ -Bootstrap: docker -From: ubuntu:22.04 - -%labels - Maintainer Your Name reedwoyda@gmail.com - -%environment - # Set environment variables, if needed - export KMP_DUPLICATE_LIB_OK=TRUE - export PATH="/opt/miniconda/bin:$PATH" - -%files - ../assets/bbmap /opt - ../assets/conda/environment.yml /opt - -%post - chmod 777 /opt - chmod 777 /opt/* - export TZ='America/Denver' - export DEBIAN_FRONTEND=noninteractive - - # Update the package index and install required dependencies - apt-get update && apt-get install -y \ - wget \ - bzip2 \ - python3-pip \ - git \ - pigz \ - openjdk-11-jre \ - r-base-core \ - build-essential - - # Export filetype - export LC_CTYPE=en_US.UTF-8 - export LC_ALL=en_US.UTF-8 - - # Install required R packages - R --slave -e 'install.packages("tidyverse", repos="https://cloud.r-project.org/")' - - # Download and install Miniconda - wget https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh - bash Miniconda3-latest-Linux-x86_64.sh -b -p /opt/miniconda - export PATH="/opt/miniconda/bin:$PATH" - - # Add conda channels - conda config --add channels anaconda - conda config --add channels conda-forge - conda config --add channels defaults - conda config --add channels bioconda - conda config --add channels agbiome - conda config --add channels r - conda update -n base -c defaults conda - - # Install conda packages - conda install -c bioconda prodigal=2.6.3 - conda install python=3.10 - conda install pandas=1.5.2 - conda install pytest=7.2.0 - conda install scikit-bio=0.5.7 - conda install mmseqs2==15.6f452 - conda install hmmer=3.3.2 - conda install scipy=1.8.1 - conda install sqlalchemy=1.4.46 - conda install barrnap=0.9 - conda install altair=4.2.0 - conda install openpyxl=3.0.10 - conda install networkx=2.8.8 - conda install ruby=3.1.2 - conda install parallel=20221122 - conda install trnascan-se=2.0.12 - conda install -c conda-forge biopython=1.83 - conda install numpy=1.26.4 - conda install panel=1.3.8 - conda install bokeh=3.* - conda install samtools=1.17 -y - conda install bowtie2=2.5.1 -y - conda install -c conda-forge ncurses - conda install -c bioconda quast=5.2.0 - python -m pip install -U matplotlib - conda install matplotlib - conda install bbtools - - # Export miniconda bin just to be safe - export PATH="/opt/miniconda/bin:$PATH" - - # Clean up - apt-get clean diff --git a/containers/DRAM2-Nextflow-Main-Container-March112024-V3 b/containers/DRAM2-Nextflow-Main-Container-March112024-V3 deleted file mode 100644 index 809bd46e..00000000 --- a/containers/DRAM2-Nextflow-Main-Container-March112024-V3 +++ /dev/null @@ -1,94 +0,0 @@ -Bootstrap: docker -From: ubuntu:22.04 - -%labels - Maintainer Your Name reedwoyda@gmail.com - -%environment - # Set environment variables, if needed - export PATH="/opt/miniconda/bin:$PATH" - -%files - - ../assets/bbmap /opt - -%post - chmod 777 /opt - chmod 777 /opt/* - export TZ='America/Denver' - export DEBIAN_FRONTEND=noninteractive - - - # Update the package index and install required dependencies - apt-get update && apt-get install -y \ - wget \ - bzip2 \ - python3-pip \ - git \ - pigz \ - openjdk-11-jre \ - r-base-core \ - build-essential - - # Export filetype - export LC_CTYPE=en_US.UTF-8 - export LC_ALL=en_US.UTF-8 - - - # Install required R packages - R --slave -e 'install.packages("tidyverse", repos="https://cloud.r-project.org/")' - - # Download and install Miniconda - wget https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh - bash Miniconda3-latest-Linux-x86_64.sh -b -p /opt/miniconda - export PATH="/opt/miniconda/bin:$PATH" - - # Add conda channels - conda config --add channels anaconda - conda config --add channels conda-forge - conda config --add channels defaults - conda config --add channels bioconda - conda config --add channels r - conda update -n base -c defaults conda - - conda install -c bioconda prodigal=2.6.3 - - conda install python=3.10 - conda install pandas=1.5.2 - conda install pytest=7.2.0 - conda install scikit-bio=0.5.7 - conda install mmseqs2==15.6f452 - conda install hmmer=3.3.2 - conda install scipy=1.8.1 - conda install sqlalchemy=1.4.46 - conda install barrnap=0.9 - conda install altair=4.2.0 - conda install openpyxl=3.0.10 - conda install networkx=2.8.8 - conda install ruby=3.1.2 - conda install parallel=20221122 - conda install trnascan-se=2.0.12 - conda install -c conda-forge biopython=1.83 - - # Commented out if conda install into base does not work - #conda create -n trnascan python=3.10 -y - #conda install -n trnascan bioconda::trnascan-se=2.0.12 - - # Conda Env with python 3.10 for samtools and bowtie - conda create -n support python=3.10 -y - - conda install -n support samtools=1.17 -y - - conda install -n support bowtie2=2.5.1 -y - - conda install -n support -c conda-forge ncurses - - conda install -n support -c bioconda quast=5.2.0 - - # Export miniconda bin just to be safe - export PATH="/opt/miniconda/bin:$PATH" - - # Clean up - apt-get clean - - diff --git a/containers/DRAM2-Nextflow-Main-Container-March112024-V4 b/containers/DRAM2-Nextflow-Main-Container-March112024-V4 deleted file mode 100644 index c91ebdce..00000000 --- a/containers/DRAM2-Nextflow-Main-Container-March112024-V4 +++ /dev/null @@ -1,98 +0,0 @@ -Bootstrap: docker -From: ubuntu:22.04 - -%labels - Maintainer Your Name reedwoyda@gmail.com - -%environment - # Set environment variables, if needed - export PATH="/opt/miniconda/bin:$PATH" - -%files - - ../assets/bbmap /opt - ../assets/conda/environment.yml /opt - -%post - chmod 777 /opt - chmod 777 /opt/* - export TZ='America/Denver' - export DEBIAN_FRONTEND=noninteractive - - - # Update the package index and install required dependencies - apt-get update && apt-get install -y \ - wget \ - bzip2 \ - python3-pip \ - git \ - pigz \ - openjdk-11-jre \ - r-base-core \ - build-essential - - # Export filetype - export LC_CTYPE=en_US.UTF-8 - export LC_ALL=en_US.UTF-8 - - - # Install required R packages - R --slave -e 'install.packages("tidyverse", repos="https://cloud.r-project.org/")' - - # Download and install Miniconda - wget https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh - bash Miniconda3-latest-Linux-x86_64.sh -b -p /opt/miniconda - export PATH="/opt/miniconda/bin:$PATH" - - # Add conda channels - conda config --add channels anaconda - conda config --add channels conda-forge - conda config --add channels defaults - conda config --add channels bioconda - conda config --add channels agbiome - conda config --add channels r - conda update -n base -c defaults conda - - conda install -c bioconda prodigal=2.6.3 - - conda install python=3.10 - conda install pandas=1.5.2 - conda install pytest=7.2.0 - conda install scikit-bio=0.5.7 - conda install mmseqs2==15.6f452 - conda install hmmer=3.3.2 - conda install scipy=1.8.1 - conda install sqlalchemy=1.4.46 - conda install barrnap=0.9 - conda install altair=4.2.0 - conda install openpyxl=3.0.10 - conda install networkx=2.8.8 - conda install ruby=3.1.2 - conda install parallel=20221122 - conda install trnascan-se=2.0.12 - conda install -c conda-forge biopython=1.83 - - - conda install samtools=1.17 -y - - conda install bowtie2=2.5.1 -y - - conda install -c conda-forge ncurses - - conda install -c bioconda quast=5.2.0 - - python -m pip install -U matplotlib - - conda install matplotlib - - conda install bbtools - - conda create conda env create -f environment.yml - - # Export miniconda bin just to be safe - export PATH="/opt/miniconda/bin:$PATH" - - # Clean up - apt-get clean - - diff --git a/containers/DRAM2-Nextflow-Main-Container-March252024-V4 b/containers/DRAM2-Nextflow-Main-Container-March252024-V4 deleted file mode 100644 index f1a8eaee..00000000 --- a/containers/DRAM2-Nextflow-Main-Container-March252024-V4 +++ /dev/null @@ -1,87 +0,0 @@ -Bootstrap: docker -From: ubuntu:22.04 - -%labels - Maintainer Your Name reedwoyda@gmail.com - -%environment - # Set environment variables, if needed - export KMP_DUPLICATE_LIB_OK=TRUE - export PATH="/opt/miniconda/bin:$PATH" - -%files - ../assets/bbmap /opt - ../assets/conda/environment.yml /opt - -%post - chmod 777 /opt - chmod 777 /opt/* - export TZ='America/Denver' - export DEBIAN_FRONTEND=noninteractive - - # Update the package index and install required dependencies - apt-get update && apt-get install -y \ - wget \ - bzip2 \ - python3-pip \ - git \ - pigz \ - openjdk-11-jre \ - r-base-core \ - build-essential - - # Export filetype - export LC_CTYPE=en_US.UTF-8 - export LC_ALL=en_US.UTF-8 - - # Install required R packages - R --slave -e 'install.packages("tidyverse", repos="https://cloud.r-project.org/")' - - # Download and install Miniconda - wget https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh - bash Miniconda3-latest-Linux-x86_64.sh -b -p /opt/miniconda - export PATH="/opt/miniconda/bin:$PATH" - - # Add conda channels - conda config --add channels anaconda - conda config --add channels conda-forge - conda config --add channels defaults - conda config --add channels bioconda - conda config --add channels agbiome - conda config --add channels r - conda update -n base -c defaults conda - - # Install conda packages - conda install -c bioconda prodigal=2.6.3 - conda install python=3.10 - conda install pandas=1.5.2 - conda install pytest=7.2.0 - conda install scikit-bio=0.5.7 - conda install mmseqs2==15.6f452 - conda install hmmer=3.3.2 - conda install scipy=1.8.1 - conda install sqlalchemy=1.4.46 - conda install barrnap=0.9 - conda install altair=4.2.0 - conda install openpyxl=3.0.10 - conda install networkx=2.8.8 - conda install ruby=3.1.2 - conda install parallel=20221122 - conda install trnascan-se=2.0.12 - conda install -c conda-forge biopython=1.83 - conda install numpy=1.26.4 - conda install panel=1.3.8 - conda install bokeh=3.* - conda install samtools=1.17 -y - conda install bowtie2=2.5.1 -y - conda install -c conda-forge ncurses - conda install -c bioconda quast=5.2.0 - python -m pip install -U matplotlib - conda install matplotlib - conda install bbtools - - # Export miniconda bin just to be safe - export PATH="/opt/miniconda/bin:$PATH" - - # Clean up - apt-get clean diff --git a/containers/DRAM2-Nextflow-Main-Container-March262024-V5 b/containers/DRAM2-Nextflow-Main-Container-March262024-V5 deleted file mode 100644 index ce0189dd..00000000 --- a/containers/DRAM2-Nextflow-Main-Container-March262024-V5 +++ /dev/null @@ -1,100 +0,0 @@ -Bootstrap: docker -From: ubuntu:22.04 - -%labels - Maintainer Your Name reedwoyda@gmail.com - -%environment - # Set environment variables, if needed - export PATH="/opt/miniconda/bin:$PATH" - -%files - - ../assets/bbmap /opt - ../assets/conda/environment.yml /opt - -%post - chmod 777 /opt - chmod 777 /opt/* - export TZ='America/Denver' - export DEBIAN_FRONTEND=noninteractive - - - # Update the package index and install required dependencies - apt-get update && apt-get install -y \ - wget \ - bzip2 \ - python3-pip \ - git \ - pigz \ - openjdk-11-jre \ - r-base-core \ - build-essential - - # Export filetype - export LC_CTYPE=en_US.UTF-8 - export LC_ALL=en_US.UTF-8 - - - # Install required R packages - R --slave -e 'install.packages("tidyverse", repos="https://cloud.r-project.org/")' - - # Download and install Miniconda - wget https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh - bash Miniconda3-latest-Linux-x86_64.sh -b -p /opt/miniconda - export PATH="/opt/miniconda/bin:$PATH" - - # Add conda channels - conda config --add channels anaconda - conda config --add channels conda-forge - conda config --add channels defaults - conda config --add channels bioconda - conda config --add channels agbiome - conda config --add channels r - conda update -n base -c defaults conda - - conda install -c bioconda prodigal=2.6.3 - - conda install python=3.10 - conda install pandas=1.5.2 - conda install pytest=7.2.0 - conda install scikit-bio=0.5.7 - conda install mmseqs2==15.6f452 - conda install hmmer=3.3.2 - conda install scipy=1.8.1 - conda install sqlalchemy=1.4.46 - conda install barrnap=0.9 - conda install altair=4.2.0 - conda install openpyxl=3.0.10 - conda install networkx=2.8.8 - conda install ruby=3.1.2 - conda install parallel=20221122 - conda install trnascan-se=2.0.12 - conda install -c conda-forge biopython=1.83 - - conda install numpy=1.26.4 - conda install panel=1.3.8 - conda install bokeh=3.* - - conda install samtools=1.17 -y - - conda install bowtie2=2.5.1 -y - - conda install -c conda-forge ncurses - - conda install -c bioconda quast=5.2.0 - - python -m pip install -U matplotlib - - conda install matplotlib - - conda install bbtools - - - # Export miniconda bin just to be safe - export PATH="/opt/miniconda/bin:$PATH" - - # Clean up - apt-get clean - - diff --git a/containers/DRAM2-Nextflow-Main-Container-March262024-V6 b/containers/DRAM2-Nextflow-Main-Container-March262024-V6 deleted file mode 100644 index 0b44d5d9..00000000 --- a/containers/DRAM2-Nextflow-Main-Container-March262024-V6 +++ /dev/null @@ -1,114 +0,0 @@ -Bootstrap: docker -From: ubuntu:22.04 - -%labels - Maintainer Your Name reedwoyda@gmail.com - -%environment - # Set environment variables, if needed - export PATH="/opt/miniconda/bin:$PATH" - -%files - - ../assets/bbmap /opt - ../assets/conda/environment.yml /opt - -%post - chmod 777 /opt - chmod 777 /opt/* - export TZ='America/Denver' - export DEBIAN_FRONTEND=noninteractive - - - # Update the package index and install required dependencies - apt-get update && apt-get install -y \ - wget \ - bzip2 \ - python3-pip \ - git \ - pigz \ - openjdk-11-jre \ - r-base-core \ - build-essential - - # Export filetype - export LC_CTYPE=en_US.UTF-8 - export LC_ALL=en_US.UTF-8 - - - # Install required R packages - R --slave -e 'install.packages("tidyverse", repos="https://cloud.r-project.org/")' - - # Download and install Miniconda - wget https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh - bash Miniconda3-latest-Linux-x86_64.sh -b -p /opt/miniconda - export PATH="/opt/miniconda/bin:$PATH" - - # Add conda channels - conda config --add channels anaconda - conda config --add channels conda-forge - conda config --add channels defaults - conda config --add channels bioconda - conda config --add channels agbiome - conda config --add channels r - conda update -n base -c defaults conda - - conda install -c bioconda prodigal=2.6.3 - - conda install python=3.10 - conda install pip - conda install pandas=1.5.2 - conda install pytest=7.2.0 - conda install scikit-bio=0.5.7 - conda install mmseqs2==15.6f452 - conda install hmmer=3.3.2 - conda install scipy=1.8.1 - conda install sqlalchemy=1.4.46 - conda install barrnap=0.9 - conda install altair=4.2.0 - conda install openpyxl=3.0.10 - conda install networkx=2.8.8 - conda install ruby=3.1.2 - conda install parallel=20221122 - conda install trnascan-se=2.0.12 - conda install -c conda-forge biopython=1.83 - - ## visualization packages - conda install numpy=1.26.4 - conda install panel=1.* - conda install bokeh=3.* - conda install click=8.1.* - - conda install samtools=1.17 -y - - conda install bowtie2=2.5.1 -y - - conda install -c conda-forge ncurses - - conda install -c bioconda quast=5.2.0 - - python -m pip install -U matplotlib - - conda install matplotlib - - conda install pplacer=1.1.alpha19 - - conda install seqtk - - conda install bbmap - - conda install mafft=7.525 - - conda install openpyxl=3.1.2 - - conda install 'networkx>2,<3' - - pip install matplotlib - - - - # Export miniconda bin just to be safe - export PATH="/opt/miniconda/bin:$PATH" - - # Clean up - apt-get clean diff --git a/containers/DRAM2-Nextflow-No-Databases-Nov302023-V1 b/containers/DRAM2-Nextflow-No-Databases-Nov302023-V1 deleted file mode 100644 index 7385a6a3..00000000 --- a/containers/DRAM2-Nextflow-No-Databases-Nov302023-V1 +++ /dev/null @@ -1,90 +0,0 @@ -Bootstrap: docker -From: ubuntu:22.04 - -%labels - Maintainer Your Name reedwoyda@gmail.com - -%environment - # Set environment variables, if needed - export PATH="/opt/miniconda/bin:$PATH" - -%files - - ../assets/bbmap /opt - -%post - chmod 777 /opt - chmod 777 /opt/* - export TZ='America/Denver' - export DEBIAN_FRONTEND=noninteractive - - - # Update the package index and install required dependencies - apt-get update && apt-get install -y \ - wget \ - bzip2 \ - python3-pip \ - git \ - pigz \ - openjdk-11-jre \ - r-base-core \ - build-essential - - # Export filetype - export LC_CTYPE=en_US.UTF-8 - export LC_ALL=en_US.UTF-8 - - - # Install required R packages - R --slave -e 'install.packages("tidyverse", repos="https://cloud.r-project.org/")' - - # Download and install Miniconda - wget https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh - bash Miniconda3-latest-Linux-x86_64.sh -b -p /opt/miniconda - export PATH="/opt/miniconda/bin:$PATH" - - # Add conda channels - conda config --add channels anaconda - conda config --add channels conda-forge - conda config --add channels defaults - conda config --add channels bioconda - conda config --add channels r - conda update -n base -c defaults conda - - conda install -c bioconda prodigal=2.6.3 - - conda install python=3.10 - conda install pandas=1.5.2 - conda install pytest=7.2.0 - conda install scikit-bio=0.5.7 - conda install mmseqs2==14.7e284 - conda install hmmer=3.3.2 - conda install trnascan-se=2.0.11 - conda install scipy=1.8.1 - conda install sqlalchemy=1.4.46 - conda install barrnap=0.9 - conda install altair=4.2.0 - conda install openpyxl=3.0.10 - conda install networkx=2.8.8 - conda install ruby=3.1.2 - conda install parallel=20221122 - - - - # Conda Env with python 3.10 for samtools and bowtie - conda create -n support python=3.10 -y - - conda install -n support samtools=1.17 -y - - conda install -n support bowtie2=2.5.1 -y - - conda install -n support -c conda-forge ncurses - - - # Export miniconda bin just to be safe - export PATH="/opt/miniconda/bin:$PATH" - - # Clean up - apt-get clean - - diff --git a/containers/DRAM2-Nextflow-No-Databases-Nov302023-V2 b/containers/DRAM2-Nextflow-No-Databases-Nov302023-V2 deleted file mode 100644 index 2a3ea18d..00000000 --- a/containers/DRAM2-Nextflow-No-Databases-Nov302023-V2 +++ /dev/null @@ -1,91 +0,0 @@ -Bootstrap: docker -From: ubuntu:22.04 - -%labels - Maintainer Your Name reedwoyda@gmail.com - -%environment - # Set environment variables, if needed - export PATH="/opt/miniconda/bin:$PATH" - -%files - - ../assets/bbmap /opt - -%post - chmod 777 /opt - chmod 777 /opt/* - export TZ='America/Denver' - export DEBIAN_FRONTEND=noninteractive - - - # Update the package index and install required dependencies - apt-get update && apt-get install -y \ - wget \ - bzip2 \ - python3-pip \ - git \ - pigz \ - openjdk-11-jre \ - r-base-core \ - build-essential - - # Export filetype - export LC_CTYPE=en_US.UTF-8 - export LC_ALL=en_US.UTF-8 - - - # Install required R packages - R --slave -e 'install.packages("tidyverse", repos="https://cloud.r-project.org/")' - - # Download and install Miniconda - wget https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh - bash Miniconda3-latest-Linux-x86_64.sh -b -p /opt/miniconda - export PATH="/opt/miniconda/bin:$PATH" - - # Add conda channels - conda config --add channels anaconda - conda config --add channels conda-forge - conda config --add channels defaults - conda config --add channels bioconda - conda config --add channels r - conda update -n base -c defaults conda - - conda install -c bioconda prodigal=2.6.3 - - conda install python=3.10 - conda install pandas=1.5.2 - conda install pytest=7.2.0 - conda install scikit-bio=0.5.7 - conda install mmseqs2==14.7e284 - conda install hmmer=3.3.2 - conda install scipy=1.8.1 - conda install sqlalchemy=1.4.46 - conda install barrnap=0.9 - conda install altair=4.2.0 - conda install openpyxl=3.0.10 - conda install networkx=2.8.8 - conda install ruby=3.1.2 - conda install parallel=20221122 - conda install trnascan-se=2.0.12 - - # Commented out if conda install into base does not work - #conda create -n trnascan python=3.10 -y - #conda install -n trnascan bioconda::trnascan-se=2.0.12 - - # Conda Env with python 3.10 for samtools and bowtie - conda create -n support python=3.10 -y - - conda install -n support samtools=1.17 -y - - conda install -n support bowtie2=2.5.1 -y - - conda install -n support -c conda-forge ncurses - - # Export miniconda bin just to be safe - export PATH="/opt/miniconda/bin:$PATH" - - # Clean up - apt-get clean - - diff --git a/containers/Dockerfile b/containers/Dockerfile deleted file mode 100644 index 1cc423e3..00000000 --- a/containers/Dockerfile +++ /dev/null @@ -1,48 +0,0 @@ -# This Dockerfile is used to build the DRAM container image -# This image references files in the assets directory -# so the Docker build context should be the root of the repository -# The Dockerfile is run from the root of the repository with the following command: -# docker build -t dram- -f containers/Dockerfile . - -# Use miniconda3 as the base image -FROM continuumio/miniconda3 - -# Set environment variables -ENV KMP_DUPLICATE_LIB_OK=TRUE -ENV TZ='America/Denver' -ENV DEBIAN_FRONTEND=noninteractive -ENV LC_CTYPE=en_US.UTF-8 -ENV LC_ALL=en_US.UTF-8 - -# Label the image -LABEL maintainer="" - -# Make the /opt directory and its contents writable -RUN chmod 777 /opt && chmod 777 /opt/* - -# Install required dependencies -RUN apt-get update && apt-get install -y \ - wget \ - bzip2 \ - git \ - pigz \ - openjdk-17-jre \ - r-base-core \ - build-essential - -# Copy necessary files into the image -COPY ../assets/conda/environment.yml /opt/environment.yml - -# Create conda environment -RUN conda update conda \ - && conda env create -f /opt/environment.yml - -# Add conda environment to PATH -ENV PATH /opt/conda/envs/dram-env/bin:$PATH -ENV CONDA_DEFAULT_ENV dram-env - -# Activate conda environment -RUN echo "conda activate dram-env" >> ~/.bashrc - -# Clean up -RUN apt-get clean diff --git a/docs/Makefile b/docs/Makefile index 298ea9e2..51285967 100644 --- a/docs/Makefile +++ b/docs/Makefile @@ -16,4 +16,4 @@ help: # Catch-all target: route all unknown targets to Sphinx using the new # "make mode" option. $(O) is meant as a shortcut for $(SPHINXOPTS). %: Makefile - @$(SPHINXBUILD) -M $@ "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O) \ No newline at end of file + @$(SPHINXBUILD) -M $@ "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O) diff --git a/docs/changelog_include.md b/docs/changelog_include.md index f0d8ff87..d9e79ba6 100644 --- a/docs/changelog_include.md +++ b/docs/changelog_include.md @@ -1,3 +1,3 @@ ```{include} ../CHANGELOG.md -``` \ No newline at end of file +``` diff --git a/docs/conf.py b/docs/conf.py index 5e46ecb7..95f58756 100644 --- a/docs/conf.py +++ b/docs/conf.py @@ -18,14 +18,16 @@ # -- Project information ----------------------------------------------------- -project = u'DRAM' -copyright = u'2025, Rory M Flynn, Kelly C. Wrighton, Mikayla Borton, Reed Woyda, Madeline Scyphers' -author = u'Rory M Flynn, Kelly C. Wrighton, Mikayla Borton, Reed Woyda, Madeline Scyphers' +project = "DRAM" +copyright = "2025, Rory M Flynn, Kelly C. Wrighton, Mikayla Borton, Reed Woyda, Madeline Scyphers" +author = ( + "Rory M Flynn, Kelly C. Wrighton, Mikayla Borton, Reed Woyda, Madeline Scyphers" +) # The short X.Y version -version = u'' +version = "" # The full version, including alpha/beta/rc tags -release = u'' +release = "" # -- General configuration --------------------------------------------------- @@ -37,21 +39,19 @@ # Add any Sphinx extension module names here, as strings. They can be # extensions coming with Sphinx (named 'sphinx.ext.*') or your custom # ones. -extensions = [ - "myst_parser" -] +extensions = ["myst_parser"] # Add any paths that contain templates here, relative to this directory. -templates_path = ['_templates'] +templates_path = ["_templates"] # The suffix(es) of source filenames. # You can specify multiple suffix as a list of string: # # source_suffix = ['.rst', '.md'] -source_suffix = '.md' +source_suffix = ".md" # The master toctree document. -master_doc = 'index' +master_doc = "index" # The language for content autogenerated by Sphinx. Refer to documentation # for a list of supported languages. @@ -63,7 +63,7 @@ # List of patterns, relative to source directory, that match files and # directories to ignore when looking for source files. # This pattern also affects html_static_path and html_extra_path. -exclude_patterns = [u'_build', 'Thumbs.db', '.DS_Store'] +exclude_patterns = ["_build", "Thumbs.db", ".DS_Store"] # The name of the Pygments (syntax highlighting) style to use. pygments_style = None @@ -76,7 +76,7 @@ # # html_theme = 'alabaster' # html_theme = 'sphinx_nefertiti' -html_theme = 'sphinx_rtd_theme' +html_theme = "sphinx_rtd_theme" # Theme options are theme-specific and customize the look and feel of a theme @@ -88,7 +88,7 @@ # Add any paths that contain custom static files (such as style sheets) here, # relative to this directory. They are copied after the builtin static files, # so a file named "default.css" will overwrite the builtin "default.css". -html_static_path = ['_static'] +html_static_path = ["_static"] # html_css_files = ["custom.css"] @@ -106,7 +106,7 @@ # -- Options for HTMLHelp output --------------------------------------------- # Output file base name for HTML help builder. -htmlhelp_basename = 'DRAMdoc' +htmlhelp_basename = "DRAMdoc" # -- Options for LaTeX output ------------------------------------------------ @@ -115,15 +115,12 @@ # The paper size ('letterpaper' or 'a4paper'). # # 'papersize': 'letterpaper', - # The font size ('10pt', '11pt' or '12pt'). # # 'pointsize': '10pt', - # Additional stuff for the LaTeX preamble. # # 'preamble': '', - # Latex figure (float) alignment # # 'figure_align': 'htbp', @@ -133,8 +130,13 @@ # (source start file, target name, title, # author, documentclass [howto, manual, or own class]). latex_documents = [ - (master_doc, 'DRAM.tex', u'DRAM Documentation', - u'Rory M Flynn, Kelly C. Wrighton, Mikayla Borton, Reed Woyda, Madeline Scyphers', 'manual'), + ( + master_doc, + "DRAM.tex", + "DRAM Documentation", + "Rory M Flynn, Kelly C. Wrighton, Mikayla Borton, Reed Woyda, Madeline Scyphers", + "manual", + ), ] @@ -142,10 +144,7 @@ # One entry per manual page. List of tuples # (source start file, name, description, authors, manual section). -man_pages = [ - (master_doc, 'dram', u'DRAM Documentation', - [author], 1) -] +man_pages = [(master_doc, "dram", "DRAM Documentation", [author], 1)] # -- Options for Texinfo output ---------------------------------------------- @@ -154,9 +153,15 @@ # (source start file, target name, title, author, # dir menu entry, description, category) texinfo_documents = [ - (master_doc, 'DRAM', u'DRAM Documentation', - author, 'DRAM', 'One line description of project.', - 'Miscellaneous'), + ( + master_doc, + "DRAM", + "DRAM Documentation", + author, + "DRAM", + "One line description of project.", + "Miscellaneous", + ), ] @@ -175,4 +180,4 @@ # epub_uid = '' # A list of files that should not be packed into the epub file. -epub_exclude_files = ['search.html'] \ No newline at end of file +epub_exclude_files = ["search.html"] diff --git a/docs/contributing.md b/docs/contributing.md index ad6ca0c4..b245d01e 100644 --- a/docs/contributing.md +++ b/docs/contributing.md @@ -3,11 +3,11 @@ Hi there! Many thanks for taking an interest in improving DRAM. -DRAM is written as a Nextflow Pipeline that wraps around the largely python code that does the DRAM calculations. Nextflow handles a lot of the cross platform deployment, dependency manegement, scheduling, and parallelization. What we need to do to get that out of Nextflow though is write whatever DRAM python code we need that can be interphased with through a CLI so Nextflow can call it directly by passing arguements to it. Then the script should write its outputs to files so Nextflow can pass those arguments to the next step. +DRAM is written as a Nextflow Pipeline that wraps around the largely python code that does the DRAM calculations. Nextflow handles a lot of the cross platform deployment, dependency manegement, scheduling, and parallelization. What we need to do to get that out of Nextflow though is write whatever DRAM python code we need that can be interphased with through a CLI so Nextflow can call it directly by passing arguements to it. Then the script should write its outputs to files so Nextflow can pass those arguments to the next step. -## Nextflow resources +## Nextflow resources -You can read more about Nextflow [here](https://www.nextflow.io/docs/latest/index.html), +You can read more about Nextflow [here](https://www.nextflow.io/docs/latest/index.html), ## Nf-core @@ -26,15 +26,15 @@ To make the DRAM code and processing logic more understandable for new contribut ### Adding a new step 1. Write up your main script or script code in whatever language and place it in the bin folder. - * We need to ensure it is executable for Nextflow, so add a shebang to the top of the file (ex. `#!/usr/bin/env python` for a python file) then run `chmod a+x bin/new_script.py` replacing new_sciprt.py with the actual script. -1. If this is a new process, add a new nextflow script (`.nf`) under `modules/local/whatever_subdir_it_goes` + - We need to ensure it is executable for Nextflow, so add a shebang to the top of the file (ex. `#!/usr/bin/env python` for a python file) then run `chmod a+x bin/new_script.py` replacing new_sciprt.py with the actual script. +1. If this is a new process, add a new nextflow script (`.nf`) under `modules/local/whatever_subdir_it_goes` 1. Define the corresponding input channels and output channels 1. If your scripts in the `bin` folder need external dependencies (such as from conda), then add a `environment.yml` file in the same directory as your process (in the `module/local/..`) in your process script add `conda "${moduleDir}/environment.yml"` above your input channels. (See other process scripts as examples). 1. You will now need to install the wave-cli tool to create containers on demand from conda environments. This is how we specify our containers without having to manage docker files or anything else like that. Wave just tells Nextflow how to pull a container on demand from a conda file. You can install wave-cli [here](https://github.com/seqeralabs/wave-cli). Ideally this will be integrated into our CI/CI system in the future. 1. Once you have wave installed, run `wave --freeze --conda-file modules/local/subdir/environment.yml` which will give you some string that starts something like `community.wave.seqera.io`. Below your `conda "${moduleDir}/environment.yml"`, add `container "YOUR STRING FROM WAVE"` - * Now users can run DRAM with with `-profile conda` and `-profile singulary/docker/apptainer/etc.` and it will just work without them installing the dependencies + - Now users can run DRAM with with `-profile conda` and `-profile singulary/docker/apptainer/etc.` and it will just work without them installing the dependencies 1. Add a computation label to your process, such as `label 'process_small'`, that tells Nextflow how much resources to use. We have defined defaults for what process_small, process_medium, etc. mean, but users can override this in their own configs, allowing more control. All the options can be found in `conf/base.config` -1. Add your process by name to `conf/modules.config` if you want to change where your output files get stored in the user's outdir. +1. Add your process by name to `conf/modules.config` if you want to change where your output files get stored in the user's outdir. 1. Add a script section to call your DRAM script, passing in whatever CLI argumenets. The outputs from your DRAM script should be the process outputs. You want them to be written directly in the working directory, Nextflow will manage moving them to the users output directy. You can also rename outputs for future Nextflow steps with the `emit:` keyword, and mark some outputs as optional (see other processes). 1. We now need to add this process to the correct part in our pipeline to be called and ran. If it is in an already established step such as Annotate, we might go to `subworkflows/local/annotate.nf` and find the right spot in that code and add it. Though we might need to add a new subworkflow and add that to our `workflows/dram.nf` -1. We also need to add any new parameters to our `nextflow.config` with a default. And then add the equivalent parameter to our `nextflow_schema.json` with help text. The `nextflow_schema.json` is how our `--help` CLI option is populated as well as what our parameters page on our docs is built from. It also allows us to add sanity checks and validation for all relevant parameters. \ No newline at end of file +1. We also need to add any new parameters to our `nextflow.config` with a default. And then add the equivalent parameter to our `nextflow_schema.json` with help text. The `nextflow_schema.json` is how our `--help` CLI option is populated as well as what our parameters page on our docs is built from. It also allows us to add sanity checks and validation for all relevant parameters. diff --git a/docs/index.md b/docs/index.md index fa577021..36c56333 100644 --- a/docs/index.md +++ b/docs/index.md @@ -2,7 +2,6 @@ The WrightonLabCSU/dram documentation is split into the following pages: - ```{toctree} --- maxdepth: 2 @@ -18,6 +17,6 @@ changelog_include # Indices and tables -* {ref}`genindex` -* {ref}`modindex` -* {ref}`search` \ No newline at end of file +- {ref}`genindex` +- {ref}`modindex` +- {ref}`search` diff --git a/docs/installation.md b/docs/installation.md index 35476055..361ed694 100644 --- a/docs/installation.md +++ b/docs/installation.md @@ -3,16 +3,17 @@ ## Requirements ### System Requirements -* Nextflow >= v23.04.2 -* One of the following dependency management systems: - * Conda - * A Nextflow supported Container Runtime: - * Apptainer - * Singularity CE - * Docker - * Podman - * Sarus -* DRAM databases (preformatted and downloaded via Globus) + +- Nextflow >= v23.04.2 +- One of the following dependency management systems: + - Conda + - A Nextflow supported Container Runtime: + - Apptainer + - Singularity CE + - Docker + - Podman + - Sarus +- DRAM databases (preformatted and downloaded via Globus) On many HPC systems, Nextflow, Conda, and some container runtime (usually Singularity or Apptainer) are already installed. If you are using a local system, you will need to install Nextflow and Conda or a container runtime. On an HPC system, these tools are often loaded with modules. Refer to your HPC system's documentation for instructions on how to load modules. @@ -23,10 +24,13 @@ On many HPC systems, Nextflow, Conda, and some container runtime (usually Singul If you do not have Nextflow installed, you have two options: #### Option A: Direct Installation + Follow the instructions from the [Nextflow documentation page](https://www.nextflow.io/docs/stable/install.html). #### Option B: Conda Installation (Recommended) + Install Nextflow within a conda environment to ensure all dependencies (including Java) are properly installed: + ```bash conda create --name env_nf nextflow -c bioconda conda activate env_nf @@ -58,18 +62,20 @@ If you do not have a container runtime installed, see the [nf-core documentation ### 3. Setup DRAM 1. Create a DRAM directory: + ```bash mkdir DRAM cd DRAM ``` 2. Download the DRAM databases: + - You only need to download the databases you plan to use - Access the databases through [Globus](https://app.globus.org/file-manager?origin_id=97ed64b9-dea0-4eb5-a7e0-0b50ac94e889) (UUID: 97ed64b9-dea0-4eb5-a7e0-0b50ac94e889) - You will need a Globus account to access and download the data - Two options for downloading: - * Using Globus Web UI: Download databases individually - * Using [Globus Connect Personal](https://docs.globus.org/globus-connect-personal/install/): Transfer whole folders at once (recommended for bulk transfers) + - Using Globus Web UI: Download databases individually + - Using [Globus Connect Personal](https://docs.globus.org/globus-connect-personal/install/): Transfer whole folders at once (recommended for bulk transfers) - The disk space required depends on which databases you choose to download - The download consists of a database folder containing all preformatted databases with the description database @@ -79,31 +85,37 @@ cd DRAM curl -o nextflow.config https://raw.githubusercontent.com/WrightonLabCSU/DRAM/refs/heads/dev/nextflow.config ``` - This file can be customized to change: - * Database locations - * Container runtime settings - * SLURM options - * Other profile options + - Database locations + - Container runtime settings + - SLURM options + - Other profile options ### 4. Install and Update DRAM #### Initial Installation + Install DRAM using Nextflow: + ```bash nextflow pull WrightonLabCSU/DRAM -r dev ``` Note: Once DRAM v2 is out of development, the `-r dev` flag will be removed and the command will be simply: + ```bash nextflow pull WrightonLabCSU/DRAM ``` #### Updating DRAM + To update DRAM, rerun the pull command: + ```bash nextflow pull WrightonLabCSU/DRAM ``` To pull a specific branch or version tag: + ```bash nextflow pull WrightonLabCSU/DRAM -r ``` @@ -111,7 +123,9 @@ nextflow pull WrightonLabCSU/DRAM -r Note: Only version tags >= 2 are supported. Pre-version 2 releases were before Nextflow was used. ### Dependency Management + DRAM uses Nextflow to handle all dependency management automatically. When you first run DRAM, it will: + 1. Download all required dependencies based on your chosen profile (conda, singularity, docker, etc.) 2. Cache these dependencies for future use 3. No additional Python packages or environment setup is needed @@ -119,18 +133,24 @@ DRAM uses Nextflow to handle all dependency management automatically. When you f ## Important Notes ### Installation Location + Nextflow installs all pipeline scripts by default in `$HOME/.nextflow/assets/WrightonLabCSU/DRAM`. If you're running DRAM on a shared system, you may want to install it in a shared directory. See the "Custom Installation Location" section below. ### Custom Installation Location + To install DRAM in a custom location: + 1. Clone the DRAM repository to your desired location 2. Run the pipeline by specifying the path: + ```bash nextflow run ``` ### Custom Configuration + To use a custom nextflow.config file: + ```bash nextflow run /main.nf -c ``` @@ -138,8 +158,9 @@ nextflow run /main.nf -c =7 - nf-core=3.2.1 + - pre-commit - pip - pip: - - sphinx-rtd-theme \ No newline at end of file + - sphinx-rtd-theme diff --git a/modules.json b/modules.json index 3408e2d1..48c04632 100644 --- a/modules.json +++ b/modules.json @@ -8,9 +8,7 @@ "multiqc": { "branch": "master", "git_sha": "cf17ca47590cc578dfb47db1c2a44ef86f89976d", - "installed_by": [ - "modules" - ] + "installed_by": ["modules"] } } }, @@ -19,26 +17,20 @@ "utils_nextflow_pipeline": { "branch": "master", "git_sha": "05954dab2ff481bcb999f24455da29a5828af08d", - "installed_by": [ - "subworkflows" - ] + "installed_by": ["subworkflows"] }, "utils_nfcore_pipeline": { "branch": "master", "git_sha": "05954dab2ff481bcb999f24455da29a5828af08d", - "installed_by": [ - "subworkflows" - ] + "installed_by": ["subworkflows"] }, "utils_nfschema_plugin": { "branch": "master", "git_sha": "2fd2cd6d0e7b273747f32e465fdc6bcc3ae0814e", - "installed_by": [ - "subworkflows" - ] + "installed_by": ["subworkflows"] } } } } } -} \ No newline at end of file +} diff --git a/modules/local/add_and_combine/add_annotations.nf b/modules/local/add_and_combine/add_annotations.nf index 5825a73c..9b04584b 100644 --- a/modules/local/add_and_combine/add_annotations.nf +++ b/modules/local/add_and_combine/add_annotations.nf @@ -38,9 +38,9 @@ process ADD_ANNOTATIONS { for col in duplicate_columns: # Create a new column that concatenates information from the old and new columns, if both are non-null - merged_df[col] = merged_df.apply(lambda x: str(x[col + '_old']) + "; " + str(x[col + '_new']) + merged_df[col] = merged_df.apply(lambda x: str(x[col + '_old']) + "; " + str(x[col + '_new']) if pd.notnull(x[col + '_old']) and pd.notnull(x[col + '_new']) - else x[col + '_old'] if pd.notnull(x[col + '_old']) + else x[col + '_old'] if pd.notnull(x[col + '_old']) else x[col + '_new'], axis=1) # Drop the old and new columns after merging their data merged_df.drop(columns=[col + '_old', col + '_new'], inplace=True) diff --git a/modules/local/add_and_combine/generate_gff_genbank.nf b/modules/local/add_and_combine/generate_gff_genbank.nf index 40a3b5c4..ee54a6dd 100644 --- a/modules/local/add_and_combine/generate_gff_genbank.nf +++ b/modules/local/add_and_combine/generate_gff_genbank.nf @@ -5,7 +5,7 @@ process GENERATE_GFF_GENBANK { conda "${moduleDir}/environment.yml" container "community.wave.seqera.io/library/python_pandas_biopython:7df21d027f67112e" - + input: val( all_genes_fna ) val( databases_list ) @@ -34,4 +34,4 @@ process GENERATE_GFF_GENBANK { generate_gff_genbank.py ${flags.join(' ')} --input_fastas_paths ${all_genes_fna} --database_list ${databases_list} --annotations ${raw_annotations} """ -} \ No newline at end of file +} diff --git a/modules/local/annotate/environment.yml b/modules/local/annotate/environment.yml index 0c321455..e81f7bf4 100644 --- a/modules/local/annotate/environment.yml +++ b/modules/local/annotate/environment.yml @@ -9,4 +9,4 @@ dependencies: - mmseqs2==18.8cc5c - scikit-bio=0.7.1 - scipy<2 - - click<9.0 \ No newline at end of file + - click<9.0 diff --git a/modules/local/annotate/gene_locs.nf b/modules/local/annotate/gene_locs.nf index 0bed3dde..97c7e619 100644 --- a/modules/local/annotate/gene_locs.nf +++ b/modules/local/annotate/gene_locs.nf @@ -5,7 +5,7 @@ process GENE_LOCS { conda "${moduleDir}/environment.yml" container "community.wave.seqera.io/library/python_pandas_hmmer_mmseqs2_pruned:d2c88b719ab1322c" - + tag { input_fasta } input: diff --git a/modules/local/annotate/merge_annotations.nf b/modules/local/annotate/merge_annotations.nf index c97c487e..cce32b23 100644 --- a/modules/local/annotate/merge_annotations.nf +++ b/modules/local/annotate/merge_annotations.nf @@ -1,6 +1,6 @@ process MERGE_ANNOTATIONS { label 'process_small' - + errorStrategy 'finish' conda "${moduleDir}/environment.yml" diff --git a/modules/local/annotate/mmseqs_index.nf b/modules/local/annotate/mmseqs_index.nf index 983339b8..c33d12b1 100644 --- a/modules/local/annotate/mmseqs_index.nf +++ b/modules/local/annotate/mmseqs_index.nf @@ -5,7 +5,7 @@ process MMSEQS_INDEX{ conda "${moduleDir}/environment.yml" container "community.wave.seqera.io/library/python_pandas_hmmer_mmseqs2_pruned:d2c88b719ab1322c" - + tag { input_fasta } input: @@ -25,4 +25,4 @@ process MMSEQS_INDEX{ """ -} \ No newline at end of file +} diff --git a/modules/local/annotate/mmseqs_search.nf b/modules/local/annotate/mmseqs_search.nf index f9b73bdd..279de72b 100644 --- a/modules/local/annotate/mmseqs_search.nf +++ b/modules/local/annotate/mmseqs_search.nf @@ -9,8 +9,8 @@ process MMSEQS_SEARCH { tag { input_fasta } input: - tuple( val(input_fasta), - path( query_database, stageAs: "query_database/" ), + tuple( val(input_fasta), + path( query_database, stageAs: "query_database/" ), path( prodigal_locs_tsv, stageAs: "gene_locs.tsv" ) ) path( mmseqs_database ) @@ -78,7 +78,7 @@ process MMSEQS_SEARCH { # Convert Reverse Best Hit results to BLAST outformat 6 mmseqs convertalis ${db_name}.mmsdb query_database/${input_fasta}.mmsdb mmseqs_out/${input_fasta}_${db_name}_tophit_rbh_minbitscore${bit_score_threshold}.mmsdb mmseqs_out/${input_fasta}___mmseqs_rbh_${db_name}.tsv --threads ${task.cpus} - + # Need additional processing for KEGG RBH rbh_mmseqs_filter.py filterdb "mmseqs_out/${input_fasta}___mmseqs_${db_name}.tsv" --reverse "mmseqs_out/${input_fasta}___mmseqs_rbh_${db_name}.tsv" --output "mmseqs_out/${input_fasta}___mmseqs_rbh_${db_name}_combined.tsv" mv mmseqs_out/${input_fasta}___mmseqs_rbh_${db_name}_combined.tsv mmseqs_out/${input_fasta}___mmseqs_${db_name}.tsv diff --git a/modules/local/call/call_genes_prodigal.nf b/modules/local/call/call_genes_prodigal.nf index 77674589..806bb20d 100644 --- a/modules/local/call/call_genes_prodigal.nf +++ b/modules/local/call/call_genes_prodigal.nf @@ -52,7 +52,7 @@ process CALL_GENES { # We parse the GFF to create a summary TSV for later use parse_faa.sh "${input_fasta}_called_genes.faa" "${input_fasta}_called_genes_table.tsv" - # Next we need to convert all metadata ID fields from generated unique + # Next we need to convert all metadata ID fields from generated unique # IDS (1_1, 1_2, 2_1, etc.) to SeqID_GeneNumber (Bin7_1, Bin7_2, etc.) gff_replace_id_with_scaffold_gene_number.sh "${input_fasta}_called_genes.gff" "${input_fasta}_called_genes_renamed.gff" mv "${input_fasta}_called_genes_renamed.gff" "${input_fasta}_called_genes.gff" diff --git a/modules/local/call/quast.nf b/modules/local/call/quast.nf index a2932e61..ffc3d77e 100644 --- a/modules/local/call/quast.nf +++ b/modules/local/call/quast.nf @@ -18,7 +18,7 @@ process QUAST { """ set -euo pipefail shopt -s nullglob # make *.fa expand to nothing if no matches - + export FASTA_COLUMN="${params.CONSTANTS.FASTA_COLUMN}" quast.py -o quast_results --no-plots --no-html --no-icarus --no-snps *.fa diff --git a/modules/local/collect_rna/environment.yml b/modules/local/collect_rna/environment.yml index c548e20d..22be72b1 100644 --- a/modules/local/collect_rna/environment.yml +++ b/modules/local/collect_rna/environment.yml @@ -7,4 +7,3 @@ dependencies: - pandas=1.5.2 - barrnap=0.9 - trnascan-se=2.0.12 - \ No newline at end of file diff --git a/modules/local/collect_rna/trna_scan.nf b/modules/local/collect_rna/trna_scan.nf index 1a36f540..7ebda828 100644 --- a/modules/local/collect_rna/trna_scan.nf +++ b/modules/local/collect_rna/trna_scan.nf @@ -26,7 +26,7 @@ process TRNA_SCAN { os.environ['TMPDIR'] = './tmp' FASTA_COLUMN="${params.CONSTANTS.FASTA_COLUMN}" - + # Create the temporary directory if it doesn't exist os.makedirs(os.environ['TMPDIR'], exist_ok=True) diff --git a/modules/local/distill/environment.yml b/modules/local/distill/environment.yml index 1f0713f8..d1281069 100644 --- a/modules/local/distill/environment.yml +++ b/modules/local/distill/environment.yml @@ -10,4 +10,4 @@ dependencies: - xlsxwriter - numpy - lark - - networkx \ No newline at end of file + - networkx diff --git a/modules/local/trees/trees.nf b/modules/local/trees/trees.nf deleted file mode 100644 index bc3720a3..00000000 --- a/modules/local/trees/trees.nf +++ /dev/null @@ -1,92 +0,0 @@ -process TREES { - label 'process_tiny' - - errorStrategy 'finish' - - input: - path( ch_combined_annotations, stageAs: "initial-annotations.tsv" ) - val( trees_list ) - path( ch_collected_proteins ) - path( tree_data_files ) - path( ch_trees_scripts ) - file( ch_add_trees ) - - output: - path("updated-annotations.tsv"), emit: updated_annotations, optional: true - path("aligned_sequences.jplace"), emit: tree_placements, optional: true - path("colored_tree.pdf"), emit: colored_tree, optional: true - path("colored_tree_python.pdf"), emit: colored_tree_python, optional: true - - script: - """ - # export constants for script - export FASTA_COLUMN="${params.CONSTANTS.FASTA_COLUMN}" - - ln -s ${tree_data_files}/* . - ln -s ${ch_trees_scripts}/*.py . - ln -s ${ch_trees_scripts}/*.R . - - cp initial-annotations.tsv current-annotations.tsv - - # Symlink additional tree directories if provided - if [[ "${params.add_trees}" != "" ]]; then - ln -s ${ch_add_trees}/* ${tree_data_files}/ - fi - - # Append additional tree directories to trees_list - if [ -d "${params.add_trees}" ]; then - for dir in \$(ls ${params.add_trees}); do - trees_list+=";\$dir" - done - fi - - # Split trees_list into an array - IFS=';' read -ra TREE_OPTIONS <<< "${trees_list}" - - for tree_option in "\${TREE_OPTIONS[@]}"; do - echo "Processing tree: \${tree_option}" - - # Determine the search terms file for the current tree - KO_LIST="\${tree_option}/\${tree_option}.refpkg/\${tree_option}_search_terms.txt" - python parse_annotations.py current-annotations.tsv \${KO_LIST} "extracted_query_ids.txt" - - if [ -s "extracted_query_ids.txt" ]; then - # The file is not empty, proceed with processing - - # Loop through each line in the output file, extract the corresponding sequence - mkdir -p extracted_sequences - while IFS=\$'\t' read -r input_fasta query_id; do - seqtk subseq \${input_fasta}_called_genes.faa <(echo \${query_id}) > extracted_sequences/\${input_fasta}_\${query_id}.fasta - done < extracted_query_ids.txt - - # Combine all sequences into one file - cat extracted_sequences/*.fasta > combined_extracted_sequences.fasta - - # Align sequences to the reference alignment - mafft --thread ${params.threads} --add combined_extracted_sequences.fasta --reorder trees/\${tree_option}/\${tree_option}.refpkg/\${tree_option}.aln > aligned_sequences.fasta - - # Run pplacer - pplacer -j ${task.cpus} -c trees/\${tree_option}/\${tree_option}.refpkg aligned_sequences.fasta - - # Generate visualization using guppy tog (translate .jplace to other formats) - guppy tog -o aligned_sequences.xml aligned_sequences.jplace - - # Update the annotations using the mapping and the placements - python update_annots_trees.py aligned_sequences.jplace current-annotations.tsv "trees/\${tree_option}/\${tree_option}.refpkg/\${tree_option}-tree-mapping.tsv" updated-annotations.tsv - - # Set the updated annotations as the current for the next tree - mv updated-annotations.tsv current-annotations.tsv - - # Color labels and generate PDF - Rscript color_labels.R aligned_sequences.xml extracted_query_ids.txt colored_tree.pdf - - else - echo "No gene IDs of interest found for tree \${tree_option}, skipping sequence extraction and analysis." - fi - done - - # Finalize the process - mv current-annotations.tsv updated-annotations.tsv - - """ -} diff --git a/modules/nf-core/multiqc/tests/main.nf.test.snap b/modules/nf-core/multiqc/tests/main.nf.test.snap index 2fcbb5ff..261dc0fa 100644 --- a/modules/nf-core/multiqc/tests/main.nf.test.snap +++ b/modules/nf-core/multiqc/tests/main.nf.test.snap @@ -38,4 +38,4 @@ }, "timestamp": "2024-10-02T17:52:09.185842" } -} \ No newline at end of file +} diff --git a/modules/utils/help.nf b/modules/utils/help.nf deleted file mode 100644 index 20c5092e..00000000 --- a/modules/utils/help.nf +++ /dev/null @@ -1,443 +0,0 @@ -CONDA_ENV_DEPS = file(params.main_environment).text.split('dependencies:')[1] - -DNA_HEADER = """ -=========================================== - $workflow.manifest.name -(==( )==) (==( )==) - `-.`. ,',-' `-.`. ,',-' - _,-'" _,-'" - ,-',' `.`-. ,-',' `.`-. -(==( )==) (==( )==) - `-.`. ,',-' `-.`. ,',-' - _,-'" _,-'" - ,-',' `.`-. ,-',' `.`-. -(==( )==) (==( )==) - $workflow.manifest.version -=========================================== -""" - -DEPENDENCIES = """ - Software versions used: - - $CONDA_ENV_DEPS -""" - -LICENSE = "MIT License. Micobial Ecosystems Lab, Colorado State University Fort Collins. 2024 (last updated 2024)" - -REQUIRED_OPTIONS = """ -REQUIRED $workflow.manifest.name profile options: - -profile STRING - Runs $workflow.manifest.name either using Conda (must be installed) or Singularity (must be installed). - Runs $workflow.manifest.name with no scheduling or scheduling via SLURM. - See SLURM options in full help menu. -""" -MAIN_HELP = """ -Description: - The purpose of $workflow.manifest.name is to provide FASTA annotation, across a vast array of databases, with expertly-currated distillation. - $workflow.manifest.name can be used to call, annotate and distill annotations from input FASTA files. - Call, annotate and distill can be run together or, each can be run idependently. - -Bring up help menu: - nextflow run $workflow.manifest.name --help (--h) - -Bring up versions menu: - nextflow run $workflow.manifest.name --version (--v) - -Usage: - nextflow run $workflow.manifest.name --rename --call --annotate --use_ - - Call genes using input fastas (use --rename to rename FASTA headers): - nextflow run $workflow.manifest.name --call --rename --input_fasta - - Annotate called genes using input fastas: - nextflow run $workflow.manifest.name --annotate --input_genes - - Distill using input annotations: - nextflow run $workflow.manifest.name --distill_ --annotations - - (Combined): Call, annotate and distill input fasta files: - nextflow run $workflow.manifest.name --rename --call --annotate --use_ - - (Real) example: (on multiple lines for clarity) - nextflow run $workflow.manifest.name --input_fasta ../test_data/ - --outdir $workflow.manifest.name-test-data-Feb012024/ - --call --rename - --annotate --use_uniref --use_kegg --use_merops --use_viral --use_camper --use_kofam --use_dbcan --use_methyl --use_canthyd --use_vog --use_fegenie --use_sulfur - --add_annotations ../test-data/old-DRAM-annotations.tsv - --distill_topic 'carbon transport energy' --distill_ecosystem 'eng_sys ag' - --distill_custom assets/forms/distill_sheets/test.tsv -resume --slurm_node zenith - --trnas ../test-data/trnas.tsv - --rrnas ../test-data/rrnas.tsv - --bin_quality ../test-data/checkM1-test-data.tsv - --taxa ../test-data/gtdbtk.bac120.summary.tsv - --generate_gff - --generate_gbk - --threads 5 - -with-report -with-trace -with-timeline - -Main $workflow.manifest.name Operations: - --call : Call genes using prodigal - --annotate : Annotate called genes using downloaded databases - --distill : Distill the annotations into a multi-sheet distillate.xlsx - --product : Generate a product heatmap of the annotations - --format_kegg : Format KEGG database for use in $workflow.manifest.name. Standalone operation, will exit after completion. -""" - -CALL_OPTIONS = """ -Call options: - --call Call genes on the input FASTA files using Prodigal. - - --input_fasta PATH - Directory containing input fasta files. - Default: <./input_fasta/*.fa*> - - --rename OPTION Rename FASTA headers based on file name. - Example: sample1.fa --> (fasta header renamed to) > sample1...... - Why? $workflow.manifest.name output is focused on scaffolds/contigs with respect to each provided input sample. - Thus, without renaming FASTA headers, the individual scaffolds/contigs will not be distinguashable. - *If you have already renamed your FASTA headers, do not include '--call'. - - --prodigal_mode STRING - Default: 'single' - - --prodigal_tras_table NUMBER (1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25) - Specify a translation table to use (default: '1'). - - --min_contig_len NUMBER - Default: '2500' -""" - -ANNOTATE_OPTIONS = """ -Annotate options: - --annotate Annotate called genes using downloaded databases - - --use_ STRING - metabolism_kegg_set = kegg, dbcan, merops, pfam, heme - metabolism_set = kofam, dbcan, merops, pfam, heme - adjectives_kegg_set = kegg, dbcan, merops, pfam, heme, sulfur, camper, methyl, fegenie - adjectives_set = kofam, dbcan, merops, pfam, heme, sulfur, camper, methyl, fegenie - *Only one set can be used. Can be used in combination with --use_[db-name] - - --input_fasta PATH - Directory containing input fasta files. - Default: './input_fasta/' - Either '--input_fasta' or '--input_genes' may be used - not both. - - --input_genes PATH - Directory containing called genes (.faa) - - --add_annotations PATH - Used to add in old annotations to the current run. (See example for format.) - - --generate_gff OPTION Will generate an output GFF for each sample based on the raw-annotations.tsv. - - --generate_gbk OPTION Will generate an output GBK for each sample based on the raw-annotations.tsv. -""" - -SUMMARIZE_OPTIONS = """ -Distill options: - --distill Distill the annotations into a multi-sheet distillate.xlsx - - --annotations PATH - Required if you are running distill without --call and --annotate. - - --rrnas PATH (See example for format.) - rRNA information will be included in distill output. - - --trnas PATH (See example for format.) - tRNA information will be included in distill output. - - --bin_quality PATH (See example for format.) - CheckM and CheckM2 compatible. - - --taxa PATH - Compatible with GTDB. (See example for format.) - - --distill_topic STRING OR - If more than one topic included, they must be enclosed in single quotes - - --distill_ecosystem STRING - If more than one ecosystem included, they must be enclosed in single quotes - - --distill_custom STRING (See example for format and options.) - As of now, only one custom distillate may be included. -""" - -PRODUCT_OPTIONS = """ -Product options: - --product Generate a product visualization of the annotations and save the output to the output directory. - - --annotations PATH - Required if you are running product without --call and --annotate. - - --groupby_column STRING Column to to group by in the annotations file for etc and function groupings - Default: 'fasta' - - --module_steps_form PATH - override default module steps form database TSV - - --etc_module_form PATH - override default etc module form database TSV - - --function_heatmap_form PATH - override default function heatmap form database TSV -""" - -TREE_OPTIONS = """ -Tree options: - --trees OPTION Will run Trees. (This option is not advised as $workflow.manifest.name Trees is in development.) -""" - -FORMAT_KEGG_DB_OPTIONS = """ -Format KEGG Database options: - --format_kegg Format KEGG database for use in $workflow.manifest.name. Standalone operation, will exit after completion. - - --kegg_pep_loc PATH - Path to and of the gene fasta files that are provided by the - KEGG FTP server or a concatenated version of them - --gene_ko_link_loc PATH - Path to the genes_ko_link file downloaded from KEGG - - --kegg_db PATH - Output path to the KEGG database directory. This is where the - formatted KEGG database will be stored. Default: `${params.kegg_db}` - relative to $workflow.manifest.name directory. - --kegg_download_date STRING - The date the KEGG database was downloaded. If not provided, the - current date will be used. - --skip_gene_ko_link OPTION Skip the gene_ko_link file. If you are using an older version of KEGG that does - supply the gene_ko_link file you can use this option to skip the gene_ko_link - file. Otherwise, the gene_ko_link file is required. -""" - -ADJECTIVES_OPTIONS = """ -Adjectives options: - --annotations_tsv_path PATH Location of an annotations.tsv. You don't - need to use this option if you are using the - output_dir for dram with a project_config. - If you use this option, you must also use - the force flag to bypass the safeguards that - prevent you from running distill with - insufficient data. - --adjectives_tsv_path PATH Location of the output adjectives.tsv. if - you leave this blank the adjectives.tsv file - will be put in the output directory. - -a, --adjectives TEXT A list of adjectives, by name, to evaluate. - This limits the number of adjectives that - are evaluated, and is faster. - -p, --plot_adjectives TEXT A list of adjectives, by name, to plot. This - limits the number of adjectives that are - plotted and is probably needed for speed. - -g, --plot_genomes TEXT - --plot_path PATH will become a folder of output plots, no - path no plots. - --strainer_tsv PATH The path for a tsv that will pass to - strainer to filter genes. The only option at - this time is ‘pgtb’ for positive genes that - are on true bugs. - --strainer_type PATH The type of process that should make the - strainer file. - --debug_ids_by_fasta_to_tsv PATH - This is a tool to debug the list of IDs - found by DRAM it is mostly for experts. - --user_rules_tsv PATH This is an optional path to a rules file - with strict formatting. It will overwrite - the original rules file that is stored with - the script. - --show_rules_path Show the path to the default rules path. - --list_name List the names for all adjectives_tsv that - are available, you can pass these names to - limit the adjectives that are evaluated - --list_id List the names for all adjectives_tsv that - are available, you can pass these names to - limit the adjectives that are evaluated, - --input_fasta PATH - Directory containing input fasta files. - Default: <./input_fasta/*.fa*> - """ - -GENERAL_OPTIONS = """ -General options: - --outdir PATH - Default: './DRAM_output/' - - --threads NUMBER Number of threads to use for processing. - Default: `${params.threads}` - - --slurm_node string - Example --slurm_queue c001 - - --slurm_queue string - Example: --slurn_queue 'smith-hi,smith-low' -""" - -CALL_DESCRIPTION = """ -Call description: The purpose of $workflow.manifest.name --call is to call genes on input FASTA files. - -Usage: - - Call genes using input fastas: - nextflow run $workflow.manifest.name --call --input_fasta --outdir --threads -""" - -ANNOTATE_DESCRIPTION = """ -Annotate description: The purpose of $workflow.manifest.name '--annotate' is to annotate called genes on input (nucleotide) FASTA (fa*) files. - -Usage: - - Annotate called genes using input called genes and the KOFAM database: - nextflow run $workflow.manifest.name --annotate --input_genes --use_kofam - - Annotate called genes using input fasta files and the KOFAM database: - nextflow run $workflow.manifest.name --annotate --input_fasta --use_kofam -""" - -SUMMARIZE_DESCRIPTION = """ -Distill description: The purpose of $workflow.manifest.name --distill is to distill down annotations based on curated distillation summary form(s). - User's may also provide a custom distillate via --distill_custom (TSV forms). - Distill can be ran independent of --call and --annotate however, annotations must be provided (--annotations ). - Optional tRNA, rRNA and bin quality may also be provided. - -Usage: - nextflow run $workflow.manifest.name --distill_ --annotations --outdir --threads - *Important: if more than one topic or ecosystem is included, they must be enclosed in single quotes. Example: --distill_topic 'carbon transport' - -Example: - Call and Annotate genes using input fastas and KOFAM database. Distill using carbon topic and AG ecosystem: - nextflow run $workflow.manifest.name --input_fasta --outdir --call --annotate --distill_topic carbon --distill_ecosystem ag --threads --use_kofam -""" - -PRODUCT_DESCRIPTION = """ -Product description: The purpose of $workflow.manifest.name --product is to generate a product visualization of the annotations - and save the output to the output directory. - -Usage: - nextflow run $workflow.manifest.name --product --annotations --outdir - -Example: - Create heatmap product visualization from annotations file and save to output directory: - nextflow run $workflow.manifest.name --product --annotations --outdir -""" - -ADJECTIVES_DESCRIPTION = """ -Annotate description: The purpose of $workflow.manifest.name '--adjectives' is to evaluate genes and describe their features. - -Usage: - TO BE ADDED LATER - -THIS IS A WORK IN PROGRESS AND IS NOT YET COMPLETE -""" - -FORMAT_KEGG_DB_DESCRIPTION = """ -Format KEGG DB description: The purpose of $workflow.manifest.name '--format_kegg' is to format the raw KEGG database (pep files) - for use in $workflow.manifest.name. Because use of the KEGG database requires a license, the user must download the raw KEGG database - themselves. Currently this only supports formatting a concatenated version of the KEGG pep files see - (https://github.com/WrightonLabCSU/DRAM/issues/305) for guidance on how to prepare your pep files for formatting. - -Usage: - nextflow run $workflow.manifest.name --format_kegg --kegg_pep_loc --kegg_db -""" - -/* -~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ - Version menu -~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -*/ - -def version() { -log.info""" -${DNA_HEADER} -${DEPENDENCIES} -""" -} - -/* -~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ - Help menus -~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ -*/ - -def helpMessage() { -log.info """ -${DNA_HEADER} -${LICENSE} -${MAIN_HELP} -${REQUIRED_OPTIONS} -${CALL_OPTIONS} -${ANNOTATE_OPTIONS} -${SUMMARIZE_OPTIONS} -${PRODUCT_OPTIONS} -${TREE_OPTIONS} -${FORMAT_KEGG_DB_OPTIONS} -${GENERAL_OPTIONS} -""" -} - -def callHelpMessage() { -log.info """ -${DNA_HEADER} -${LICENSE} -${CALL_DESCRIPTION} -${REQUIRED_OPTIONS} -${CALL_OPTIONS} -${GENERAL_OPTIONS} -""" -} - -def annotateHelpMessage() { -log.info """ -${DNA_HEADER} -${LICENSE} -${ANNOTATE_DESCRIPTION} -${REQUIRED_OPTIONS} -${ANNOTATE_OPTIONS} -${GENERAL_OPTIONS} -""" -} - -def distillHelpMessage() { -log.info """ -${DNA_HEADER} -${LICENSE} -${SUMMARIZE_DESCRIPTION} -${REQUIRED_OPTIONS} -${SUMMARIZE_OPTIONS} -${GENERAL_OPTIONS} -""" -} - -def productHelpMessage() { -log.info """ -${DNA_HEADER} -${LICENSE} -${PRODUCT_DESCRIPTION} -${REQUIRED_OPTIONS} -${PRODUCT_OPTIONS} -${GENERAL_OPTIONS} -""" -} - -def adjectivesHelpMessage() { -log.info """ -${DNA_HEADER} -${LICENSE} -${ADJECTIVES_DESCRIPTION} -${REQUIRED_OPTIONS} -${ADJECTIVES_OPTIONS} -${GENERAL_OPTIONS} -""" -} - -def formatKeggHelpMessage() { -log.info """ -${DNA_HEADER} -${LICENSE} -${FORMAT_KEGG_DB_DESCRIPTION} -${REQUIRED_OPTIONS} -${FORMAT_KEGG_DB_OPTIONS} -${GENERAL_OPTIONS} -""" -} diff --git a/nextflow.config b/nextflow.config index 828e924c..e1536ddb 100644 --- a/nextflow.config +++ b/nextflow.config @@ -159,11 +159,11 @@ params { slurm_node = null // Slurm resource requirements // These are the default values for the slurm profile - // If not defined, will default to the largest Process resource requirements + // If not defined, will default to the largest Process resource requirements cpu_provision_limit = null mem_gb_provision_limit = null time_hr_provision_limit = null - + /* Process Options */ queue_size = 10 @@ -507,7 +507,7 @@ validation { \033[0;32m _,-'"\033[0;34m | | | | | _ / / /\\ \\ | |\\/| | \033[0;32m_,-'" \033[0m \033[0;32m ,-',' `.`-.\033[0;34m | |__| | | | \\ \\ / ____ \\ | | | | \033[0;32m,-',' `.`-. \033[0m \033[0;32m(==( )==)\033[0;34m |_____/ |_| \\_\\ /_/ \\_\\ |_| |_| \033[0;32m(==( )==) \033[0m - + \033[0;35m ${manifest.name} ${manifest.version}\033[0m \033[2m=====================================================================\033[0m diff --git a/nextflow_schema.json b/nextflow_schema.json index 8899dbe0..256aa91f 100644 --- a/nextflow_schema.json +++ b/nextflow_schema.json @@ -95,9 +95,7 @@ "fa_,icon": "fas fa-plus" } }, - "required": [ - "outdir" - ] + "required": ["outdir"] }, "call_prodigal_options": { "title": "Call Prodigal Options", @@ -109,42 +107,13 @@ "type": "string", "description": "Mode for Prodigal gene calling.", "default": "meta", - "enum": [ - "meta", - "single" - ] + "enum": ["meta", "single"] }, "prodigal_trans_table": { "type": "number", "description": "Translation table to use.", "default": 11.0, - "enum": [ - 1, - 2, - 3, - 4, - 5, - 6, - 7, - 8, - 9, - 10, - 11, - 12, - 13, - 14, - 15, - 16, - 17, - 18, - 19, - 20, - 21, - 22, - 23, - 24, - 25 - ] + "enum": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25] }, "min_contig_len": { "type": "number", @@ -153,9 +122,7 @@ } }, "dependentRequired": { - "call": [ - "input_fasta" - ] + "call": ["input_fasta"] } }, "annotate_options": { @@ -771,14 +738,7 @@ "description": "Method used to save pipeline results to output directory.", "help_text": "The Nextflow `publishDir` option specifies which intermediate files should be saved to the output directory. This option tells the pipeline what method should be used to move these files. See [Nextflow docs](https://www.nextflow.io/docs/latest/process.html#publishdir) for details.", "fa_icon": "fas fa-copy", - "enum": [ - "symlink", - "rellink", - "link", - "copy", - "copyNoFollow", - "move" - ], + "enum": ["symlink", "rellink", "link", "copy", "copyNoFollow", "move"], "hidden": true }, "email": { @@ -919,4 +879,4 @@ "$ref": "#/$defs/generic_options" } ] -} \ No newline at end of file +} diff --git a/nf-test.config b/nf-test.config index ae175153..9b6875a5 100644 --- a/nf-test.config +++ b/nf-test.config @@ -23,4 +23,4 @@ config { load "nft-csv@0.1.0" } -} \ No newline at end of file +} diff --git a/scripts/pre_docs_install.sh b/scripts/pre_docs_install.sh index a921b6fd..d5776b02 100644 --- a/scripts/pre_docs_install.sh +++ b/scripts/pre_docs_install.sh @@ -1,2 +1,2 @@ #!/usr/bin/env bash -nf-core pipelines schema docs --format markdown --output docs/params_doc.md \ No newline at end of file +nf-core pipelines schema docs --format markdown --output docs/params_doc.md diff --git a/subworkflows/local/annotate.nf b/subworkflows/local/annotate.nf index 2bcda518..7efc4440 100644 --- a/subworkflows/local/annotate.nf +++ b/subworkflows/local/annotate.nf @@ -98,11 +98,11 @@ workflow ANNOTATE { // n_fastas = file("$params.input_genes/${params.genes_fmt}").size() } - + if (params.annotate){ - DB_SEARCH( - ch_gene_locs, - ch_called_proteins, + DB_SEARCH( + ch_gene_locs, + ch_called_proteins, default_sheet, use_kegg, use_kofam, @@ -134,4 +134,4 @@ workflow ANNOTATE { ch_combined_annotations ch_quast_stats -} \ No newline at end of file +} diff --git a/subworkflows/local/call.nf b/subworkflows/local/call.nf index 74ae33d5..fd34c1c4 100644 --- a/subworkflows/local/call.nf +++ b/subworkflows/local/call.nf @@ -58,7 +58,7 @@ workflow CALL { ch_gene_locs // channel: [ val(input_fasta name), path(gene_locs_tsv) ] ch_called_genes // channel: [ val(input_fasta name), path(called_genes_file.fna) ] ch_called_proteins // channel: [ val(input_fasta name), path(called_proteins_file.faa) ] - ch_collected_faa + ch_collected_faa ch_collected_fna ch_collected_fasta } diff --git a/subworkflows/local/collect_rna.nf b/subworkflows/local/collect_rna.nf index 5df2bddb..55e77d11 100644 --- a/subworkflows/local/collect_rna.nf +++ b/subworkflows/local/collect_rna.nf @@ -30,7 +30,7 @@ workflow COLLECT_RNA { run_rrna_collect = false run_trna_collect = false - // If we didn't run call + // If we didn't run call if (!call) { if (params.rrnas) { Channel.fromPath("${params.rrnas}/*.tsv", checkIfExists: true) @@ -102,4 +102,4 @@ workflow COLLECT_RNA { ch_trna_collected ch_trna_combined -} \ No newline at end of file +} diff --git a/subworkflows/local/db_search.nf b/subworkflows/local/db_search.nf index d2317295..a08673c4 100644 --- a/subworkflows/local/db_search.nf +++ b/subworkflows/local/db_search.nf @@ -132,9 +132,9 @@ workflow DB_SEARCH { // KOFAM annotation if (use_kofam) { ch_combined_proteins_locs = ch_called_proteins.join(ch_gene_locs) - HMM_SEARCH_KOFAM ( - ch_combined_proteins_locs, - params.kofam_e_value, + HMM_SEARCH_KOFAM ( + ch_combined_proteins_locs, + params.kofam_e_value, DB_CHANNEL_SETUP.out.ch_kofam_db, ch_kofam_list, true, @@ -157,8 +157,8 @@ workflow DB_SEARCH { // dbCAN annotation if (use_dbcan) { ch_combined_proteins_locs = ch_called_proteins.join(ch_gene_locs) - HMM_SEARCH_DBCAN ( - ch_combined_proteins_locs, + HMM_SEARCH_DBCAN ( + ch_combined_proteins_locs, params.dbcan_e_value, DB_CHANNEL_SETUP.out.ch_dbcan_db, default_sheet, @@ -174,9 +174,9 @@ workflow DB_SEARCH { if (use_camper) { // HMM ch_combined_proteins_locs = ch_called_proteins.join(ch_gene_locs) - HMM_SEARCH_CAMPER ( - ch_combined_proteins_locs, - params.camper_e_value, + HMM_SEARCH_CAMPER ( + ch_combined_proteins_locs, + params.camper_e_value, DB_CHANNEL_SETUP.out.ch_camper_hmm_db, ch_camper_hmm_list, false, @@ -195,9 +195,9 @@ workflow DB_SEARCH { // FeGenie annotation if (use_fegenie) { ch_combined_proteins_locs = ch_called_proteins.join(ch_gene_locs) - HMM_SEARCH_FEGENIE ( - ch_combined_proteins_locs, - params.fegenie_e_value, + HMM_SEARCH_FEGENIE ( + ch_combined_proteins_locs, + params.fegenie_e_value, DB_CHANNEL_SETUP.out.ch_fegenie_db, default_sheet, false, @@ -225,9 +225,9 @@ workflow DB_SEARCH { //HMM ch_combined_proteins_locs = ch_called_proteins.join(ch_gene_locs) - HMM_SEARCH_CANTHYD ( - ch_combined_proteins_locs, - params.canthyd_e_value, + HMM_SEARCH_CANTHYD ( + ch_combined_proteins_locs, + params.canthyd_e_value, DB_CHANNEL_SETUP.out.ch_canthyd_hmm_db, ch_canthyd_hmm_list, false, @@ -240,9 +240,9 @@ workflow DB_SEARCH { // Sulfur annotation if (use_sulfur) { ch_combined_proteins_locs = ch_called_proteins.join(ch_gene_locs) - HMM_SEARCH_SULFUR ( - ch_combined_proteins_locs, - params.sulfur_e_value, + HMM_SEARCH_SULFUR ( + ch_combined_proteins_locs, + params.sulfur_e_value, DB_CHANNEL_SETUP.out.ch_sulfur_db, default_sheet, false, @@ -276,9 +276,9 @@ workflow DB_SEARCH { // Metals annotation if (use_metals) { ch_combined_proteins_locs = ch_called_proteins.join(ch_gene_locs) - HMM_SEARCH_METALS ( - ch_combined_proteins_locs, - params.metals_e_value, + HMM_SEARCH_METALS ( + ch_combined_proteins_locs, + params.metals_e_value, DB_CHANNEL_SETUP.out.ch_metals_db, default_sheet, false, @@ -291,12 +291,12 @@ workflow DB_SEARCH { if (use_vog) { ch_combined_proteins_locs = ch_called_proteins.join(ch_gene_locs) HMM_SEARCH_VOG ( - ch_combined_proteins_locs, - params.vog_e_value, + ch_combined_proteins_locs, + params.vog_e_value, DB_CHANNEL_SETUP.out.ch_vogdb_db, default_sheet, false, - vogdb_name + vogdb_name ) ch_vog_formatted = HMM_SEARCH_VOG.out.formatted_hits formattedOutputChannels = formattedOutputChannels.mix(ch_vog_formatted) @@ -314,7 +314,7 @@ workflow DB_SEARCH { } fastas = formattedOutputChannels.map { it[1] }.collect() genes = ch_called_proteins.map { it[1] }.collect() - + COMBINE_ANNOTATIONS( fastas, genes ) ch_combined_annotations = COMBINE_ANNOTATIONS.out.combined_annotations_out @@ -457,4 +457,4 @@ workflow DB_CHANNEL_SETUP { ch_vogdb_db ch_viral_db index_mmseqs -} \ No newline at end of file +} diff --git a/subworkflows/local/merge.nf b/subworkflows/local/merge.nf index 8b4f7ece..d6945aeb 100644 --- a/subworkflows/local/merge.nf +++ b/subworkflows/local/merge.nf @@ -40,4 +40,4 @@ workflow MERGE { .set { ch_merge_annotations_collected } MERGE_ANNOTATIONS( ch_merge_annotations_collected ) -} \ No newline at end of file +} diff --git a/subworkflows/local/qc.nf b/subworkflows/local/qc.nf index 298c4fff..3fcdd537 100644 --- a/subworkflows/local/qc.nf +++ b/subworkflows/local/qc.nf @@ -62,7 +62,7 @@ workflow QC { .collect() .set { ch_collected_fna } } - + GENERATE_GFF_GENBANK( ch_collected_fna, params.database_list, ch_final_annots ) } @@ -73,4 +73,4 @@ workflow QC { ch_final_annots ch_rrna_collected ch_trna_collected -} \ No newline at end of file +} diff --git a/subworkflows/local/utils_pipeline_setup.nf b/subworkflows/local/utils_pipeline_setup.nf index 90908185..5e40ab25 100644 --- a/subworkflows/local/utils_pipeline_setup.nf +++ b/subworkflows/local/utils_pipeline_setup.nf @@ -16,4 +16,4 @@ def getDBFlag(db_list, db_name, value_for_all) { } else { return false } -} \ No newline at end of file +} diff --git a/subworkflows/nf-core/utils_nextflow_pipeline/tests/main.function.nf.test.snap b/subworkflows/nf-core/utils_nextflow_pipeline/tests/main.function.nf.test.snap index e3f0baf4..846287c4 100644 --- a/subworkflows/nf-core/utils_nextflow_pipeline/tests/main.function.nf.test.snap +++ b/subworkflows/nf-core/utils_nextflow_pipeline/tests/main.function.nf.test.snap @@ -17,4 +17,4 @@ }, "timestamp": "2024-02-28T12:02:12.425833" } -} \ No newline at end of file +} diff --git a/subworkflows/nf-core/utils_nfcore_pipeline/tests/main.function.nf.test.snap b/subworkflows/nf-core/utils_nfcore_pipeline/tests/main.function.nf.test.snap index 02c67014..b13b3112 100644 --- a/subworkflows/nf-core/utils_nfcore_pipeline/tests/main.function.nf.test.snap +++ b/subworkflows/nf-core/utils_nfcore_pipeline/tests/main.function.nf.test.snap @@ -133,4 +133,4 @@ }, "timestamp": "2024-02-28T12:03:21.714424" } -} \ No newline at end of file +} diff --git a/subworkflows/nf-core/utils_nfcore_pipeline/tests/main.workflow.nf.test.snap b/subworkflows/nf-core/utils_nfcore_pipeline/tests/main.workflow.nf.test.snap index 859d1030..84ee1e1d 100644 --- a/subworkflows/nf-core/utils_nfcore_pipeline/tests/main.workflow.nf.test.snap +++ b/subworkflows/nf-core/utils_nfcore_pipeline/tests/main.workflow.nf.test.snap @@ -16,4 +16,4 @@ }, "timestamp": "2024-02-28T12:03:25.726491" } -} \ No newline at end of file +} diff --git a/subworkflows/nf-core/utils_nfschema_plugin/main.nf b/subworkflows/nf-core/utils_nfschema_plugin/main.nf index 4994303e..93de2a52 100644 --- a/subworkflows/nf-core/utils_nfschema_plugin/main.nf +++ b/subworkflows/nf-core/utils_nfschema_plugin/main.nf @@ -43,4 +43,3 @@ workflow UTILS_NFSCHEMA_PLUGIN { emit: dummy_emit = true } - diff --git a/subworkflows/nf-core/utils_nfschema_plugin/tests/nextflow.config b/subworkflows/nf-core/utils_nfschema_plugin/tests/nextflow.config index 0907ac58..478fb8a0 100644 --- a/subworkflows/nf-core/utils_nfschema_plugin/tests/nextflow.config +++ b/subworkflows/nf-core/utils_nfschema_plugin/tests/nextflow.config @@ -5,4 +5,4 @@ plugins { validation { parametersSchema = "${projectDir}/subworkflows/nf-core/utils_nfschema_plugin/tests/nextflow_schema.json" monochromeLogs = true -} \ No newline at end of file +} diff --git a/tests/annotation_snapshot.nf.test b/tests/annotation_snapshot.nf.test index 685761fc..7a0495fd 100644 --- a/tests/annotation_snapshot.nf.test +++ b/tests/annotation_snapshot.nf.test @@ -17,7 +17,7 @@ nextflow_pipeline { // sortRows doesn't seem to actual sort these tsvs for some reason, so I manually sorted them def actual = path("${projectDir}/tests/data/owc/annotation/raw_annotations_snapshot.tsv").csv(sep: "\t") def expected = path("${projectDir}/tests/data/owc/annotation/dram1_informed_annotations.tsv").csv(sep: "\t") - + assert actual.columns["query_id"] == expected.columns["query_id"] assert actual.columns["input_fasta"] == expected.columns["input_fasta"] assert actual.columns["start_position"] == expected.columns["start_position"] @@ -26,4 +26,4 @@ nextflow_pipeline { assert actual.columns["heme_regulatory_motif_count"] == expected.columns["heme_regulatory_motif_count"] } } -} \ No newline at end of file +} diff --git a/tests/data/owc/annotation/raw_annotations_snapshot.tsv b/tests/data/owc/annotation/raw_annotations_snapshot.tsv index b3723a04..e0df8d7a 100644 --- a/tests/data/owc/annotation/raw_annotations_snapshot.tsv +++ b/tests/data/owc/annotation/raw_annotations_snapshot.tsv @@ -1,29 +1,29 @@ query_id input_fasta start_position stop_position strandedness rank gene_number kegg_id kegg_EC kegg_bitScore kegg_description kegg_gene_name kofam_id kofam_EC kofam_bitScore kofam_description kofam_score_rank heme_regulatory_motif_count dbcan_id dbcan_EC dbcan_bitScore dbcan_description dbcan_score_rank -OWC_0000_k121_3157_1 OWC_0000 2 580 -1 E 1 0 -OWC_0000_k121_3157_2 OWC_0000 596 997 -1 C 2 K14127 EC:1.8.98.5; EC:1.8.98.6 205.0 barc:AOA65_1889 (K14127) mvhD, vhuD, vhcD; F420-non-reducing hydrogenase iron-sulfur subunit [EC:1.12.99.- 1.8.98.5 1.8.98.6] barc:AOA65_1889 K14127 EC:1.12.99.-; EC:1.8.98.5; EC:1.8.98.6 250.7 F420-non-reducing hydrogenase iron-sulfur subunit [EC:1.12.99.- 1.8.98.5 1.8.98.6] 250.7 0 -OWC_0000_k121_3157_3 OWC_0000 998 4048 -1 A 3 K03388 EC:1.8.7.3; EC:1.8.98.4; EC:1.8.98.5; EC:1.8.98.6 1129.0 barb:AOA66_1510 (K03388) hdrA2; heterodisulfide reductase subunit A2 [EC:1.8.7.3 1.8.98.4 1.8.98.5 1.8.98.6] barb:AOA66_1510 K03388 EC:1.8.7.3; EC:1.8.98.4; EC:1.8.98.5; EC:1.8.98.6 1131.2 heterodisulfide reductase subunit A2 [EC:1.8.7.3 1.8.98.4 1.8.98.5 1.8.98.6] 1131.2 0 -OWC_0000_k121_3157_4 OWC_0000 4059 5147 -1 C 4 K00441 EC:1.12.98.1 260.0 loki:Lokiarch_10850 (K00441) frhB; coenzyme F420 hydrogenase subunit beta [EC:1.12.98.1] loki:Lokiarch_10850 K00441 EC:1.12.98.1 320.1 coenzyme F420 hydrogenase subunit beta [EC:1.12.98.1] 320.1 0 -OWC_0000_k121_3157_5 OWC_0000 5153 6280 -1 C 5 K08264 EC:1.8.98.1 278.0 sfu:Sfum_1801 (K08264) hdrD; heterodisulfide reductase subunit D [EC:1.8.98.1] sfu:Sfum_1801 K08264 EC:1.8.98.1 316.6 heterodisulfide reductase subunit D [EC:1.8.98.1] 316.6 0 -OWC_0000_k121_3157_6 OWC_0000 6496 7005 -1 C 6 166.0 loki:Lokiarch_40200 () loki:Lokiarch_40200 K03388 EC:1.8.7.3; EC:1.8.98.4; EC:1.8.98.5; EC:1.8.98.6 185.8 heterodisulfide reductase subunit A2 [EC:1.8.7.3 1.8.98.4 1.8.98.5 1.8.98.6] 185.8 0 -OWC_0000_k121_43717_1 OWC_0000 150 665 1 C 1 K03388 EC:1.8.7.3; EC:1.8.98.4; EC:1.8.98.5; EC:1.8.98.6 208.0 mif:Metin_0381 (K03388) hdrA2; heterodisulfide reductase subunit A2 [EC:1.8.7.3 1.8.98.4 1.8.98.5 1.8.98.6] mif:Metin_0381 K03388 EC:1.8.7.3; EC:1.8.98.4; EC:1.8.98.5; EC:1.8.98.6 170.9 heterodisulfide reductase subunit A2 [EC:1.8.7.3 1.8.98.4 1.8.98.5 1.8.98.6] 170.9 0 -OWC_0000_k121_43717_2 OWC_0000 831 2024 1 A 2 K03388 EC:1.8.7.3; EC:1.8.98.4; EC:1.8.98.5; EC:1.8.98.6 371.0 mif:Metin_0381 (K03388) hdrA2; heterodisulfide reductase subunit A2 [EC:1.8.7.3 1.8.98.4 1.8.98.5 1.8.98.6] mif:Metin_0381 K03388 EC:1.8.7.3; EC:1.8.98.4; EC:1.8.98.5; EC:1.8.98.6 442.5 heterodisulfide reductase subunit A2 [EC:1.8.7.3 1.8.98.4 1.8.98.5 1.8.98.6] 442.5 0 -OWC_0000_k121_43717_3 OWC_0000 2658 3170 1 C 3 67.0 loki:Lokiarch_09920 () loki:Lokiarch_09920 K00443 EC:1.12.98.1 19.85 coenzyme F420 hydrogenase subunit gamma [EC:1.12.98.1] 39.7 0 -OWC_0001_k121_1650290_1 OWC_0001 3 461 1 E 1 0 -OWC_0001_k121_1650290_2 OWC_0001 820 939 1 E 2 0 -OWC_0001_k121_1650290_3 OWC_0001 1108 2694 1 C 3 273.0 mcj:MCON_0756 () mcj:MCON_0756 K07752 EC:3.4.17.22 21.3 carboxypeptidase D [EC:3.4.17.22] 21.3 0 -OWC_0001_k121_1650290_4 OWC_0001 3766 4008 1 C 4 105.0 metm:MSMTP_1429 () metm:MSMTP_1429 0 -OWC_0001_k121_21365628_1 OWC_0001 3 383 1 E 1 0 -OWC_0001_k121_21365628_10 OWC_0001 6987 8144 -1 C 2 155.0 psyt:DSAG12_00320 () psyt:DSAG12_00320 K05889 EC:1.1.2.6 19.3 polyvinyl alcohol dehydrogenase (cytochrome) [EC:1.1.2.6] 19.3 0 -OWC_0001_k121_21365628_11 OWC_0001 8326 9180 -1 C 3 K09711 177.0 hth:HTH_1873 (K09711) lipS1; lipoyl synthase hth:HTH_1873 K09711 243.8 lipoyl synthase 243.8 0 -OWC_0001_k121_21365628_12 OWC_0001 9168 9434 -1 C 4 65.0 smr:Smar_0192 () smr:Smar_0192 K03800 EC:6.3.1.20 25.8 lipoate---protein ligase [EC:6.3.1.20] 25.8 0 -OWC_0001_k121_21365628_13 OWC_0001 9440 10147 -1 C 5 K03800 EC:6.3.1.20 199.0 agw:QT03_C0001G0351 (K03800) lplA, lplJ, lipL1; lipoate---protein ligase [EC:6.3.1.20] agw:QT03_C0001G0351 K03800 EC:6.3.1.20 219.2 lipoate---protein ligase [EC:6.3.1.20] 219.2 0 -OWC_0001_k121_21365628_14 OWC_0001 10170 11147 -1 C 6 K24689 227.0 thy:A3L12_03680 (K24689) lipS2; lipoyl synthase thy:A3L12_03680 K24689 309.1 lipoyl synthase 309.1 0 -OWC_0001_k121_21365628_15 OWC_0001 11194 11685 -1 E 7 K23356 52.0 HTH-type transcriptional regulator, sugar sensing transcriptional regulator 52.0 0 -OWC_0001_k121_21365628_2 OWC_0001 407 1039 -1 C 8 144.0 ttr:Tter_2727 () ttr:Tter_2727 K03387 EC:1.8.1.- 67.2 NADH-dependent peroxiredoxin subunit F [EC:1.8.1.-] 67.2 0 -OWC_0001_k121_21365628_3 OWC_0001 1162 1665 1 C 9 151.0 cthm:CFE_1764 () cthm:CFE_1764 0 -OWC_0001_k121_21365628_4 OWC_0001 1713 2447 1 C 10 289.0 pbu:L21SP3_00081 () pbu:L21SP3_00081 K05897 EC:1.3.3.16 82.8 oxazoline/thiazoline dehydrogenase [EC:1.3.3.16] 82.8 0 -OWC_0001_k121_21365628_5 OWC_0001 2491 3528 1 A 11 K01990 394.0 kcr:Kcr_0542 (K01990) ABC-2.A; ABC-2 type transport system ATP-binding protein kcr:Kcr_0542 K25144 309.0 linearmycin/streptolysin S transport system ATP-binding protein 309.0 0 -OWC_0001_k121_21365628_6 OWC_0001 3534 4295 1 A 12 K01992 365.0 kcr:Kcr_0543 (K01992) ABC-2.P; ABC-2 type transport system permease protein kcr:Kcr_0543 K18233 132.5 oleandomycin transport system permease protein 132.5 0 -OWC_0001_k121_21365628_7 OWC_0001 4437 4889 1 C 13 86.0 scia:HUG15_04845 () scia:HUG15_04845 K06149 74.2 universal stress protein A 74.2 0 -OWC_0001_k121_21365628_8 OWC_0001 4886 6211 -1 C 14 212.0 tra:Trad_1166 () tra:Trad_1166 K05770 27.1 translocator protein 27.1 0 -OWC_0001_k121_21365628_9 OWC_0001 6269 6772 -1 E 15 K07133 15.3 uncharacterized protein 15.3 0 +OWC_0000_k121_3157_1 OWC_0000 2 580 -1 E 1 0 +OWC_0000_k121_3157_2 OWC_0000 596 997 -1 C 2 K14127 EC:1.8.98.5; EC:1.8.98.6 205.0 barc:AOA65_1889 (K14127) mvhD, vhuD, vhcD; F420-non-reducing hydrogenase iron-sulfur subunit [EC:1.12.99.- 1.8.98.5 1.8.98.6] barc:AOA65_1889 K14127 EC:1.12.99.-; EC:1.8.98.5; EC:1.8.98.6 250.7 F420-non-reducing hydrogenase iron-sulfur subunit [EC:1.12.99.- 1.8.98.5 1.8.98.6] 250.7 0 +OWC_0000_k121_3157_3 OWC_0000 998 4048 -1 A 3 K03388 EC:1.8.7.3; EC:1.8.98.4; EC:1.8.98.5; EC:1.8.98.6 1129.0 barb:AOA66_1510 (K03388) hdrA2; heterodisulfide reductase subunit A2 [EC:1.8.7.3 1.8.98.4 1.8.98.5 1.8.98.6] barb:AOA66_1510 K03388 EC:1.8.7.3; EC:1.8.98.4; EC:1.8.98.5; EC:1.8.98.6 1131.2 heterodisulfide reductase subunit A2 [EC:1.8.7.3 1.8.98.4 1.8.98.5 1.8.98.6] 1131.2 0 +OWC_0000_k121_3157_4 OWC_0000 4059 5147 -1 C 4 K00441 EC:1.12.98.1 260.0 loki:Lokiarch_10850 (K00441) frhB; coenzyme F420 hydrogenase subunit beta [EC:1.12.98.1] loki:Lokiarch_10850 K00441 EC:1.12.98.1 320.1 coenzyme F420 hydrogenase subunit beta [EC:1.12.98.1] 320.1 0 +OWC_0000_k121_3157_5 OWC_0000 5153 6280 -1 C 5 K08264 EC:1.8.98.1 278.0 sfu:Sfum_1801 (K08264) hdrD; heterodisulfide reductase subunit D [EC:1.8.98.1] sfu:Sfum_1801 K08264 EC:1.8.98.1 316.6 heterodisulfide reductase subunit D [EC:1.8.98.1] 316.6 0 +OWC_0000_k121_3157_6 OWC_0000 6496 7005 -1 C 6 166.0 loki:Lokiarch_40200 () loki:Lokiarch_40200 K03388 EC:1.8.7.3; EC:1.8.98.4; EC:1.8.98.5; EC:1.8.98.6 185.8 heterodisulfide reductase subunit A2 [EC:1.8.7.3 1.8.98.4 1.8.98.5 1.8.98.6] 185.8 0 +OWC_0000_k121_43717_1 OWC_0000 150 665 1 C 1 K03388 EC:1.8.7.3; EC:1.8.98.4; EC:1.8.98.5; EC:1.8.98.6 208.0 mif:Metin_0381 (K03388) hdrA2; heterodisulfide reductase subunit A2 [EC:1.8.7.3 1.8.98.4 1.8.98.5 1.8.98.6] mif:Metin_0381 K03388 EC:1.8.7.3; EC:1.8.98.4; EC:1.8.98.5; EC:1.8.98.6 170.9 heterodisulfide reductase subunit A2 [EC:1.8.7.3 1.8.98.4 1.8.98.5 1.8.98.6] 170.9 0 +OWC_0000_k121_43717_2 OWC_0000 831 2024 1 A 2 K03388 EC:1.8.7.3; EC:1.8.98.4; EC:1.8.98.5; EC:1.8.98.6 371.0 mif:Metin_0381 (K03388) hdrA2; heterodisulfide reductase subunit A2 [EC:1.8.7.3 1.8.98.4 1.8.98.5 1.8.98.6] mif:Metin_0381 K03388 EC:1.8.7.3; EC:1.8.98.4; EC:1.8.98.5; EC:1.8.98.6 442.5 heterodisulfide reductase subunit A2 [EC:1.8.7.3 1.8.98.4 1.8.98.5 1.8.98.6] 442.5 0 +OWC_0000_k121_43717_3 OWC_0000 2658 3170 1 C 3 67.0 loki:Lokiarch_09920 () loki:Lokiarch_09920 K00443 EC:1.12.98.1 19.85 coenzyme F420 hydrogenase subunit gamma [EC:1.12.98.1] 39.7 0 +OWC_0001_k121_1650290_1 OWC_0001 3 461 1 E 1 0 +OWC_0001_k121_1650290_2 OWC_0001 820 939 1 E 2 0 +OWC_0001_k121_1650290_3 OWC_0001 1108 2694 1 C 3 273.0 mcj:MCON_0756 () mcj:MCON_0756 K07752 EC:3.4.17.22 21.3 carboxypeptidase D [EC:3.4.17.22] 21.3 0 +OWC_0001_k121_1650290_4 OWC_0001 3766 4008 1 C 4 105.0 metm:MSMTP_1429 () metm:MSMTP_1429 0 +OWC_0001_k121_21365628_1 OWC_0001 3 383 1 E 1 0 +OWC_0001_k121_21365628_10 OWC_0001 6987 8144 -1 C 2 155.0 psyt:DSAG12_00320 () psyt:DSAG12_00320 K05889 EC:1.1.2.6 19.3 polyvinyl alcohol dehydrogenase (cytochrome) [EC:1.1.2.6] 19.3 0 +OWC_0001_k121_21365628_11 OWC_0001 8326 9180 -1 C 3 K09711 177.0 hth:HTH_1873 (K09711) lipS1; lipoyl synthase hth:HTH_1873 K09711 243.8 lipoyl synthase 243.8 0 +OWC_0001_k121_21365628_12 OWC_0001 9168 9434 -1 C 4 65.0 smr:Smar_0192 () smr:Smar_0192 K03800 EC:6.3.1.20 25.8 lipoate---protein ligase [EC:6.3.1.20] 25.8 0 +OWC_0001_k121_21365628_13 OWC_0001 9440 10147 -1 C 5 K03800 EC:6.3.1.20 199.0 agw:QT03_C0001G0351 (K03800) lplA, lplJ, lipL1; lipoate---protein ligase [EC:6.3.1.20] agw:QT03_C0001G0351 K03800 EC:6.3.1.20 219.2 lipoate---protein ligase [EC:6.3.1.20] 219.2 0 +OWC_0001_k121_21365628_14 OWC_0001 10170 11147 -1 C 6 K24689 227.0 thy:A3L12_03680 (K24689) lipS2; lipoyl synthase thy:A3L12_03680 K24689 309.1 lipoyl synthase 309.1 0 +OWC_0001_k121_21365628_15 OWC_0001 11194 11685 -1 E 7 K23356 52.0 HTH-type transcriptional regulator, sugar sensing transcriptional regulator 52.0 0 +OWC_0001_k121_21365628_2 OWC_0001 407 1039 -1 C 8 144.0 ttr:Tter_2727 () ttr:Tter_2727 K03387 EC:1.8.1.- 67.2 NADH-dependent peroxiredoxin subunit F [EC:1.8.1.-] 67.2 0 +OWC_0001_k121_21365628_3 OWC_0001 1162 1665 1 C 9 151.0 cthm:CFE_1764 () cthm:CFE_1764 0 +OWC_0001_k121_21365628_4 OWC_0001 1713 2447 1 C 10 289.0 pbu:L21SP3_00081 () pbu:L21SP3_00081 K05897 EC:1.3.3.16 82.8 oxazoline/thiazoline dehydrogenase [EC:1.3.3.16] 82.8 0 +OWC_0001_k121_21365628_5 OWC_0001 2491 3528 1 A 11 K01990 394.0 kcr:Kcr_0542 (K01990) ABC-2.A; ABC-2 type transport system ATP-binding protein kcr:Kcr_0542 K25144 309.0 linearmycin/streptolysin S transport system ATP-binding protein 309.0 0 +OWC_0001_k121_21365628_6 OWC_0001 3534 4295 1 A 12 K01992 365.0 kcr:Kcr_0543 (K01992) ABC-2.P; ABC-2 type transport system permease protein kcr:Kcr_0543 K18233 132.5 oleandomycin transport system permease protein 132.5 0 +OWC_0001_k121_21365628_7 OWC_0001 4437 4889 1 C 13 86.0 scia:HUG15_04845 () scia:HUG15_04845 K06149 74.2 universal stress protein A 74.2 0 +OWC_0001_k121_21365628_8 OWC_0001 4886 6211 -1 C 14 212.0 tra:Trad_1166 () tra:Trad_1166 K05770 27.1 translocator protein 27.1 0 +OWC_0001_k121_21365628_9 OWC_0001 6269 6772 -1 E 15 K07133 15.3 uncharacterized protein 15.3 0 diff --git a/workflows/dram.nf b/workflows/dram.nf index 957bdf3c..5938f345 100644 --- a/workflows/dram.nf +++ b/workflows/dram.nf @@ -149,7 +149,7 @@ workflow DRAM { def custom_distill_dir = file(distill_custom) if (!custom_distill_dir.exists()) { error "Error: The specified custom_distill sheet (--sum_custom or --distill_custom) does not exist: ${distill_custom}" - } + } } if (params.summarize){ @@ -258,7 +258,7 @@ workflow DRAM { distill_ecosystem, distill_custom ) - + }