From 976c683eb95bcbe8f34dd220c6faa027110c41e7 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Thu, 20 Nov 2025 09:13:16 +0200 Subject: [PATCH 01/19] updated config files, added array size parameter for cluster execution --- conf/base.config | 6 ++++++ nextflow.config | 1 + 2 files changed, 7 insertions(+) diff --git a/conf/base.config b/conf/base.config index 1e69ac57..a8dc5396 100644 --- a/conf/base.config +++ b/conf/base.config @@ -59,8 +59,14 @@ process { withLabel:error_ignore { errorStrategy = 'ignore' } + withLabel:error_retry { errorStrategy = 'retry' maxRetries = 2 } + + withName: 'DRAM:ANNOTATE:CALL:.*|DRAM:ANNOTATE:DB_SEARCH:.*' { + array = params.array_size + } + } diff --git a/nextflow.config b/nextflow.config index fd933daf..38e50edd 100644 --- a/nextflow.config +++ b/nextflow.config @@ -163,6 +163,7 @@ params { /* Process Options */ + array_size = 10 queue_size = 10 // This is the resource requirements for a single process // Not the limit to the total resources available to the pipeline From ef13eed33c6f04bb3ac219aec3b63d23b5bd44aa Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Thu, 20 Nov 2025 09:56:01 +0200 Subject: [PATCH 02/19] updated nextflow.config --- nextflow.config | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/nextflow.config b/nextflow.config index 38e50edd..d776e4b0 100644 --- a/nextflow.config +++ b/nextflow.config @@ -164,7 +164,7 @@ params { /* Process Options */ array_size = 10 - queue_size = 10 + // queue_size = 10 // This is the resource requirements for a single process // Not the limit to the total resources available to the pipeline // Up to queue_size processes can run in parallel, of various sizes From d9a3bc64c9b6b529396d9e0ce3b2e6fc979fe3fe Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Fri, 21 Nov 2025 15:27:13 +0200 Subject: [PATCH 03/19] Swap output assignments for rRNA and tRNA collections --- subworkflows/local/collect_rna.nf | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/subworkflows/local/collect_rna.nf b/subworkflows/local/collect_rna.nf index 16c723a0..7e0d51ce 100644 --- a/subworkflows/local/collect_rna.nf +++ b/subworkflows/local/collect_rna.nf @@ -72,8 +72,8 @@ workflow COLLECT_RNA { // Create sheet for rrnas from the collected rRNAs or provided rRNAs // Run RRNA_COLLECT to generate a combined TSV for all fastas RRNA_COLLECT( ch_collected_rRNAs ) - ch_rrna_sheet = RRNA_COLLECT.out.rrna_collected_out - ch_rrna_combined = RRNA_COLLECT.out.rrna_combined_out + ch_rrna_sheet = RRNA_COLLECT.out.rrna_combined_out + ch_rrna_combined = RRNA_COLLECT.out.rrna_collected_out } else { ch_rrna_sheet = default_sheet ch_rrna_combined = default_sheet @@ -82,8 +82,8 @@ workflow COLLECT_RNA { // Create sheet for trnas from the collected tRNAs or provided tRNAs // Run TRNA_COLLECT to generate a combined TSV for all fastas TRNA_COLLECT( ch_collected_tRNAs ) - ch_trna_sheet = TRNA_COLLECT.out.trna_collected_out - ch_trna_combined = TRNA_COLLECT.out.trna_combined_out + ch_trna_sheet = TRNA_COLLECT.out.trna_combined_out + ch_trna_combined = TRNA_COLLECT.out.trna_collected_out } else { ch_trna_sheet = default_sheet ch_trna_combined = default_sheet @@ -96,4 +96,4 @@ workflow COLLECT_RNA { ch_trna_sheet ch_trna_combined -} \ No newline at end of file +} From 63ea2689e5b9836680ef9e4675d0508953dc642c Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Tue, 25 Nov 2025 14:04:20 +0200 Subject: [PATCH 04/19] Refactor distill script and configuration for improved clarity and functionality - Update groupby_column default value to "input_fasta" in distill.py - Adjust input paths in distill.nf for consistency - Enhance argument handling in SUMMARIZE process --- bin/distill.py | 53 +++++++++++++++----------------- conf/modules.config | 1 + modules/local/distill/distill.nf | 27 ++++++++++------ 3 files changed, 43 insertions(+), 38 deletions(-) diff --git a/bin/distill.py b/bin/distill.py index a6068826..360d791a 100755 --- a/bin/distill.py +++ b/bin/distill.py @@ -27,7 +27,6 @@ DISTILATE_SORT_ORDER_COLUMNS = [COL_HEADER, COL_SUBHEADER, COL_MODULE, COL_GENE_ID] EXCEL_MAX_CELL_SIZE = 32767 -FASTA_COLUMN = os.getenv('FASTA_COLUMN') DISTILL_DIR = Path(__file__).parent / "assets/forms/distill_sheets" @@ -74,7 +73,7 @@ def fill_a_frame(frame: pd.DataFrame): return pd.Series(counts, index=genome_summary_frame.index) - counts = annotations.groupby(groupby_column, sort=False).apply(fill_a_frame) + counts = annotations.groupby(groupby_column, sort=False)[annotations.columns].apply(fill_a_frame) genome_summary_frame = pd.concat([genome_summary_frame, counts.T], axis=1) return genome_summary_frame @@ -99,7 +98,7 @@ def fill_genome_summary_frame_gene_names(annotations, genome_summary_frame, grou return genome_summary_frame -def summarize_rrnas(rrnas_df, groupby_column=FASTA_COLUMN): +def summarize_rrnas(rrnas_df, groupby_column="input_fasta"): genome_rrna_dict = dict() for genome, frame in rrnas_df.groupby(groupby_column): genome_rrna_dict[genome] = Counter(frame['type']) @@ -113,7 +112,7 @@ def summarize_rrnas(rrnas_df, groupby_column=FASTA_COLUMN): return rrna_frame -def make_genome_summary(annotations, genome_summary_frame, logger, groupby_column=FASTA_COLUMN): +def make_genome_summary(annotations, genome_summary_frame, logger, groupby_column="input_fasta"): summary_frames = list() # get ko summaries @@ -159,11 +158,11 @@ def write_summarized_genomes_to_xlsx(summarized_genomes, output_file, extra_fram frame.to_excel(writer, sheet_name=sheet, index=False) for extra_frame in extra_frames: if extra_frame is not None and not extra_frame.empty: - extra_frame.to_excel(writer, sheet_name=extra_frame[COL_SHEET].iloc[0], index=False) + extra_frame.to_excel(writer, sheet_name=extra_frame[COL_HEADER].iloc[0], index=False) # TODO: add assembly stats like N50, longest contig, total assembled length etc -def make_genome_stats(annotations, rrna_frame=None, trna_frame=None, quast_frame=None, groupby_column=FASTA_COLUMN): +def make_genome_stats(annotations, rrna_frame=None, trna_frame=None, quast_frame=None, groupby_column="input_fasta"): rows = list() columns = ['genome'] if 'scaffold' in annotations.columns: @@ -230,19 +229,19 @@ def make_genome_stats(annotations, rrna_frame=None, trna_frame=None, quast_frame @click.command() @click.option("-i", "--input_file", required=True, help="Annotations path") # @click.option("-o", "--output_dir", required=True, help="Directory to write summarized genomes") -@click.option("--rrna_path", help="rRNA output from annotation") -@click.option("--trna_path", help="tRNA output from annotation") -@click.option("--quast_path", help="Quast summary TSV from the quast step") +@click.option("--rrna_path", help="rRNA output from annotation", default=None, type=click.Path(exists=True)) +@click.option("--trna_path", help="tRNA output from annotation", default=None, type=click.Path(exists=True)) +@click.option("--quast_path", help="Quast summary TSV from the quast step", default=None, type=click.Path(exists=True)) @click.option("--groupby_column", help="Column from annotations to group as organism units", - default=FASTA_COLUMN) + default="input_fasta", type = click.STRING) @click.option("--distil_topics", default="default", help="Default distillates topics to run.") @click.option("--distil_ecosystem", default="eng_sys,ag", help="Default distillates ecosystems to run.") -@click.option("--custom_distillate", default=[], callback=validate_comma_separated, help="Custom distillate forms to add your own modules, comma separated. ") +@click.option("--custom_distillate", default="", callback=validate_comma_separated, help="Custom distillate forms to add your own modules, comma separated. ") @click.option("--distillate_gene_names", is_flag=True, show_default=True, default=False, help="Give names of genes instead of counts in genome metabolism summary") -def distill(input_file, rrna_path=None, trna_path=None, quast_path=None, groupby_column=FASTA_COLUMN, distil_topics=None, distil_ecosystem=None, - custom_distillate=None, distillate_gene_names=False): +def distill(input_file, rrna_path, trna_path, quast_path, groupby_column, distil_topics, distil_ecosystem, + custom_distillate, distillate_gene_names): """Summarize metabolic content of annotated genomes""" # make output folder # mkdir(output_dir) @@ -255,24 +254,20 @@ def distill(input_file, rrna_path=None, trna_path=None, quast_path=None, groupby # Check the columns are present check_columns(annotations, logger) - if trna_path is None: - trna_frame = None - else: + trna_frame = None + rrna_frame = None + if all([v is not None for v in [trna_path, rrna_path]]): trna_frame = pd.read_csv(trna_path, sep='\t') - if rrna_path is None: - rrna_frame = None - else: rrna_frame = pd.read_csv(rrna_path, sep='\t') - # Check NF DRAM didn't pass an empty sheet to signal no tRNAs or rRNAs - if rrna_frame.empty: - rrna_frame = None - if trna_frame.empty: - trna_frame = None - - if quast_path is None: - quast_frame = None - else: + if any(v.dropna(how="all").empty for v in [trna_frame, rrna_frame]): + trna_frame = None + rrna_frame = None + + quast_frame = None + if quast_path is not None: quast_frame = pd.read_csv(quast_path, sep='\t') + if quast_frame.dropna(how="all").empty: + quast_frame = None distil_sheets_names = [] if "default" in distil_topics: @@ -322,7 +317,7 @@ def distill(input_file, rrna_path=None, trna_path=None, quast_path=None, groupby genome_summary_form = genome_summary_form.reset_index(drop=True) # make genome stats - genome_stats = make_genome_stats(annotations, rrna_frame, trna_frame, quast_frame=quast_frame, groupby_column=groupby_column) + genome_stats = make_genome_stats(annotations, rrna_frame, trna_frame, quast_frame, groupby_column=groupby_column) genome_stats.to_csv('genome_stats.tsv', sep='\t', index=None) logger.info('Calculated genome statistics') diff --git a/conf/modules.config b/conf/modules.config index 3cdcf759..a867fb63 100644 --- a/conf/modules.config +++ b/conf/modules.config @@ -254,6 +254,7 @@ process { ] } withName: SUMMARIZE { + ext.args = { '--groupby_column "input_fasta"' } publishDir = [ [ path: "${params.outdir}/SUMMARIZE", diff --git a/modules/local/distill/distill.nf b/modules/local/distill/distill.nf index 3c772684..41a9024e 100644 --- a/modules/local/distill/distill.nf +++ b/modules/local/distill/distill.nf @@ -7,10 +7,10 @@ process SUMMARIZE { container "community.wave.seqera.io/library/python_pandas_openpyxl_click_dram-viz:bd6f4fb065d73a68" input: - path( ch_combined_annotations, stageAs: "raw-annotations.tsv" ) - path( ch_rrna_collected, stageAs: "rrna_combined.tsv" ) - path( ch_trna_collected, stageAs: "trna_combined.tsv" ) - path( ch_quast_stats ) + path( combined_annotations, stageAs: "raw-annotations.tsv" ) + path( rrna_collected, stageAs: "rrna_combined.tsv" ) + path( trna_collected, stageAs: "trna_combined.tsv" ) + path( quast_stats ) val( distill_topic ) val( distill_ecosystem ) val( distill_custom ) @@ -22,11 +22,20 @@ process SUMMARIZE { path( "genome_stats.tsv" ), emit: genome_stats script: - """ - # export constants for script - export FASTA_COLUMN="${params.CONSTANTS.FASTA_COLUMN}" - - distill.py -i ${ch_combined_annotations} --rrna_path '${ch_rrna_collected}' --trna_path '${ch_trna_collected}' --distil_topics "${distill_topic}" --distil_ecosystem "${distill_ecosystem}" --custom_distillate "${distill_custom}" --quast_path '${ch_quast_stats}' + def args = task.ext.args ?: "" + def rrna = rrna_collected ? "--rrna_path ${rrna_collected}" : "" + def trna = trna_collected ? "--trna_path ${trna_collected}" : "" + def quast = quast_stats ? "--trna_path ${quast_stats}" : "" """ + distill.py \ + -i ${combined_annotations} \ + ${rrna} \ + ${trna} \ + ${quast} \ + --distil_topics "${distill_topic}" \ + --distil_ecosystem "${distill_ecosystem}" \ + --custom_distillate "${distill_custom}" \ + ${args} + """ } From 74149799f48e05d97d7fa77ecb3ad1aa8448683b Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Wed, 26 Nov 2025 10:41:52 +0200 Subject: [PATCH 05/19] Refactor input and output path definitions for consistency in the SUMMARIZE process --- modules/local/distill/distill.nf | 24 ++++++++++++------------ 1 file changed, 12 insertions(+), 12 deletions(-) diff --git a/modules/local/distill/distill.nf b/modules/local/distill/distill.nf index 41a9024e..94a5b94e 100644 --- a/modules/local/distill/distill.nf +++ b/modules/local/distill/distill.nf @@ -7,25 +7,25 @@ process SUMMARIZE { container "community.wave.seqera.io/library/python_pandas_openpyxl_click_dram-viz:bd6f4fb065d73a68" input: - path( combined_annotations, stageAs: "raw-annotations.tsv" ) - path( rrna_collected, stageAs: "rrna_combined.tsv" ) - path( trna_collected, stageAs: "trna_combined.tsv" ) - path( quast_stats ) - val( distill_topic ) - val( distill_ecosystem ) - val( distill_custom ) + path combined_annotations + path rrna_collected + path trna_collected + path quast_stats + val distill_topic + val distill_ecosystem + val distill_custom output: - path( "metabolism_summary.xlsx" ), emit: distillate - path( "*.log" ), emit: log - path( "summarized_genomes.tsv" ), emit: summarized_genomes - path( "genome_stats.tsv" ), emit: genome_stats + path "metabolism_summary.xlsx", emit: distillate + path "*.log", emit: log + path "summarized_genomes.tsv", emit: summarized_genomes + path "genome_stats.tsv", emit: genome_stats script: def args = task.ext.args ?: "" def rrna = rrna_collected ? "--rrna_path ${rrna_collected}" : "" def trna = trna_collected ? "--trna_path ${trna_collected}" : "" - def quast = quast_stats ? "--trna_path ${quast_stats}" : "" + def quast = quast_stats ? "--quast_path ${quast_stats}" : "" """ distill.py \ From a77c29e8205e302a85ebe8a03e79106962c2a6c8 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Wed, 26 Nov 2025 12:33:07 +0200 Subject: [PATCH 06/19] Fix conditional check for gene columns in genome summary export to prevent errors --- bin/distill.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/bin/distill.py b/bin/distill.py index 360d791a..232a8192 100755 --- a/bin/distill.py +++ b/bin/distill.py @@ -153,8 +153,9 @@ def write_summarized_genomes_to_xlsx(summarized_genomes, output_file, extra_fram frame = frame.sort_values(DISTILATE_SORT_ORDER_COLUMNS) frame = frame.drop([COL_SHEET], axis=1) gene_columns = list(set(frame.columns) - set(CONSTANT_DISTILLATE_COLUMNS)) - split_genes = pd.concat([split_names_to_long(frame[i].astype(str)) for i in gene_columns], axis=1) - frame = pd.concat([frame[CONSTANT_DISTILLATE_COLUMNS], split_genes], axis=1) + if gene_columns: + split_genes = pd.concat([split_names_to_long(frame[i].astype(str)) for i in gene_columns], axis=1) + frame = pd.concat([frame[CONSTANT_DISTILLATE_COLUMNS], split_genes], axis=1) frame.to_excel(writer, sheet_name=sheet, index=False) for extra_frame in extra_frames: if extra_frame is not None and not extra_frame.empty: @@ -199,7 +200,6 @@ def make_genome_stats(annotations, rrna_frame=None, trna_frame=None, quast_frame # Rename the index column to input_fasta (or whatever you want) df_rrna = df_rrna.rename(columns={"index": "genome"}) df_rrna.columns.name = None - print(df_rrna) genome_stats = pd.merge(genome_stats, df_rrna, how="outer", on="genome") if trna_frame is not None: meta_cols = ["gene_id", "gene_description", "category", From e8b0e95c51208b24cff41d23cbdb3e61218ca887 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Wed, 26 Nov 2025 14:27:45 +0200 Subject: [PATCH 07/19] Refactor channel usage for consistency across workflows and improve readability --- subworkflows/local/annotate.nf | 9 +-- subworkflows/local/call.nf | 4 +- subworkflows/local/collect_rna.nf | 8 +-- subworkflows/local/db_search.nf | 115 +++++++++++++++--------------- subworkflows/local/merge.nf | 6 +- subworkflows/local/qc.nf | 8 +-- workflows/dram.nf | 33 ++++----- 7 files changed, 86 insertions(+), 97 deletions(-) diff --git a/subworkflows/local/annotate.nf b/subworkflows/local/annotate.nf index bd30a51b..b231ac73 100644 --- a/subworkflows/local/annotate.nf +++ b/subworkflows/local/annotate.nf @@ -34,8 +34,8 @@ workflow ANNOTATE { ch_combined_annotations = default_sheet if (params.rename || call) { - fasta_name = ch_fasta.map { it[0] } - fasta_files = ch_fasta.map { it[1] } + fasta_name = ch_fasta.map { it-> it[0] } + fasta_files = ch_fasta.map { it -> it[1] } n_fastas = file("$params.input_fasta/${params.fasta_fmt}").size() } @@ -49,10 +49,7 @@ workflow ANNOTATE { // we use flatten here to turn a list back into a channel renamed_fasta_paths = RENAME_FASTA.out.renamed_fasta_paths.flatten() // we need to recreate the fasta channel with the renamed fasta files - ch_fasta = renamed_fasta_paths.map { - fasta_name = it.getBaseName() - tuple(fasta_name, it) - } + ch_fasta = renamed_fasta_paths.map { it -> [ it.getBaseName(), it ] } } ch_quast_stats = default_sheet diff --git a/subworkflows/local/call.nf b/subworkflows/local/call.nf index 74ae33d5..5f7c5dc6 100644 --- a/subworkflows/local/call.nf +++ b/subworkflows/local/call.nf @@ -38,13 +38,13 @@ workflow CALL { .set { ch_collected_faa } // Set the resulting list to ch_collected_faa // Collect all individual fasta to pass to quast - Channel.empty() + channel.empty() .mix( ch_called_genes ) .collect() .set { ch_collected_fna } // Collect all individual fasta to pass to quast - Channel.empty() + channel.empty() .mix( ch_filtered_fasta, ch_gene_gff ) .collect() .set { ch_collected_fasta } diff --git a/subworkflows/local/collect_rna.nf b/subworkflows/local/collect_rna.nf index 9105e83a..2c566b07 100644 --- a/subworkflows/local/collect_rna.nf +++ b/subworkflows/local/collect_rna.nf @@ -33,7 +33,7 @@ workflow COLLECT_RNA { // If we didn't run call if (!call) { if (params.rrnas) { - Channel.fromPath("${params.rrnas}/*.tsv", checkIfExists: true) + channel.fromPath("${params.rrnas}/*.tsv", checkIfExists: true) .ifEmpty { exit 1, "If you specify --distill_ without --call, you must provide individual rRNA files generated with barrnap. Cannot find any files at: ${params.rrnas}\nNB: Path needs to follow pattern: path/to/directory" } .collect() .set { ch_collected_rRNAs } @@ -42,7 +42,7 @@ workflow COLLECT_RNA { } if (params.trnas) { // the user provided rrnas or trnas - Channel.fromPath("${params.trnas}/*.tsv", checkIfExists: true) + channel.fromPath("${params.trnas}/*.tsv", checkIfExists: true) .ifEmpty { exit 1, "If you specify --distill_ without --call, you must provide individual tRNA files generated with tRNAscan-SE. Cannot find any files at: ${params.trnas}\nNB: Path needs to follow pattern: path/to/directory" } .collect() .set { ch_collected_tRNAs } @@ -53,14 +53,14 @@ workflow COLLECT_RNA { TRNA_SCAN( ch_fasta ) ch_trna_scan = TRNA_SCAN.out.trna_scan_out // Collect all input_fasta formatted tRNA files - Channel.empty() + channel.empty() .mix( ch_trna_scan ) .collect() .set { ch_collected_tRNAs } // Run barrnap on each fasta to identify rRNAs RRNA_SCAN( ch_fasta ) ch_rrna_scan = RRNA_SCAN.out.rrna_scan_out - Channel.empty() + channel.empty() .mix( ch_rrna_scan ) .collect() .set { ch_collected_rRNAs } diff --git a/subworkflows/local/db_search.nf b/subworkflows/local/db_search.nf index e93b3498..dc18a662 100644 --- a/subworkflows/local/db_search.nf +++ b/subworkflows/local/db_search.nf @@ -83,7 +83,7 @@ workflow DB_SEARCH { main: - DB_CHANNEL_SETUP( + DB_channel_SETUP( use_kegg, use_kofam, use_dbcan, @@ -125,23 +125,20 @@ workflow DB_SEARCH { if (!call) { - ch_called_proteins = Channel + ch_called_proteins = channel .fromPath(file(params.input_genes) / params.genes_fmt, checkIfExists: true) .ifEmpty { exit 1, "If you specify --annotate without --call, you must provide a fasta file of called genes using --input_genes. Cannot find any called gene fasta files matching: ${params.input_genes}\nNB: Path needs to follow pattern: path/to/directory/" } - .map { - input_fastaName = it.getBaseName() - tuple(input_fastaName, it) + .map { it -> [ it.getBaseName(), it ] } } - GENE_LOCS( ch_called_proteins) ch_gene_locs = GENE_LOCS.out.prodigal_locs_tsv n_fastas = file("$params.input_genes/${params.genes_fmt}").size() } - def formattedOutputChannels = channel.of() + def formattedOutputchannels = channel.of() // Here we will create mmseqs2 index files for each of the inputs if we are going to do a mmseqs2 database - if (DB_CHANNEL_SETUP.out.index_mmseqs) { + if (DB_channel_SETUP.out.index_mmseqs) { // Use MMSEQS2 to index each called genes protein file MMSEQS_INDEX( ch_called_proteins ) ch_mmseqs_query = MMSEQS_INDEX.out.mmseqs_index_out @@ -150,17 +147,17 @@ workflow DB_SEARCH { // KEGG annotation if (use_kegg) { ch_combined_query_locs_kegg = ch_mmseqs_query.join(ch_gene_locs) - MMSEQS_SEARCH_KEGG( ch_combined_query_locs_kegg, DB_CHANNEL_SETUP.out.ch_kegg_db, params.bit_score_threshold, params.rbh_bit_score_threshold, default_sheet, kegg_name ) + MMSEQS_SEARCH_KEGG( ch_combined_query_locs_kegg, DB_channel_SETUP.out.ch_kegg_db, params.bit_score_threshold, params.rbh_bit_score_threshold, default_sheet, kegg_name ) ch_kegg_unformatted = MMSEQS_SEARCH_KEGG.out.mmseqs_search_formatted_out SQL_KEGG(ch_kegg_unformatted, kegg_name, ch_sql_descriptions_db) ch_kegg_formatted = SQL_KEGG.out.sql_formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_kegg_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_kegg_formatted) } // KOFAM annotation if (use_kofam) { - HMM_SEARCH_KOFAM ( ch_called_proteins, params.kofam_e_value, DB_CHANNEL_SETUP.out.ch_kofam_db ) + HMM_SEARCH_KOFAM ( ch_called_proteins, params.kofam_e_value, DB_channel_SETUP.out.ch_kofam_db ) ch_kofam_hmms = HMM_SEARCH_KOFAM.out.hmm_search_out PARSE_HMM_KOFAM ( ch_kofam_hmms ) @@ -170,23 +167,23 @@ workflow DB_SEARCH { KOFAM_HMM_FORMATTER ( ch_combined_hits_locs_kofam, ch_kofam_list ) ch_kofam_formatted = KOFAM_HMM_FORMATTER.out.kofam_formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_kofam_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_kofam_formatted) } // PFAM annotation if (use_pfam) { ch_combined_query_locs_pfam = ch_mmseqs_query.join(ch_gene_locs) - MMSEQS_SEARCH_PFAM( ch_combined_query_locs_pfam, DB_CHANNEL_SETUP.out.ch_pfam_mmseqs_db, params.bit_score_threshold, params.rbh_bit_score_threshold, default_sheet, pfam_name ) + MMSEQS_SEARCH_PFAM( ch_combined_query_locs_pfam, DB_channel_SETUP.out.ch_pfam_mmseqs_db, params.bit_score_threshold, params.rbh_bit_score_threshold, default_sheet, pfam_name ) ch_pfam_unformatted = MMSEQS_SEARCH_PFAM.out.mmseqs_search_formatted_out SQL_PFAM(ch_pfam_unformatted, pfam_name, ch_sql_descriptions_db) ch_pfam_formatted = SQL_PFAM.out.sql_formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_pfam_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_pfam_formatted) } // dbCAN annotation if (use_dbcan) { - HMM_SEARCH_DBCAN ( ch_called_proteins, params.dbcan_e_value , DB_CHANNEL_SETUP.out.ch_dbcan_db) + HMM_SEARCH_DBCAN ( ch_called_proteins, params.dbcan_e_value , DB_channel_SETUP.out.ch_dbcan_db) ch_dbcan_hmms = HMM_SEARCH_DBCAN.out.hmm_search_out PARSE_HMM_DBCAN ( ch_dbcan_hmms ) @@ -196,12 +193,12 @@ workflow DB_SEARCH { DBCAN_HMM_FORMATTER ( ch_combined_hits_locs_dbcan, dbcan_name, ch_sql_descriptions_db ) ch_dbcan_formatted = DBCAN_HMM_FORMATTER.out.sql_formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_dbcan_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_dbcan_formatted) } // CAMPER annotation if (use_camper) { // HMM - HMM_SEARCH_CAMPER ( ch_called_proteins, params.camper_e_value , DB_CHANNEL_SETUP.out.ch_camper_hmm_db) + HMM_SEARCH_CAMPER ( ch_called_proteins, params.camper_e_value , DB_channel_SETUP.out.ch_camper_hmm_db) ch_camper_hmms = HMM_SEARCH_CAMPER.out.hmm_search_out PARSE_HMM_CAMPER ( ch_camper_hmms ) @@ -211,18 +208,18 @@ workflow DB_SEARCH { CAMPER_HMM_FORMATTER ( ch_combined_hits_locs_camper, ch_camper_hmm_list ) ch_camper_hmm_formatted = CAMPER_HMM_FORMATTER.out.camper_formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_camper_hmm_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_camper_hmm_formatted) // MMseqs ch_combined_query_locs_camper = ch_mmseqs_query.join(ch_gene_locs) - MMSEQS_SEARCH_CAMPER( ch_combined_query_locs_camper, DB_CHANNEL_SETUP.out.ch_camper_mmseqs_db, params.bit_score_threshold, params.rbh_bit_score_threshold, DB_CHANNEL_SETUP.out.ch_camper_mmseqs_list, camper_name ) + MMSEQS_SEARCH_CAMPER( ch_combined_query_locs_camper, DB_channel_SETUP.out.ch_camper_mmseqs_db, params.bit_score_threshold, params.rbh_bit_score_threshold, DB_channel_SETUP.out.ch_camper_mmseqs_list, camper_name ) ch_camper_mmseqs_formatted = MMSEQS_SEARCH_CAMPER.out.mmseqs_search_formatted_out - formattedOutputChannels = formattedOutputChannels.mix(ch_camper_mmseqs_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_camper_mmseqs_formatted) } // FeGenie annotation if (use_fegenie) { - HMM_SEARCH_FEGENIE ( ch_called_proteins, params.fegenie_e_value, DB_CHANNEL_SETUP.out.ch_fegenie_db ) + HMM_SEARCH_FEGENIE ( ch_called_proteins, params.fegenie_e_value, DB_channel_SETUP.out.ch_fegenie_db ) ch_fegenie_hmms = HMM_SEARCH_FEGENIE.out.hmm_search_out PARSE_HMM_FEGENIE ( ch_fegenie_hmms ) @@ -231,27 +228,27 @@ workflow DB_SEARCH { ch_combined_hits_locs_fegenie = ch_fegenie_parsed.join(ch_gene_locs) FEGENIE_HMM_FORMATTER ( ch_combined_hits_locs_fegenie ) ch_fegenie_formatted = FEGENIE_HMM_FORMATTER.out.fegenie_formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_fegenie_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_fegenie_formatted) } // Methyl annotation if (use_methyl) { ch_combined_query_locs_methyl = ch_mmseqs_query.join(ch_gene_locs) - MMSEQS_SEARCH_METHYL( ch_combined_query_locs_methyl, DB_CHANNEL_SETUP.out.ch_methyl_db, params.bit_score_threshold, params.rbh_bit_score_threshold, default_sheet, methyl_name ) + MMSEQS_SEARCH_METHYL( ch_combined_query_locs_methyl, DB_channel_SETUP.out.ch_methyl_db, params.bit_score_threshold, params.rbh_bit_score_threshold, default_sheet, methyl_name ) ch_methyl_mmseqs_formatted = MMSEQS_SEARCH_METHYL.out.mmseqs_search_formatted_out - formattedOutputChannels = formattedOutputChannels.mix(ch_methyl_mmseqs_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_methyl_mmseqs_formatted) } // CANT-HYD annotation if (use_canthyd) { // MMseqs ch_combined_query_locs_canthyd = ch_mmseqs_query.join(ch_gene_locs) - MMSEQS_SEARCH_CANTHYD( ch_combined_query_locs_canthyd, DB_CHANNEL_SETUP.out.ch_canthyd_mmseqs_db, params.bit_score_threshold, params.rbh_bit_score_threshold, DB_CHANNEL_SETUP.out.ch_canthyd_mmseqs_list, canthyd_name ) + MMSEQS_SEARCH_CANTHYD( ch_combined_query_locs_canthyd, DB_channel_SETUP.out.ch_canthyd_mmseqs_db, params.bit_score_threshold, params.rbh_bit_score_threshold, DB_channel_SETUP.out.ch_canthyd_mmseqs_list, canthyd_name ) ch_canthyd_mmseqs_formatted = MMSEQS_SEARCH_CANTHYD.out.mmseqs_search_formatted_out - formattedOutputChannels = formattedOutputChannels.mix(ch_canthyd_mmseqs_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_canthyd_mmseqs_formatted) //HMM - HMM_SEARCH_CANTHYD ( ch_called_proteins, params.canthyd_e_value , DB_CHANNEL_SETUP.out.ch_canthyd_hmm_db) + HMM_SEARCH_CANTHYD ( ch_called_proteins, params.canthyd_e_value , DB_channel_SETUP.out.ch_canthyd_hmm_db) ch_canthyd_hmms = HMM_SEARCH_CANTHYD.out.hmm_search_out PARSE_HMM_CANTHYD ( ch_canthyd_hmms ) @@ -261,12 +258,12 @@ workflow DB_SEARCH { CANTHYD_HMM_FORMATTER ( ch_combined_hits_locs_canthyd, ch_canthyd_hmm_list ) ch_canthyd_hmm_formatted = CANTHYD_HMM_FORMATTER.out.canthyd_formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_canthyd_hmm_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_canthyd_hmm_formatted) } // Sulfur annotation if (use_sulfur) { - HMM_SEARCH_SULFUR ( ch_called_proteins, params.sulfur_e_value, DB_CHANNEL_SETUP.out.ch_sulfur_db ) + HMM_SEARCH_SULFUR ( ch_called_proteins, params.sulfur_e_value, DB_channel_SETUP.out.ch_sulfur_db ) ch_sulfur_hmms = HMM_SEARCH_SULFUR.out.hmm_search_out PARSE_HMM_SULFUR ( ch_sulfur_hmms ) @@ -276,33 +273,33 @@ workflow DB_SEARCH { SULFUR_HMM_FORMATTER ( ch_combined_hits_locs_sulfur ) ch_sulfur_formatted = SULFUR_HMM_FORMATTER.out.sulfur_formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_sulfur_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_sulfur_formatted) } // MEROPS annotation if (use_merops) { ch_combined_query_locs_merops = ch_mmseqs_query.join(ch_gene_locs) - MMSEQS_SEARCH_MEROPS( ch_combined_query_locs_merops, DB_CHANNEL_SETUP.out.ch_merops_db, params.bit_score_threshold, params.rbh_bit_score_threshold, default_sheet, merops_name ) + MMSEQS_SEARCH_MEROPS( ch_combined_query_locs_merops, DB_channel_SETUP.out.ch_merops_db, params.bit_score_threshold, params.rbh_bit_score_threshold, default_sheet, merops_name ) ch_merops_unformatted = MMSEQS_SEARCH_MEROPS.out.mmseqs_search_formatted_out SQL_MEROPS(ch_merops_unformatted, merops_name, ch_sql_descriptions_db) ch_merops_formatted = SQL_MEROPS.out.sql_formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_merops_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_merops_formatted) } // Uniref annotation if (use_uniref) { ch_combined_query_locs_uniref = ch_mmseqs_query.join(ch_gene_locs) - MMSEQS_SEARCH_UNIREF( ch_combined_query_locs_uniref, DB_CHANNEL_SETUP.out.ch_uniref_db, params.bit_score_threshold, params.rbh_bit_score_threshold, default_sheet, uniref_name ) + MMSEQS_SEARCH_UNIREF( ch_combined_query_locs_uniref, DB_channel_SETUP.out.ch_uniref_db, params.bit_score_threshold, params.rbh_bit_score_threshold, default_sheet, uniref_name ) ch_uniref_unformatted = MMSEQS_SEARCH_UNIREF.out.mmseqs_search_formatted_out SQL_UNIREF(ch_uniref_unformatted, uniref_name, ch_sql_descriptions_db) ch_uniref_formatted = SQL_UNIREF.out.sql_formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_uniref_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_uniref_formatted) } // VOGdb annotation if (use_vog) { - HMM_SEARCH_VOG ( ch_called_proteins, params.vog_e_value , DB_CHANNEL_SETUP.out.ch_vogdb_db ) + HMM_SEARCH_VOG ( ch_called_proteins, params.vog_e_value , DB_channel_SETUP.out.ch_vogdb_db ) ch_vog_hmms = HMM_SEARCH_VOG.out.hmm_search_out PARSE_HMM_VOG ( ch_vog_hmms ) @@ -312,21 +309,21 @@ workflow DB_SEARCH { VOG_HMM_FORMATTER ( ch_combined_hits_locs_vog, vogdb_name, ch_sql_descriptions_db ) ch_vog_formatted = VOG_HMM_FORMATTER.out.vog_formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_vog_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_vog_formatted) } // Viral annotation if (params.use_viral) { ch_combined_query_locs_viral = ch_mmseqs_query.join(ch_gene_locs) - MMSEQS_SEARCH_VIRAL( ch_combined_query_locs_viral, DB_CHANNEL_SETUP.out.ch_viral_db, params.bit_score_threshold, params.rbh_bit_score_threshold,default_sheet, viral_name ) + MMSEQS_SEARCH_VIRAL( ch_combined_query_locs_viral, DB_channel_SETUP.out.ch_viral_db, params.bit_score_threshold, params.rbh_bit_score_threshold,default_sheet, viral_name ) ch_viral_unformatted = MMSEQS_SEARCH_VIRAL.out.mmseqs_search_formatted_out SQL_VIRAL(ch_viral_unformatted, viral_name, ch_sql_descriptions_db) ch_viral_formatted = SQL_VIRAL.out.sql_formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_viral_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_viral_formatted) } - fastas = formattedOutputChannels.map { it[1] }.collect() - genes = ch_called_proteins.map { it[1] }.collect() + fastas = formattedOutputchannels.map { it -> it[1] }.collect() + genes = ch_called_proteins.map { it -> it[1] }.collect() COMBINE_ANNOTATIONS( fastas, genes ) ch_combined_annotations = COMBINE_ANNOTATIONS.out.combined_annotations_out @@ -337,7 +334,7 @@ workflow DB_SEARCH { } -workflow DB_CHANNEL_SETUP { +workflow DB_channel_SETUP { take: use_kegg use_kofam @@ -356,24 +353,24 @@ workflow DB_CHANNEL_SETUP { main: index_mmseqs = false - ch_kegg_db = Channel.empty() - ch_kofam_db = Channel.empty() - ch_dbcan_db = Channel.empty() - ch_camper_hmm_db = Channel.empty() - ch_camper_mmseqs_db = Channel.empty() - ch_camper_mmseqs_list = Channel.empty() - ch_merops_db = Channel.empty() - ch_pfam_mmseqs_db = Channel.empty() - ch_heme_db = Channel.empty() - ch_sulfur_db = Channel.empty() - ch_uniref_db = Channel.empty() - ch_methyl_db = Channel.empty() - ch_fegenie_db = Channel.empty() - ch_canthyd_hmm_db = Channel.empty() - ch_canthyd_mmseqs_db = Channel.empty() - ch_canthyd_mmseqs_list = Channel.empty() - ch_vogdb_db = Channel.empty() - ch_viral_db = Channel.empty() + ch_kegg_db = channel.empty() + ch_kofam_db = channel.empty() + ch_dbcan_db = channel.empty() + ch_camper_hmm_db = channel.empty() + ch_camper_mmseqs_db = channel.empty() + ch_camper_mmseqs_list = channel.empty() + ch_merops_db = channel.empty() + ch_pfam_mmseqs_db = channel.empty() + ch_heme_db = channel.empty() + ch_sulfur_db = channel.empty() + ch_uniref_db = channel.empty() + ch_methyl_db = channel.empty() + ch_fegenie_db = channel.empty() + ch_canthyd_hmm_db = channel.empty() + ch_canthyd_mmseqs_db = channel.empty() + ch_canthyd_mmseqs_list = channel.empty() + ch_vogdb_db = channel.empty() + ch_viral_db = channel.empty() if (use_kegg) { ch_kegg_db = file(params.kegg_db).exists() ? file(params.kegg_db) : error("Error: If using --annotate, you must supply prebuilt databases. KEGG database file not found at ${params.kegg_db}") diff --git a/subworkflows/local/merge.nf b/subworkflows/local/merge.nf index 8b4f7ece..a14fa940 100644 --- a/subworkflows/local/merge.nf +++ b/subworkflows/local/merge.nf @@ -31,10 +31,10 @@ workflow MERGE { } // Create a channel with the paths to the .tsv files - Channel - .from(tsv_files.collect { annotations_dir.toString() + '/' + it }) + channel + .from(tsv_files.collect { it -> annotations_dir.toString() + '/' + it }) .set { ch_merge_annotations } - Channel.empty() + channel.empty() .mix( ch_merge_annotations ) .collect() .set { ch_merge_annotations_collected } diff --git a/subworkflows/local/qc.nf b/subworkflows/local/qc.nf index 298c4fff..fa397491 100644 --- a/subworkflows/local/qc.nf +++ b/subworkflows/local/qc.nf @@ -49,15 +49,13 @@ workflow QC { if( params.generate_gff || params.generate_gbk ){ if (!call) { - ch_called_genes = Channel + ch_called_genes = channel .fromPath(file(params.input_genes) / params.genes_fna_fmt, checkIfExists: true) .ifEmpty { exit 1, "If you specify --generate_gff or --generate_gbk without --call, you must provide a fasta file of called genes using --input_genes and --genes_fna_fmt,. Cannot find any called gene fasta files matching: ${params.input_genes} and ${params.genes_fna_fmt}\nNB: Path needs to follow pattern: path/to/directory/" } - .map { - input_fastaName = it.getBaseName() - tuple(input_fastaName, it) + .map { it -> [ it.getBaseName(), it ] } } // Collect all individual fasta to pass to quast - Channel.empty() + channel.empty() .mix( ch_called_genes ) .collect() .set { ch_collected_fna } diff --git a/workflows/dram.nf b/workflows/dram.nf index fd4a5fc2..1dd909a0 100644 --- a/workflows/dram.nf +++ b/workflows/dram.nf @@ -37,9 +37,9 @@ workflow DRAM { // Setup // - ch_versions = Channel.empty() - ch_multiqc_files = Channel.empty() - ch_fasta = Channel.empty() + ch_versions = channel.empty() + ch_multiqc_files = channel.empty() + ch_fasta = channel.empty() default_sheet = file(params.distill_dummy_sheet) distill_flag = (params.summarize || params.distill_topic != "" || params.distill_ecosystem != "" || params.distill_custom != "" || params.sum_ecos != "") @@ -61,14 +61,11 @@ workflow DRAM { if (params.rename || call) { - ch_fasta = Channel + ch_fasta = channel .fromPath(file(params.input_fasta) / params.fasta_fmt, checkIfExists: true) .ifEmpty { exit 1, "Cannot find any fasta files matching: ${params.input_fasta}\nNB: Path needs to follow pattern: path/to/directory/" } - ch_fasta = ch_fasta.map { - fasta_name = it.getBaseName() - tuple(fasta_name, it) - } + ch_fasta = ch_fasta.map { it -> [ it.getBaseName(), it ] } } use_kegg = params.use_kegg @@ -85,7 +82,7 @@ workflow DRAM { use_vog = params.use_vog if (params.anno_dbs != "") { - anno_dbs = params.anno_dbs.tokenize(',').collect { it.trim().toLowerCase() } + anno_dbs = params.anno_dbs.tokenize(',').collect { it -> it.trim().toLowerCase() } value_for_all = 'all' use_kegg = getDBFlag(anno_dbs, 'kegg', value_for_all) use_kofam = getDBFlag(anno_dbs, 'kofam', value_for_all) @@ -241,7 +238,7 @@ workflow DRAM { ch_final_annots = ADD_ANNOTATIONS.out.combined_annots_out } } else { // If the user has not specified --annotate, use the provided annotations - ch_final_annots = Channel + ch_final_annots = channel .fromPath(params.annotations, checkIfExists: true) .ifEmpty { exit 1, "If you specify --distill_ without --annotate, you must provide an annotations TSV file (--annotations ) with approprite formatting. Cannot find any called gene files matching: ${params.annotations}\nNB: Path needs to follow pattern: path/to/directory/" } } @@ -263,7 +260,7 @@ workflow DRAM { } else if (params.annotations) { - ch_final_annots = Channel + ch_final_annots = channel .fromPath(params.annotations, checkIfExists: true) .ifEmpty { exit 1, "Parameter annotations problem: Cannot find any called gene files matching: ${params.annotations}\nNB: Path needs to follow pattern: path/to/directory/" } } @@ -293,24 +290,24 @@ workflow DRAM { // // MODULE: MultiQC // - ch_multiqc_config = Channel.fromPath( + ch_multiqc_config = channel.fromPath( "$projectDir/assets/multiqc_config.yml", checkIfExists: true) ch_multiqc_custom_config = params.multiqc_config ? - Channel.fromPath(params.multiqc_config, checkIfExists: true) : - Channel.empty() + channel.fromPath(params.multiqc_config, checkIfExists: true) : + channel.empty() ch_multiqc_logo = params.multiqc_logo ? - Channel.fromPath(params.multiqc_logo, checkIfExists: true) : - Channel.empty() + channel.fromPath(params.multiqc_logo, checkIfExists: true) : + channel.empty() summary_params = paramsSummaryMap( workflow, parameters_schema: "nextflow_schema.json") - ch_workflow_summary = Channel.value(paramsSummaryMultiqc(summary_params)) + ch_workflow_summary = channel.value(paramsSummaryMultiqc(summary_params)) ch_multiqc_files = ch_multiqc_files.mix( ch_workflow_summary.collectFile(name: 'workflow_summary_mqc.yaml')) ch_multiqc_custom_methods_description = params.multiqc_methods_description ? file(params.multiqc_methods_description, checkIfExists: true) : file("$projectDir/assets/methods_description_template.yml", checkIfExists: true) - ch_methods_description = Channel.value( + ch_methods_description = channel.value( methodsDescriptionText(ch_multiqc_custom_methods_description)) ch_multiqc_files = ch_multiqc_files.mix(ch_collated_versions) From 44187394ad3bb31e68992242feb75271515b94e1 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Thu, 27 Nov 2025 11:03:26 +0200 Subject: [PATCH 08/19] Update SUMMARIZE module to use parameterized fasta column for grouping --- conf/modules.config | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/conf/modules.config b/conf/modules.config index a867fb63..342b35f5 100644 --- a/conf/modules.config +++ b/conf/modules.config @@ -254,7 +254,7 @@ process { ] } withName: SUMMARIZE { - ext.args = { '--groupby_column "input_fasta"' } + ext.args = { "--groupby_column ${params.CONSTANTS.FASTA_COLUMN}" } publishDir = [ [ path: "${params.outdir}/SUMMARIZE", From cd3b7ac1ca571b7b6eb153254f11b1f03086e782 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Fri, 28 Nov 2025 10:53:04 +0200 Subject: [PATCH 09/19] Fix closure in QC workflow --- subworkflows/local/qc.nf | 12 ++++++------ 1 file changed, 6 insertions(+), 6 deletions(-) diff --git a/subworkflows/local/qc.nf b/subworkflows/local/qc.nf index fa397491..fe7a5bf8 100644 --- a/subworkflows/local/qc.nf +++ b/subworkflows/local/qc.nf @@ -25,35 +25,35 @@ workflow QC { // Add Bin Quality to annotations - if( params.bin_quality ){ + if ( params.bin_quality ) { ch_bin_quality = file(params.bin_quality) ADD_BIN_QUALITY( ch_combined_annotations, ch_bin_quality ) ch_updated_annots = ADD_BIN_QUALITY.out.annots_bin_quality_out } - else{ + else { ch_updated_annots = ch_combined_annotations } // Add Taxonomy to annotations - if( params.taxa ){ + if ( params.taxa ) { ch_taxa = file(params.taxa) ADD_TAXA( ch_updated_annots, ch_taxa ) ch_updated_taxa_annots = ADD_TAXA.out.annots_taxa_out } - else{ + else { ch_updated_taxa_annots = ch_combined_annotations } ch_final_annots = ch_updated_taxa_annots - if( params.generate_gff || params.generate_gbk ){ + if ( params.generate_gff || params.generate_gbk ) { if (!call) { ch_called_genes = channel .fromPath(file(params.input_genes) / params.genes_fna_fmt, checkIfExists: true) .ifEmpty { exit 1, "If you specify --generate_gff or --generate_gbk without --call, you must provide a fasta file of called genes using --input_genes and --genes_fna_fmt,. Cannot find any called gene fasta files matching: ${params.input_genes} and ${params.genes_fna_fmt}\nNB: Path needs to follow pattern: path/to/directory/" } .map { it -> [ it.getBaseName(), it ] } - } + // Collect all individual fasta to pass to quast channel.empty() .mix( ch_called_genes ) From ed054bdb48531fc6a29b2e71fd21ea12b7130858 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Fri, 28 Nov 2025 10:57:43 +0200 Subject: [PATCH 10/19] Fix closure in DB_SEARCH workflow --- subworkflows/local/db_search.nf | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/subworkflows/local/db_search.nf b/subworkflows/local/db_search.nf index dc18a662..ea65cd01 100644 --- a/subworkflows/local/db_search.nf +++ b/subworkflows/local/db_search.nf @@ -129,7 +129,7 @@ workflow DB_SEARCH { .fromPath(file(params.input_genes) / params.genes_fmt, checkIfExists: true) .ifEmpty { exit 1, "If you specify --annotate without --call, you must provide a fasta file of called genes using --input_genes. Cannot find any called gene fasta files matching: ${params.input_genes}\nNB: Path needs to follow pattern: path/to/directory/" } .map { it -> [ it.getBaseName(), it ] } - } + GENE_LOCS( ch_called_proteins) ch_gene_locs = GENE_LOCS.out.prodigal_locs_tsv n_fastas = file("$params.input_genes/${params.genes_fmt}").size() From d39ff1405e0011c5e678ca4cb13773bdbac7661d Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Mon, 1 Dec 2025 15:14:11 +0200 Subject: [PATCH 11/19] Updated combine_annotations.py to fix binwise summary. TODO: getting rid of FASTA_COLUMN environment variable --- bin/combine_annotations.py | 26 +++++++------------------- 1 file changed, 7 insertions(+), 19 deletions(-) diff --git a/bin/combine_annotations.py b/bin/combine_annotations.py index 3387f868..9029e8ca 100755 --- a/bin/combine_annotations.py +++ b/bin/combine_annotations.py @@ -14,15 +14,14 @@ logger = get_logger(filename=Path(__file__).stem) def read_and_preprocess(path: Path): - # We design input fastas from intermediate steps to be named like: "input_fasta___some_information_annotation_file.tsv" input_fasta = input_fasta_from_filepath(path) try: df = pd.read_csv(path) - df[FASTA_COLUMN] = input_fasta # Add input_fasta column + df[FASTA_COLUMN] = input_fasta return df except Exception as e: logger.error(f"Error loading DataFrame for input_fasta {input_fasta}: {str(e)}") - return pd.DataFrame() # Return an empty DataFrame in case of error + return pd.DataFrame() def input_fasta_from_filepath(file_path: Path): return file_path.stem.split("___")[0] @@ -51,7 +50,6 @@ def count_motifs(gene_faa, motif="(C..CH)", genes_faa_dict=None): for seq in read_sequence(gene_faa, format="fasta"): if seq.metadata["id"] not in genes_faa_dict: genes_faa_dict[seq.metadata["id"]] = {} - genes_faa_dict[seq.metadata["id"]]["heme_regulatory_motif_count"] = len(list(seq.find_with_regex(motif))) return genes_faa_dict @@ -61,12 +59,10 @@ def set_gene_data(gene_faa, genes_faa_dict=None): for seq in read_sequence(gene_faa, format="fasta"): if seq.metadata["id"] not in genes_faa_dict: genes_faa_dict[seq.metadata["id"]] = {} - split_label = seq.metadata["id"].split("_") gene_position = split_label[-1] start_position, end_position, strandedness = seq.metadata["description"].split("#")[1:4] - - genes_faa_dict[seq.metadata["id"]][FASTA_COLUMN] = os.path.commonprefix([Path(gene_faa).stem, seq.metadata["id"]]).rstrip("_") + genes_faa_dict[seq.metadata["id"]][FASTA_COLUMN] = str(Path(gene_faa).stem).replace('_called_genes', '') genes_faa_dict[seq.metadata["id"]]["scaffold"] = ( seq.metadata["id"] .removeprefix(genes_faa_dict[seq.metadata["id"]][FASTA_COLUMN]) @@ -83,16 +79,13 @@ def organize_columns(df, special_columns=None): special_columns = [] base_columns = ['query_id', FASTA_COLUMN, "scaffold", 'gene_number', 'start_position', 'stop_position', 'strandedness', 'rank'] base_columns = [col for col in base_columns if col in df.columns] - kegg_columns = sorted([col for col in df.columns if col.startswith('kegg_')], key=lambda x: (x != 'kegg_id', x)) other_columns = [col for col in df.columns if col not in base_columns + kegg_columns + special_columns] - db_prefixes = set(col.split('_')[0] for col in other_columns) sorted_other_columns = [] for prefix in db_prefixes: prefixed_columns = sorted([col for col in other_columns if col.startswith(prefix + '_')], key=lambda x: (x != f"{prefix}_id", x)) sorted_other_columns.extend(prefixed_columns) - final_columns_order = base_columns + kegg_columns + sorted_other_columns + special_columns return df[final_columns_order] @@ -106,11 +99,10 @@ def combine_annotations(annotations_dir, genes_dir, output, threads): annotations = Path(annotations_dir).glob("*") genes_faa = Path(genes_dir).glob("*") with ThreadPoolExecutor(max_workers=threads) as executor: - # futures = [executor.submit(read_and_preprocess, input_fasta, path) for input_fasta, path in input_fastas_and_paths] futures = [executor.submit(read_and_preprocess, Path(path)) for path in annotations] data_frames = [future.result() for future in as_completed(futures)] - combined_data = pd.concat(data_frames, ignore_index=True) + combined_data = pd.concat([df for df in data_frames if not df.empty], ignore_index=True) if genes_faa: genes_faa_dict = dict() for gene_path in genes_faa: @@ -118,13 +110,9 @@ def combine_annotations(annotations_dir, genes_dir, output, threads): genes_faa_dict count_motifs(gene_path, "(C..CH)", genes_faa_dict=genes_faa_dict) set_gene_data(gene_path, genes_faa_dict) - df = pd.DataFrame.from_dict(genes_faa_dict, orient='index') - combined_data = combined_data.drop(columns=df.columns, errors='ignore') - df.index.name = 'query_id' - - # we use outer to get any genes that don't have hits - combined_data = pd.merge(combined_data, df, how="outer", on="query_id") - combined_data.loc[combined_data[FASTA_COLUMN].isna(), FASTA_COLUMN] = "" + df = pd.DataFrame.from_dict(genes_faa_dict, orient='index').reset_index().rename(columns={'index': 'query_id'}) + combined_data = combined_data.drop(columns=df.columns.difference(["query_id", "scaffold", FASTA_COLUMN]), errors='ignore') + combined_data = pd.merge(combined_data, df, how="outer", on=["query_id", FASTA_COLUMN]) combined_data = convert_bit_scores_to_numeric(combined_data) From 64ab39ea7beb23743f7c11ead73ed8e9bc449791 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Thu, 18 Dec 2025 15:20:22 +0200 Subject: [PATCH 12/19] Add QC:COLLECT_RNA to array pattern --- conf/base.config | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/conf/base.config b/conf/base.config index a8dc5396..460af8ca 100644 --- a/conf/base.config +++ b/conf/base.config @@ -65,7 +65,7 @@ process { maxRetries = 2 } - withName: 'DRAM:ANNOTATE:CALL:.*|DRAM:ANNOTATE:DB_SEARCH:.*' { + withName: 'DRAM:ANNOTATE:CALL:.*|DRAM:ANNOTATE:DB_SEARCH:.*|DRAM:ANNOTATE:QC:COLLECT_RNA:.*' { array = params.array_size } From 23b1a1886bafb0e8acfa3423ba09792b3fd9584b Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Fri, 24 Apr 2026 13:31:15 +0300 Subject: [PATCH 13/19] feat: accept gzip-compressed fasta input Adds a DECOMPRESS_FASTA module (bbtools reformat.sh in the existing bbmap container) and routes only .gz inputs through it via a branch on the fasta channel. Basename stripping is unified so sample.fa and sample.fa.gz produce the same downstream name, keeping outputs identical regardless of input compression. Co-Authored-By: Claude Opus 4.7 (1M context) --- modules/local/rename/decompress_fasta.nf | 20 ++++++++++++++++++++ nextflow_schema.json | 4 ++-- workflows/dram.nf | 17 +++++++++++++++-- 3 files changed, 37 insertions(+), 4 deletions(-) create mode 100644 modules/local/rename/decompress_fasta.nf diff --git a/modules/local/rename/decompress_fasta.nf b/modules/local/rename/decompress_fasta.nf new file mode 100644 index 00000000..c56d57a8 --- /dev/null +++ b/modules/local/rename/decompress_fasta.nf @@ -0,0 +1,20 @@ +process DECOMPRESS_FASTA { + label 'process_tiny' + + tag { name } + + conda "${moduleDir}/environment.yml" + container "community.wave.seqera.io/library/bbmap:801715ef64484762" + + input: + tuple val(name), path(fasta_gz) + + output: + tuple val(name), path("DECOMPRESSED/${name}.fa"), emit: decompressed_fasta + + script: + """ + mkdir -p DECOMPRESSED + reformat.sh in=${fasta_gz} out=DECOMPRESSED/${name}.fa + """ +} diff --git a/nextflow_schema.json b/nextflow_schema.json index 8899dbe0..9f875955 100644 --- a/nextflow_schema.json +++ b/nextflow_schema.json @@ -68,13 +68,13 @@ "format": "path", "exists": true, "description": "Path to FASTA directory", - "help_text": "This parameter is *mandatory*.", + "help_text": "This parameter is *mandatory*. Files may be uncompressed (.fa/.fna/.fasta) or gzip-compressed (.fa.gz/.fna.gz/.fasta.gz); compressed inputs are decompressed automatically.", "fa_icon": "fas fa-folder-open" }, "fasta_fmt": { "type": "string", "default": "*.f*", - "description": "Input format for the FASTA file.", + "description": "Input glob for the FASTA files. The default matches both plain and .gz files.", "fa_icon": "fas fa-plus" }, "input_genes": { diff --git a/workflows/dram.nf b/workflows/dram.nf index bf17269b..4c5ce1e0 100644 --- a/workflows/dram.nf +++ b/workflows/dram.nf @@ -20,6 +20,7 @@ include { MERGE } from "../subworkflows/local/merge.nf" include { ANNOTATE } from "../subworkflows/local/annotate.nf" include { ADD_ANNOTATIONS } from "../modules/local/add_and_combine/add_annotations.nf" include { SUMMARIZE } from "../modules/local/distill/distill.nf" +include { DECOMPRESS_FASTA } from "../modules/local/rename/decompress_fasta.nf" /* @@ -60,11 +61,23 @@ workflow DRAM { if (params.rename || call) { - ch_fasta = channel + ch_fasta_raw = channel .fromPath(file(params.input_fasta) / params.fasta_fmt, checkIfExists: true) .ifEmpty { exit 1, "Cannot find any fasta files matching: ${params.input_fasta}\nNB: Path needs to follow pattern: path/to/directory/" } - ch_fasta = ch_fasta.map { it -> [ it.getBaseName(), it ] } + // Strip .gz (if present) and then .fa/.fna/.fasta so gz and plain inputs yield identical sample names + ch_fasta_named = ch_fasta_raw.map { f -> + def name = f.name.replaceAll(/\.gz$/, '').replaceAll(/\.(fa|fna|fasta)$/, '') + [ name, f ] + } + + ch_fasta_branched = ch_fasta_named.branch { entry -> + gz: entry[1].name.endsWith('.gz') + plain: true + } + + DECOMPRESS_FASTA( ch_fasta_branched.gz ) + ch_fasta = DECOMPRESS_FASTA.out.decompressed_fasta.mix( ch_fasta_branched.plain ) } use_kegg = params.use_kegg From 3059c89ec35af467b07d747be2c4c67002bfa07d Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Fri, 24 Apr 2026 13:33:28 +0300 Subject: [PATCH 14/19] fix: register array_size in schema so it validates It was already defined in nextflow.config (default 10) and consumed by conf/base.config, but absent from nextflow_schema.json, so runs emitted a schema-validation warning. Added alongside queue_size under Process Options. Co-Authored-By: Claude Opus 4.7 (1M context) --- nextflow_schema.json | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/nextflow_schema.json b/nextflow_schema.json index 9f875955..287d848c 100644 --- a/nextflow_schema.json +++ b/nextflow_schema.json @@ -672,6 +672,11 @@ "type": "integer", "default": 10, "description": "Maximum number of jobs to submit to the queue at once." + }, + "array_size": { + "type": "integer", + "default": 10, + "description": "Number of tasks to submit per job array. Set to 0 to disable job arrays (e.g. when running on the local executor, which does not support them)." } } }, From d00f4175fff6e705f19b5af5e1d2db45ce3745da Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Fri, 24 Apr 2026 13:49:00 +0300 Subject: [PATCH 15/19] chore: remove unused trees subsystem and DRAM-v1 legacy setup scripts Drops the never-included trees module and all scripts only it referenced (parse_annotations.py, update_annots_trees.py, color_labels.R), plus update_tree.py which had no references at all. Also removes assets/trees/ refpkgs (only consumed by the dropped module) and the DRAM-v1 standalone DB setup scripts under assets/internal/ which were never wired into the DSL2 pipeline. Co-Authored-By: Claude Opus 4.7 (1M context) --- assets/internal/generate_sql_database.py | 86 - assets/internal/prepare_databases.py | 784 --- .../amoa_pmoa/pmoa_amoa-tree-mapping.tsv | 18 - .../amoa_pmoa/pmoa_amoa_search_terms.txt | 11 - assets/trees/dmso/dmso.refpkg/CONTENTS.json | 26 - .../dmso.refpkg/RAxML_info.dmso_refs.fasta | 423 -- assets/trees/dmso/dmso.refpkg/Untitled 1.csv | 87 - ...nchLabels.dmso_refs.fasta_mode_low.renamed | 1 - .../dmso/dmso.refpkg/dmso-tree-mapping.tsv | 87 - assets/trees/dmso/dmso.refpkg/dmso.aln | 2838 --------- .../dmso/dmso.refpkg/dmso_phylo_model.json | 11 - assets/trees/dmso/dmso.refpkg/dmso_refs.fasta | 917 --- .../dmso/dmso.refpkg/dmso_refs.fasta.model | 581 -- .../dmso/dmso.refpkg/dmso_search_terms.txt | 12 - assets/trees/nar_nxr/nar_nxr-tree-mapping.tsv | 76 - .../nar_nxr/nar_nxr.refpkg/CONTENTS.json | 25 - .../nar_nxr.refpkg/RAxML_info.nar_nxr_raxml | 95 - .../trees/nar_nxr/nar_nxr.refpkg/nar_nxr.tre | 1 - .../nar_nxr_seqs_for_tree_aligned.faa | 5425 ----------------- .../nar_nxr.refpkg/phylo_modelNQB2rG.json | 11 - assets/trees/nar_nxr/nar_nxr.tre | 1 - assets/trees/nar_nxr/nar_nxr_color_map.tsv | 6 - assets/trees/nar_nxr/nar_nxr_search_terms.txt | 13 - .../nar_nxr/nar_nxr_seqs_for_tree_aligned.faa | 5425 ----------------- bin/color_labels.R | 49 - bin/parse_annotations.py | 46 - bin/update_annots_trees.py | 84 - bin/update_tree.py | 49 - modules/local/trees/trees.nf | 92 - 29 files changed, 17280 deletions(-) delete mode 100644 assets/internal/generate_sql_database.py delete mode 100644 assets/internal/prepare_databases.py delete mode 100644 assets/trees/amoa_pmoa/pmoa_amoa-tree-mapping.tsv delete mode 100644 assets/trees/amoa_pmoa/pmoa_amoa_search_terms.txt delete mode 100644 assets/trees/dmso/dmso.refpkg/CONTENTS.json delete mode 100644 assets/trees/dmso/dmso.refpkg/RAxML_info.dmso_refs.fasta delete mode 100644 assets/trees/dmso/dmso.refpkg/Untitled 1.csv delete mode 100644 assets/trees/dmso/dmso.refpkg/bipartitionsBranchLabels.dmso_refs.fasta_mode_low.renamed delete mode 100644 assets/trees/dmso/dmso.refpkg/dmso-tree-mapping.tsv delete mode 100644 assets/trees/dmso/dmso.refpkg/dmso.aln delete mode 100644 assets/trees/dmso/dmso.refpkg/dmso_phylo_model.json delete mode 100644 assets/trees/dmso/dmso.refpkg/dmso_refs.fasta delete mode 100644 assets/trees/dmso/dmso.refpkg/dmso_refs.fasta.model delete mode 100644 assets/trees/dmso/dmso.refpkg/dmso_search_terms.txt delete mode 100644 assets/trees/nar_nxr/nar_nxr-tree-mapping.tsv delete mode 100644 assets/trees/nar_nxr/nar_nxr.refpkg/CONTENTS.json delete mode 100644 assets/trees/nar_nxr/nar_nxr.refpkg/RAxML_info.nar_nxr_raxml delete mode 100644 assets/trees/nar_nxr/nar_nxr.refpkg/nar_nxr.tre delete mode 100644 assets/trees/nar_nxr/nar_nxr.refpkg/nar_nxr_seqs_for_tree_aligned.faa delete mode 100644 assets/trees/nar_nxr/nar_nxr.refpkg/phylo_modelNQB2rG.json delete mode 100644 assets/trees/nar_nxr/nar_nxr.tre delete mode 100644 assets/trees/nar_nxr/nar_nxr_color_map.tsv delete mode 100644 assets/trees/nar_nxr/nar_nxr_search_terms.txt delete mode 100644 assets/trees/nar_nxr/nar_nxr_seqs_for_tree_aligned.faa delete mode 100755 bin/color_labels.R delete mode 100755 bin/parse_annotations.py delete mode 100755 bin/update_annots_trees.py delete mode 100755 bin/update_tree.py delete mode 100644 modules/local/trees/trees.nf diff --git a/assets/internal/generate_sql_database.py b/assets/internal/generate_sql_database.py deleted file mode 100644 index e7d26490..00000000 --- a/assets/internal/generate_sql_database.py +++ /dev/null @@ -1,86 +0,0 @@ -import os -import sqlite3 -import argparse - -def insert_data(conn, table_name, data): - placeholders = ', '.join(['?'] * len(data[0])) - query = f"INSERT OR REPLACE INTO {table_name} VALUES ({placeholders})" - conn.executemany(query, data) - conn.commit() - -def process_dbcan(db_dir): - description_file = os.path.join(db_dir, 'dbcan.fam-activities.tsv') - ec_file = os.path.join(db_dir, 'dbcan.fam.subfam.ec.tsv') - - descriptions = {} - ecs = {} - skipped_lines = [] - - # Process descriptions - with open(description_file) as f: - for line in f: - if line.startswith('#') or not line.strip(): - continue - parts = line.strip().split('\t') - if len(parts) >= 2: - descriptions[parts[0]] = ' '.join(parts[1:]) - elif len(parts) == 1: - descriptions[parts[0]] = "No description available" - else: - skipped_lines.append(f"Skipped line in description file: {line.strip()} (expected at least 2 columns, found {len(parts)})") - - # Process EC numbers - with open(ec_file) as f: - for line in f: - parts = line.strip().split('\t') - if len(parts) > 2: - ecs[parts[0]] = ecs.get(parts[0], set()) - ecs[parts[0]].add(parts[2]) - - data = [] - for entry in descriptions: - ec = ','.join(ecs.get(entry, [])) - data.append((entry, descriptions[entry], ec)) - - return data, skipped_lines - -def main(): - parser = argparse.ArgumentParser(description="Generate descriptions database for DRAM.") - parser.add_argument('--db_dir', required=True, help="Directory containing the database subdirectories.") - parser.add_argument('--output_db', required=True, help="Path to the output SQLite database.") - parser.add_argument('--log', required=True, help="Path to the log file.") - - args = parser.parse_args() - - log_entries = [] - db_dir = args.db_dir - output_db = args.output_db - - conn = sqlite3.connect(output_db) - log_entries.append(f"Opened database {output_db}") - - dbcan_dir = os.path.join(db_dir, 'dbcan') - if os.path.exists(dbcan_dir): - conn.execute(""" - CREATE TABLE IF NOT EXISTS dbcan_description ( - id VARCHAR(30) NOT NULL, - description VARCHAR(1000), - ec VARCHAR(1000), - PRIMARY KEY (id) - ); - """) - log_entries.append("Processing dbcan_description from " + dbcan_dir) - data, skipped_lines = process_dbcan(dbcan_dir) - insert_data(conn, 'dbcan_description', data) - log_entries.append(f"Inserted {len(data)} records into dbcan_description") - log_entries.extend(skipped_lines) - - with open(args.log, 'w') as log_file: - for entry in log_entries: - log_file.write(entry + '\n') - - conn.close() - log_entries.append("Closed database connection") - -if __name__ == "__main__": - main() \ No newline at end of file diff --git a/assets/internal/prepare_databases.py b/assets/internal/prepare_databases.py deleted file mode 100644 index 42a113d8..00000000 --- a/assets/internal/prepare_databases.py +++ /dev/null @@ -1,784 +0,0 @@ -import os -import subprocess -from os import path, mkdir -import argparse -import shutil -from shutil import move, rmtree -from glob import glob -import requests - -DEFAULT_THREADS = 1 - -# Define database URLs -database_urls = { - "dbcan": { - "hmm_url": "https://bcb.unl.edu/dbCAN2/download/Databases/V12/dbCAN-HMMdb-V12.txt", - "family_url": "https://bcb.unl.edu/dbCAN2/download/Databases/V12/CAZyDB.08062022.fam.subfam.ec.txt", - "subfamily_url": "https://bcb.unl.edu/dbCAN2/download/Databases/V12/CAZyDB.08062022.fam-activities.txt" - }, - "cant_hyd": { - "base_url": "https://api.github.com/repos/dgittins/CANT-HYD-HydrocarbonBiodegradation/contents/HMMs/concatenated%20HMMs", - }, - "camper": { - "hmm_url": "https://raw.githubusercontent.com/WrightonLabCSU/CAMPER/main/CAMPER.hmm", - "faa_url": "https://raw.githubusercontent.com/WrightonLabCSU/CAMPER/main/CAMPER_blast.faa", - "mmseq_scores_url": "https://raw.githubusercontent.com/WrightonLabCSU/CAMPER/main/CAMPER_blast_scores.tsv", - "hmm_scores_url": "https://raw.githubusercontent.com/WrightonLabCSU/CAMPER/main/CAMPER_hmm_scores.tsv" - }, - "vogdb": { - "hmm_url": "https://fileshare.lisc.univie.ac.at/vog/latest/vog.hmm.tar.gz", - "annotations_url": "https://fileshare.lisc.univie.ac.at/vog/latest/vog.annotations.tsv.gz" - }, - "pfam": { - "hmm_url": "ftp://ftp.ebi.ac.uk/pub/databases/Pfam/current_release/Pfam-A.hmm.dat.gz", - "mmseq_url": "ftp://ftp.ebi.ac.uk/pub/databases/Pfam/current_release/Pfam-A.full.gz" - }, - "merops": { - "mmseqs_url": "ftp://ftp.ebi.ac.uk/pub/databases/merops/current_release/pepunit.lib" - }, - "kofam": { - "hmm_url": "ftp://ftp.genome.jp/pub/db/kofam/profiles.tar.gz", - "ko_list_url": "ftp://ftp.genome.jp/pub/db/kofam/ko_list.gz" - }, - "fegenie": { - "base_url": "https://api.github.com/repos/Arkadiy-Garber/FeGenie/contents/hmms/iron/", - "directories": [ - "iron_aquisition-heme_oxygenase", - "iron_aquisition-heme_transport", - "iron_aquisition-iron_transport", - "iron_aquisition-siderophore_synthesis", - "iron_aquisition-siderophore_transport", - "iron_aquisition-siderophore_transport_potential", - "iron_gene_regulation", - "iron_oxidation", - "iron_storage", - "iron_reduction", - "magnetosome_formation" - ], - "files": [ - "HMM-bitcutoffs.txt" - ] - }, - "sulfur": { - "hmm_path": "/home/reedrich/Wrighton-Lab/Projects/DRAM-Main-Main-Project/DRAM2/DRAM-2-Nextflow/databases/sulfur/sulfur.hmm" - }, - "methyl": { - "faa_path": "/home/reedrich/Wrighton-Lab/Projects/DRAM-Main-Main-Project/DRAM2/DRAM-2-Nextflow/databases/methyl/methylotrophy.faa" - } -} - -# Define rename_mapping dictionaries for each database -rename_mapping_dbcan = { - "hmm_url": "dbcan.hmm", - "family_url": "dbcan.fam-activities.tsv", - "subfamily_url": "dbcan.fam.subfam.ec.tsv" -} - -rename_mapping_cant_hyd = { - "hmm_file": "cant_hyd.hmm" -} - -rename_mapping_camper = { - "CAMPER.hmm": "hmm/camper.hmm", - "CAMPER_blast.faa": "mmseqs/camper_blast.faa", - "CAMPER_blast_scores.tsv": "mmseqs/camper_blast_scores.tsv", - "CAMPER_hmm_scores.tsv": "hmm/camper_hmm_scores.tsv" -} - -rename_mapping_vogdb = { - "hmm_url": "vog_latest_hmms.hmm", - "annotations_url": "vog_annotations_latest.tsv.gz" -} - -rename_mapping_pfam = { - "Pfam-A.hmm.dat.gz": "hmm/Pfam-A.hmm.dat", - "Pfam-A.full.gz": "mmseqs/Pfam-A.full.gz" -} - -rename_mapping_merops = { - "pepunit.lib": "mmseqs/merops_peptidases_nr.faa", -} - -rename_mapping_kofam = { - "hmm_url": "kofam_profiles.hmm", - "ko_list": "kofam_ko_list.tsv" -} - -rename_mapping_fegenie = { - "hmm_file": "fegenie.hmm", - "HMM-bitcutoffs.txt": "fegenie_iron_cut_offs.txt", -} - -rename_mapping_sulfur = { - "hmm_file": "sulfur.hmm" -} - -rename_mapping_methyl = { - "hmm_file": "methyl.faa" -} - -def download_cant_hyd_files(output_dir): - base_url = database_urls["cant_hyd"]["base_url"] - response = requests.get(base_url) - - if response.status_code == 200: - files = response.json() - for file in files: - if file["type"] == "file" and file["name"] == "CANT-HYD.hmm": - download_url = file["download_url"] - file_name = "cant_hyd.hmm" # Rename the file to cant_hyd.hmm - download_file_path = path.join(output_dir, file_name) - - file_response = requests.get(download_url) - if file_response.status_code == 200: - with open(download_file_path, "wb") as f: - f.write(file_response.content) - print(f"Downloaded file: {file_name}") - else: - print(f"Failed to download file: {file_name}. Status code: {file_response.status_code}") - else: - print(f"Failed to fetch file list from GitHub. Status code: {response.status_code}") - - print("cant_hyd files downloaded successfully.") - -def download_fegenie_files(output_dir): - repo_url = "https://github.com/Arkadiy-Garber/FeGenie.git" - fegenie_dir = path.join(output_dir, "FeGenie") - - # Remove the directory and its contents if it exists - if path.exists(fegenie_dir): - print(f"Removing contents of the directory {fegenie_dir}.") - shutil.rmtree(fegenie_dir) - - # Clone the FeGenie repository - git_clone_repo(repo_url, fegenie_dir) - - # Move the contents of the cloned repository to the output directory - for item in os.listdir(fegenie_dir): - item_path = path.join(fegenie_dir, item) - destination_path = path.join(output_dir, item) - - # Move the item to the destination directory - if path.exists(destination_path): - if path.isdir(destination_path): - shutil.rmtree(destination_path) - else: - os.remove(destination_path) - move(item_path, output_dir) - print(f"Moved {item} to {output_dir}") - - # Move and rename HMM-bitcutoffs.txt - bitcutoffs_src = path.join(output_dir, "iron", "HMM-bitcutoffs.txt") - bitcutoffs_dst = path.join(output_dir, "fegenie_iron_cut_offs.txt") - if path.exists(bitcutoffs_src): - move(bitcutoffs_src, bitcutoffs_dst) - print(f"Moved and renamed HMM-bitcutoffs.txt to {bitcutoffs_dst}") - - # Remove the cloned repository directory - rmtree(fegenie_dir) - - print("FeGenie files downloaded successfully.") - - -def download_fegenie_file(base_url, file_name, output_dir): - """ - Download a file from the FeGenie repository. - - Args: - base_url (str): The base URL of the FeGenie repository. - file_name (str): The name of the file to download. - output_dir (str): The directory where the downloaded file will be saved. - """ - download_url = f"{base_url}/{file_name}" - download_file_path = path.join(output_dir, file_name) - - # Send a GET request to the download URL - response = requests.get(download_url) - - if response.status_code == 200: - # Write the content of the response to the file - with open(download_file_path, "wb") as file: - file.write(response.content) - print(f"Downloaded file: {file_name}") - else: - print(f"Failed to download file: {file_name}. Status code: {response.status_code}") - -def download_databases(output_dir, databases): - for database in databases: - if database in database_urls: - urls = database_urls[database] - database_output_dir = path.join(output_dir, database) - if not path.exists(database_output_dir): - mkdir(database_output_dir) - - if database == "fegenie": - download_fegenie_files(database_output_dir) - elif database == "sulfur" or database == "methyl": - continue # Skip downloading for sulfur and methyl - elif database == "dbcan": - for url_key, url_value in urls.items(): - download_url = url_value # Get the download URL from the dictionary - download_file_name = path.basename(download_url) # Extract the file name from the URL - download_file_path = path.join(database_output_dir, download_file_name) - - # Download the file using curl - curl_command = f"curl -L -o {download_file_path} {download_url}" - subprocess.run(curl_command, shell=True, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) - - print(f"Downloaded file: {download_file_name}") - elif database == "cant_hyd": - download_cant_hyd_files(database_output_dir) - elif database == "kofam": - for url_key, url_value in urls.items(): - download_url = url_value # Get the download URL from the dictionary - download_file_name = path.basename(download_url) # Extract the file name from the URL - download_file_path = path.join(database_output_dir, download_file_name) - - # Download the file using curl - curl_command = f"curl -L -o {download_file_path} {download_url}" - subprocess.run(curl_command, shell=True, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) - - print(f"Downloaded file: {download_file_name}") - else: - for url_key, url_value in urls.items(): - download_url = urls[url_key] # Get the download URL from the dictionary - download_file_name = path.basename(download_url) # Extract the file name from the URL - download_file_path = path.join(database_output_dir, download_file_name) - - # Download the file using curl - curl_command = f"curl -L -o {download_file_path} {download_url}" - subprocess.run(curl_command, shell=True, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) - - print(f"Downloaded file: {download_file_name}") - - print(f"All files downloaded for {database} database.") - else: - print(f"URLs for {database} database are not defined. Skipping.") - -def process_vogdb_database(database_file, output_dir, num_threads=1): - print("Processing VogDB database...") - if path.exists(database_file): - # Extract the downloaded tar.gz file - tar_command = f"tar -xzf {database_file} -C {output_dir}" - subprocess.run(tar_command, shell=True, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) - - # Locate the .gz file in the extracted directory (if any) - hmm_files = glob(path.join(output_dir, "hmm", "*.hmm.gz")) - print("Extracted .hmm.gz files:", hmm_files) - - # Decompress each .hmm.gz file using pigz - for hmm_file in hmm_files: - decompress_command = f"pigz -d -p {num_threads} {hmm_file}" - subprocess.run(decompress_command, shell=True, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) - print(f"Decompressed file: {hmm_file}") - - print("VogDB processed successfully.") - else: - print("VogDB file not found. Skipping processing.") - -def process_camper_database(output_dir): - print("Processing Camper database...") - - for original_file, new_file in rename_mapping_camper.items(): - original_path = path.join(output_dir, original_file) - new_path = path.join(output_dir, new_file) - new_dir = path.dirname(new_path) - - # Create target directory if it doesn't exist - if not path.exists(new_dir): - os.makedirs(new_dir) - - if path.exists(original_path): - move(original_path, new_path) - print(f"File {original_file} renamed and moved to {new_path}") - else: - print(f"File {original_file} not found. Skipping.") - - # Index the HMM file - hmm_file = path.join(output_dir, "hmm", "camper.hmm") - try: - index_hmm(path.join(output_dir, "hmm"), hmm_file) - except subprocess.CalledProcessError as e: - print(f"Error running hmmpress on {hmm_file}: {e}") - - # Rename MMseqs files to follow the desired naming scheme - mmseqs_dir = path.join(output_dir, "mmseqs") - mmseqs_files = { - "camper_blast_scores.tsv": "camper_scores.tsv" - } - for old_name, new_name in mmseqs_files.items(): - old_path = path.join(mmseqs_dir, old_name) - new_path = path.join(mmseqs_dir, new_name) - if path.exists(old_path): - move(old_path, new_path) - print(f"File {old_name} renamed and moved to {new_path}") - else: - print(f"File {old_name} not found. Skipping.") - - print("Camper processed successfully.") - -def process_pfam_database(output_dir, num_threads=1): - print("Processing Pfam database...") - - for original_file, new_file in rename_mapping_pfam.items(): - original_path = path.join(output_dir, original_file) - new_path = path.join(output_dir, new_file) - new_dir = path.dirname(new_path) - - # Create target directory if it doesn't exist - if not path.exists(new_dir): - os.makedirs(new_dir) - - if path.exists(original_path): - if original_file.endswith(".gz"): - decompress_command = f"pigz -d -p {num_threads} {original_path}" - subprocess.run(decompress_command, shell=True, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) - original_path = original_path[:-3] # Remove .gz extension after decompression - move(original_path, new_path) - print(f"File {original_file} decompressed (if needed), renamed and moved to {new_path}") - else: - print(f"File {original_file} not found. Skipping.") - - print("Pfam processed successfully.") - -def process_merops_database(output_dir, num_threads=1): - print("Processing Merops database...") - - for original_file, new_file in rename_mapping_merops.items(): - original_path = path.join(output_dir, original_file) - new_path = path.join(output_dir, new_file) - new_dir = path.dirname(new_path) - - # Create target directory if it doesn't exist - if not path.exists(new_dir): - os.makedirs(new_dir) - - if path.exists(original_path): - move(original_path, new_path) - print(f"File {original_file} renamed and moved to {new_path}") - else: - print(f"File {original_file} not found. Skipping.") - - print("Merops processed successfully.") - - # Create the MMseqs2 database - create_mmseqs(new_path, new_path + "_db", num_threads) - -def process_fegenie_database(output_dir): - print("Processing FeGenie database...") - - # Download and prepare FeGenie files - download_fegenie_files(output_dir) - - # Concatenate all .hmm files into a single file - hmm_output_file = path.join(output_dir, "fegenie.hmm") - concatenate_hmm_files(output_dir, hmm_output_file) - - # Sanitize the concatenated HMM file - sanitized_hmm_file = path.join(output_dir, "sanitized_fegenie.hmm") - sanitize_hmm_file(hmm_output_file, sanitized_hmm_file) - - # Move the sanitized HMM file to replace the original one - final_hmm_file = path.join(output_dir, "fegenie.hmm") - os.remove(hmm_output_file) - move(sanitized_hmm_file, final_hmm_file) - - # Index the sanitized HMM file - try: - index_hmm(output_dir, final_hmm_file) - except subprocess.CalledProcessError as e: - print(f"Error running hmmpress: {e}") - print("Please check the format of the sanitized concatenated HMM file.") - - # Remove the directories after concatenation - directories = database_urls["fegenie"]["directories"] - for directory in directories: - dir_path = path.join(output_dir, directory) - if path.exists(dir_path): - rmtree(dir_path) - print(f"Removed directory: {dir_path}") - - # Delete all files except fegenie.hmm, fegenie.hmm index files, and fegenie_iron_cut_offs.txt - for file in os.listdir(output_dir): - if not (file.startswith("fegenie.hmm") or file == "fegenie_iron_cut_offs.txt"): - file_path = path.join(output_dir, file) - if path.isdir(file_path): - rmtree(file_path) - else: - os.remove(file_path) - print(f"Removed file: {file_path}") - - print("FeGenie processed successfully.") - - - -def process_sulfur_database(output_dir): - print("Processing Sulfur database...") - sulfur_hmm_path = database_urls["sulfur"]["hmm_path"] - - # Create the sulfur output directory if it doesn't exist - if not path.exists(output_dir): - mkdir(output_dir) - - # Move the sulfur HMM file to the sulfur output directory - destination_path = path.join(output_dir, path.basename(sulfur_hmm_path)) - shutil.copyfile(sulfur_hmm_path, destination_path) - print(f"Copied sulfur HMM file to: {destination_path}") - - # Index the HMM file - try: - index_hmm(output_dir, output_dir) - except subprocess.CalledProcessError as e: - print(f"Error running hmmpress: {e}") - print("Please check the format of the sulfur HMM file.") - - print("Sulfur processed successfully.") - -def process_methyl_database(output_dir, num_threads=1): - print("Processing Methyl database...") - - # Paths for methyl database files - methyl_faa_path = database_urls["methyl"]["faa_path"] - methyl_faa_dest = path.join(output_dir, "methyl.faa") - - # Create the output directory if it doesn't exist - if not path.exists(output_dir): - mkdir(output_dir) - - # Copy the methyl .faa file to the output directory - shutil.copyfile(methyl_faa_path, methyl_faa_dest) - print(f"Copied methyl .faa file to: {methyl_faa_dest}") - - print("Methyl processed successfully.") - -def process_cant_hyd_database(output_dir): - print("Processing cant_hyd database...") - repo_url = "https://github.com/dgittins/CANT-HYD-HydrocarbonBiodegradation.git" - cant_hyd_dir = path.join(output_dir, "cant_hyd_repo") - hmm_dir = path.join(output_dir, "hmm") - - # Remove the directory and its contents if it exists - if path.exists(cant_hyd_dir): - print(f"Removing contents of the directory {cant_hyd_dir}.") - shutil.rmtree(cant_hyd_dir) - - # Clone the cant_hyd repository - git_clone_repo(repo_url, cant_hyd_dir) - - # Create the hmm subdirectory if it doesn't exist - if not path.exists(hmm_dir): - os.makedirs(hmm_dir) - - # Move the concatenated HMM file to the hmm subdirectory - concatenated_hmm_path = path.join(cant_hyd_dir, "HMMs", "concatenated HMMs", "CANT-HYD.hmm") - final_hmm_path = path.join(hmm_dir, "cant_hyd.hmm") - if path.exists(concatenated_hmm_path): - move(concatenated_hmm_path, final_hmm_path) - print(f"Moved CANT-HYD.hmm to {final_hmm_path}") - else: - print(f"Concatenated HMM file not found in the repository.") - - # Remove the cloned repository directory - rmtree(cant_hyd_dir) - - # Index the HMM file - try: - index_hmm(hmm_dir, final_hmm_path) - except subprocess.CalledProcessError as e: - print(f"Error running hmmpress: {e}") - print("Please check the format of the cant_hyd HMM file.") - - # Ensure no extra cant_hyd.hmm files persist outside the hmm subdirectory - if path.exists(path.join(output_dir, "cant_hyd.hmm")): - os.remove(path.join(output_dir, "cant_hyd.hmm")) - print("Removed extraneous cant_hyd.hmm from the output directory.") - - print("cant_hyd processed successfully.") - -def process_dbcan_database(output_dir): - print("Processing dbcan database...") - rename_mapping = { - "dbCAN-HMMdb-V12.txt": "dbcan.hmm", - "CAZyDB.08062022.fam.subfam.ec.txt": "dbcan.fam.subfam.ec.tsv", - "CAZyDB.08062022.fam-activities.txt": "dbcan.fam-activities.tsv" - } - - for original_file, new_file in rename_mapping.items(): - original_path = path.join(output_dir, original_file) - new_path = path.join(output_dir, new_file) - new_dir = path.dirname(new_path) - - # Create target directory if it doesn't exist - if not path.exists(new_dir): - os.makedirs(new_dir) - - if path.exists(original_path): - move(original_path, new_path) - print(f"File {original_file} renamed and moved to {new_path}") - else: - print(f"File {original_file} not found. Skipping.") - - # Index the HMM file - try: - index_hmm(output_dir, path.join(output_dir, "dbcan.hmm")) - except subprocess.CalledProcessError as e: - print(f"Error running hmmpress: {e}") - print("Please check the format of the dbcan HMM file.") - - print("dbcan processed successfully.") - -def process_kofam_database(output_dir, num_threads=1): - print("Processing kofam database...") - hmm_dir = path.join(output_dir, "hmm") - - # Create the hmm subdirectory if it doesn't exist - if not path.exists(hmm_dir): - os.makedirs(hmm_dir) - - # Extract the profiles.tar.gz file - profiles_tar_path = path.join(output_dir, "profiles.tar.gz") - if path.exists(profiles_tar_path): - tar_command = f"tar -xzf {profiles_tar_path} -C {hmm_dir}" - subprocess.run(tar_command, shell=True, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) - print(f"Extracted {profiles_tar_path} to {hmm_dir}") - else: - print("Profiles tar file not found. Skipping extraction.") - - # Decompress ko_list.gz and rename - ko_list_path = path.join(output_dir, "ko_list.gz") - if path.exists(ko_list_path): - decompress_command = f"pigz -d -p {num_threads} {ko_list_path}" - subprocess.run(decompress_command, shell=True, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) - ko_list_path = ko_list_path[:-3] # Remove .gz extension after decompression - move(ko_list_path, path.join(output_dir, "kofam_ko_list.tsv")) - print(f"Decompressed and renamed ko_list to kofam_ko_list.tsv") - else: - print("ko_list.gz file not found. Skipping decompression.") - - # Concatenate all HMM files into a single file - kofam_hmm_file = path.join(output_dir, "kofam_profiles.hmm") - concatenate_hmm_files(hmm_dir, kofam_hmm_file) - - # Index the concatenated HMM file - try: - index_hmm(output_dir, kofam_hmm_file) - except subprocess.CalledProcessError as e: - print(f"Error running hmmpress on {kofam_hmm_file}: {e}") - print("Please check the format of the kofam HMM files.") - - # Remove the hmm directory and profiles.tar.gz file - if path.exists(hmm_dir): - rmtree(hmm_dir) - print(f"Removed directory: {hmm_dir}") - if path.exists(profiles_tar_path): - os.remove(profiles_tar_path) - print(f"Removed file: {profiles_tar_path}") - - print("kofam processed successfully.") - -def generate_readme(output_dir, databases_info): - def human_readable_size(size, decimal_places=1): - for unit in ['B', 'KB', 'MB', 'GB', 'TB']: - if size < 1024.0: - return f"{size:.{decimal_places}f} {unit}" - size /= 1024.0 - - readme_content = "Database Information:\n\n" - for database_name, database_info in databases_info.items(): - readme_content += f"Database: {database_name}\n" - readme_content += "URLs used for download:\n" - for url_key, url_value in database_info["urls"].items(): - readme_content += f"- {url_key}: {url_value}\n" - readme_content += f"\nDate and Time Downloaded: {database_info['download_date']}\n\n" - - # List contents of the directory with sizes, including subdirectories - database_dir = path.join(output_dir, database_name) - if path.exists(database_dir) and path.isdir(database_dir): - readme_content += f"{database_name}/\n" - for root, dirs, files in os.walk(database_dir): - for file_name in files: - file_path = path.join(root, file_name) - size = os.path.getsize(file_path) - relative_path = path.relpath(file_path, database_dir) - readme_content += f"{relative_path} ({human_readable_size(size)})\n" - readme_content += "\n" - - readme_file_path = path.join(output_dir, "README.txt") - with open(readme_file_path, "w") as readme_file: - readme_file.write(readme_content) - - print(f"README.txt generated successfully at {readme_file_path}") - -def index_hmm(hmm_dir, hmm_file): - try: - # Run HMMER to index the HMM file - index_command = f"hmmpress -f {hmm_file}" - result = subprocess.run(index_command, shell=True, check=True, stdout=subprocess.PIPE, stderr=subprocess.PIPE) - print(result.stdout.decode('utf-8')) - print(f"Indexed HMM file: {path.basename(hmm_file)}") - except subprocess.CalledProcessError as e: - print(f"Error indexing HMM file {path.basename(hmm_file)}: {e}") - print(e.stderr.decode('utf-8')) - -def create_mmseqs(fasta_loc, output_loc, threads): - """Takes a fasta file and makes a mmseqs2 database for use in blast searching and hmm searching with mmseqs2.""" - print(f"Creating MMseqs2 database for {fasta_loc}...") - subprocess.run(["mmseqs", "createdb", fasta_loc, output_loc], check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) - tmp_dir = path.join(path.dirname(output_loc), "tmp") - subprocess.run(["mmseqs", "createindex", output_loc, tmp_dir, "--threads", str(threads)], check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) - print(f"MMseqs2 database created at {output_loc}") - - # Remove the temporary directory - if path.exists(tmp_dir): - rmtree(tmp_dir) - print(f"Removed temporary directory: {tmp_dir}") - -def sanitize_hmm_file(input_file, output_file): - with open(input_file, 'r') as in_file: - lines = in_file.readlines() - - sanitized_lines = [] - current_entry = [] - entry_started = False - entry_names = {} - name_suffix_counter = {} - - for line in lines: - line = line.strip() - if line.startswith("HMMER3/f"): - if entry_started: - # Process current entry before starting a new one - sanitized_entry = process_entry(current_entry, entry_names, name_suffix_counter) - sanitized_lines.extend(sanitized_entry) - current_entry = [] - entry_started = True - current_entry.append(line) - elif entry_started: - current_entry.append(line) - if line == "//": - entry_started = False - # Process the last entry - sanitized_entry = process_entry(current_entry, entry_names, name_suffix_counter) - sanitized_lines.extend(sanitized_entry) - current_entry = [] - - if entry_started: - # Process the final entry if it wasn't already processed - sanitized_entry = process_entry(current_entry, entry_names, name_suffix_counter) - sanitized_lines.extend(sanitized_entry) - - with open(output_file, 'w') as out_file: - out_file.write('\n'.join(sanitized_lines)) - - print(f"Sanitized HMM file written to: {output_file}") - -def process_entry(entry_lines, entry_names, name_suffix_counter): - name_line_index = None - acc_line_index = None - entry_name = None - - for i, line in enumerate(entry_lines): - if line.startswith("NAME"): - name_line_index = i - entry_name = line.split()[1] - elif line.startswith("ACC"): - acc_line_index = i - - if entry_name: - if entry_name in entry_names: - name_suffix_counter[entry_name] += 1 - unique_suffix = f"_{name_suffix_counter[entry_name]}" - entry_name += unique_suffix - entry_lines[name_line_index] = f"NAME {entry_name}" - if acc_line_index is not None: - acc_line = entry_lines[acc_line_index] - acc_line_parts = acc_line.split() - if len(acc_line_parts) > 1: - acc_line_parts[1] += unique_suffix - entry_lines[acc_line_index] = " ".join(acc_line_parts) - else: - entry_names[entry_name] = True - name_suffix_counter[entry_name] = 0 - - return entry_lines - -def concatenate_hmm_files(hmm_dir, output_file): - hmm_files = [] - for root, _, files in os.walk(hmm_dir): - for file in files: - if file.endswith(".hmm"): - hmm_files.append(path.join(root, file)) - - hmm_files.sort() - - with open(output_file, 'w') as out_file: - for hmm_file in hmm_files: - with open(hmm_file, 'r') as in_file: - lines = in_file.readlines() - out_file.writelines(lines) - if not lines[-1].strip() == "//": - out_file.write("\n//\n") - else: - out_file.write("\n") - - print(f"Concatenated HMM files into: {output_file}") - -def git_clone_repo(repo_url, output_dir): - clone_command = f"git clone {repo_url} {output_dir}" - subprocess.run(clone_command, shell=True, check=True, stdout=subprocess.DEVNULL, stderr=subprocess.DEVNULL) - -def main(): - parser = argparse.ArgumentParser(description="Prepare databases for annotation") - parser.add_argument("--output_dir", help="Output directory path", required=True) - parser.add_argument("--databases", "-db", nargs='+', help="List of databases to update", required=True) - parser.add_argument("--threads", type=int, default=DEFAULT_THREADS, help="Number of threads for processing") - parser.add_argument("--verbose", action="store_true", help="Verbose mode") - parser.add_argument("--download_date", help="Download date for databases") - args = parser.parse_args() - - # Download databases - download_databases(args.output_dir, args.databases) - - # Process databases - for database in args.databases: - database_output_dir = path.join(args.output_dir, database) - if database == "vogdb": - process_vogdb_database(path.join(database_output_dir, "vog.hmm.tar.gz"), database_output_dir, args.threads) - concatenate_hmm_files(path.join(database_output_dir, "hmm"), path.join(database_output_dir, "vog_latest_hmms.hmm")) - rmtree(path.join(database_output_dir, "hmm")) - os.remove(path.join(database_output_dir, "vog.hmm.tar.gz")) - index_hmm(database_output_dir, path.join(database_output_dir, "vog_latest_hmms.hmm")) - elif database == "camper": - process_camper_database(database_output_dir) - create_mmseqs(path.join(database_output_dir, "mmseqs", "camper_blast.faa"), path.join(database_output_dir, "mmseqs", "camper.mmsdb"), args.threads) - elif database == "pfam": - process_pfam_database(database_output_dir, args.threads) - elif database == "merops": - process_merops_database(database_output_dir, args.threads) - elif database == "fegenie": - process_fegenie_database(database_output_dir) - elif database == "sulfur": - process_sulfur_database(database_output_dir) - elif database == "methyl": - process_methyl_database(database_output_dir) - create_mmseqs(path.join(database_output_dir, "methyl.faa"), path.join(database_output_dir, "methyl"), args.threads) - elif database == "dbcan": - process_dbcan_database(database_output_dir) - elif database == "cant_hyd": - process_cant_hyd_database(database_output_dir) - elif database == "kofam": - process_kofam_database(database_output_dir, args.threads) - - # Generate README - databases_info = {} - for database in args.databases: - if database in database_urls: - databases_info[database] = { - "urls": database_urls[database], - "download_date": args.download_date - } - - generate_readme(args.output_dir, databases_info) - -if __name__ == "__main__": - main() \ No newline at end of file diff --git a/assets/trees/amoa_pmoa/pmoa_amoa-tree-mapping.tsv b/assets/trees/amoa_pmoa/pmoa_amoa-tree-mapping.tsv deleted file mode 100644 index e07cc4d0..00000000 --- a/assets/trees/amoa_pmoa/pmoa_amoa-tree-mapping.tsv +++ /dev/null @@ -1,18 +0,0 @@ -gene call -NASQAN2011_051_A_bin.9_Ga0466380_000062_16 amoA-Nitrifier -stroublescreek_2019_sw_WHONDRS-S19S_0089_B_bin.19_k121_1382190_6 pmoA-Methanotroph -NASQAN2016_083_B_bin.62_k121_494990_1 pmoA-Methanotroph -NASQAN2015_172_B_bin.50_k121_110295_6 pmoA-Methanotroph -NASQAN2015_010_F_bin.15_scaffold_716_4 pmoA-Methanotroph -NASQAN2015_010_B_bin.40_k121_261665_1 pmoA-Methanotroph -NASQAN2015_010_A_bin.16_Ga0466474_000760_3 pmoA-Methanotroph -NASQAN2014_188_B_bin.62_k121_1916134_1 pmoA-Methanotroph -lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.22_k121_1561591_36 pmoA-Methanotroph -icacos_2019_sw_WHONDRS-S19S_0094_B_bin.101_k121_1011190_4 pmoA-Methanotroph -hugercreek_2019_sw_WHONDRS-S19S_0044_F_bin.32_scaffold_210_8 pmoA-Methanotroph -hugercreek_2019_sw_WHONDRS-S19S_0044_B_bin.34_k121_1606639_3 pmoA-Methanotroph -gunnisonriver_2019_sw_WHONDRS-S19S_0062_B_bin.67_k121_1407577_11 pmoA-Methanotroph -cobbmillcreek_2019_sw_WHONDRS-S19S_0090_B_bin.17_k121_961747_19 pmoA-Methanotroph -blueriver_2019_sw_WHONDRS-S19S_0024_B_bin.60_k121_1016154_8 pmoA-Methanotroph -blueriver_2019_sw_WHONDRS-S19S_0024_B_bin.60_k121_1651208_1 pmoA-Methanotroph -blackearthcreek_2019_sw_WHONDRS-S19S_0061_F_bin.11_scaffold_109_4 pmoA-Methanotroph diff --git a/assets/trees/amoa_pmoa/pmoa_amoa_search_terms.txt b/assets/trees/amoa_pmoa/pmoa_amoa_search_terms.txt deleted file mode 100644 index 19fdef5a..00000000 --- a/assets/trees/amoa_pmoa/pmoa_amoa_search_terms.txt +++ /dev/null @@ -1,11 +0,0 @@ -K10944 -ammonia monooxygenase -amoA -ammonia oxidation -nitrification -methane monooxygenase -pmoA -methane oxidation -methanotroph -EC: 1.14.18.3 -EC: 1.14.99.39 diff --git a/assets/trees/dmso/dmso.refpkg/CONTENTS.json b/assets/trees/dmso/dmso.refpkg/CONTENTS.json deleted file mode 100644 index 0b9baeaf..00000000 --- a/assets/trees/dmso/dmso.refpkg/CONTENTS.json +++ /dev/null @@ -1,26 +0,0 @@ -{ - "metadata": { - "create_date": "2024-05-13 10:00:00", - "format_version": "1.1", - "locus": "1861" - }, - "files": { - "aln_fasta": "dmso.aln", - "phylo_model": "dmso_phylo_model.json", - "tree": "bipartitionsBranchLabels.dmso_refs.fasta_mode_low.renamed", - "tree_stats": "RAxML_info.dmso_refs.fasta" - - }, - "md5": { - "aln_fasta": "d224231710a0c259103a657c64c25d57", - "phylo_model": "0bc512c776715246a24b93391822e0e6", - "tree": "7880cd304b5db4792a0544faeddecdac", - "tree_stats": "d088fa3c4b149b7ccce5dc3843204c35" - }, - "log": [ - "Stripped refpkg (removed 0 files)", - "Loaded initial files into empty refpkg" - ], - "rollback": null, - "rollforward": null -} diff --git a/assets/trees/dmso/dmso.refpkg/RAxML_info.dmso_refs.fasta b/assets/trees/dmso/dmso.refpkg/RAxML_info.dmso_refs.fasta deleted file mode 100644 index 18435a51..00000000 --- a/assets/trees/dmso/dmso.refpkg/RAxML_info.dmso_refs.fasta +++ /dev/null @@ -1,423 +0,0 @@ - - -This is RAxML version 8.2.9 released by Alexandros Stamatakis on July 20 2016. - -With greatly appreciated code contributions by: -Andre Aberer (HITS) -Simon Berger (HITS) -Alexey Kozlov (HITS) -Kassian Kobert (HITS) -David Dao (KIT and HITS) -Sarah Lutteropp (KIT and HITS) -Nick Pattengale (Sandia) -Wayne Pfeiffer (SDSC) -Akifumi S. Tanabe (NRIFS) -Charlie Taylor (UF) - - -Alignment has 866 distinct alignment patterns - -Proportion of gaps and completely undetermined characters in this alignment: 38.35% - -RAxML rapid bootstrapping and subsequent ML search - -Using 1 distinct models/data partitions with joint branch length optimization - - - -Executing 100 rapid bootstrap inferences and thereafter a thorough ML search - -All free model parameters will be estimated by RAxML -ML estimate of 25 per site rate categories - -Likelihood of final tree will be evaluated and optimized under GAMMA - -GAMMA Model parameters will be estimated up to an accuracy of 0.1000000000 Log Likelihood units - -Partition: 0 -Alignment Patterns: 866 -Name: No Name Provided -DataType: AA -Substitution Matrix: LG -Using fixed base frequencies - - - - -RAxML was called as follows: - -raxmlHPC-PTHREADS -f a -m PROTCATLG -n dmso_refs.fasta -N 100 -p 1234 -s dmso_refs.fasta.phy -x 1234 -T 10 - - - -Time for BS model parameter optimization 0.124676 -Bootstrap[0]: Time 3.169462 seconds, bootstrap likelihood -76430.666973, best rearrangement setting 10 -Bootstrap[1]: Time 2.712014 seconds, bootstrap likelihood -77546.608252, best rearrangement setting 15 -Bootstrap[2]: Time 2.764819 seconds, bootstrap likelihood -74372.994119, best rearrangement setting 15 -Bootstrap[3]: Time 2.806386 seconds, bootstrap likelihood -76930.479065, best rearrangement setting 12 -Bootstrap[4]: Time 2.640082 seconds, bootstrap likelihood -79660.177375, best rearrangement setting 9 -Bootstrap[5]: Time 2.848176 seconds, bootstrap likelihood -73284.515856, best rearrangement setting 12 -Bootstrap[6]: Time 2.781467 seconds, bootstrap likelihood -77576.202035, best rearrangement setting 14 -Bootstrap[7]: Time 2.854323 seconds, bootstrap likelihood -77748.588236, best rearrangement setting 10 -Bootstrap[8]: Time 2.708592 seconds, bootstrap likelihood -76091.070124, best rearrangement setting 13 -Bootstrap[9]: Time 2.824420 seconds, bootstrap likelihood -77670.099908, best rearrangement setting 14 -Bootstrap[10]: Time 3.011455 seconds, bootstrap likelihood -74798.130429, best rearrangement setting 14 -Bootstrap[11]: Time 2.865858 seconds, bootstrap likelihood -74927.199956, best rearrangement setting 5 -Bootstrap[12]: Time 2.770799 seconds, bootstrap likelihood -76609.570227, best rearrangement setting 9 -Bootstrap[13]: Time 2.763006 seconds, bootstrap likelihood -75438.207037, best rearrangement setting 10 -Bootstrap[14]: Time 2.969280 seconds, bootstrap likelihood -74923.353365, best rearrangement setting 13 -Bootstrap[15]: Time 2.678948 seconds, bootstrap likelihood -75865.866781, best rearrangement setting 6 -Bootstrap[16]: Time 2.662132 seconds, bootstrap likelihood -72911.410662, best rearrangement setting 15 -Bootstrap[17]: Time 2.792305 seconds, bootstrap likelihood -75379.580846, best rearrangement setting 13 -Bootstrap[18]: Time 2.892445 seconds, bootstrap likelihood -80324.506934, best rearrangement setting 9 -Bootstrap[19]: Time 2.786553 seconds, bootstrap likelihood -72270.100764, best rearrangement setting 8 -Bootstrap[20]: Time 2.809719 seconds, bootstrap likelihood -73748.314934, best rearrangement setting 13 -Bootstrap[21]: Time 2.845561 seconds, bootstrap likelihood -75385.406316, best rearrangement setting 10 -Bootstrap[22]: Time 2.774577 seconds, bootstrap likelihood -73668.616005, best rearrangement setting 5 -Bootstrap[23]: Time 2.683971 seconds, bootstrap likelihood -77498.603255, best rearrangement setting 10 -Bootstrap[24]: Time 2.810509 seconds, bootstrap likelihood -74341.494886, best rearrangement setting 14 -Bootstrap[25]: Time 2.735748 seconds, bootstrap likelihood -72581.128145, best rearrangement setting 7 -Bootstrap[26]: Time 2.882895 seconds, bootstrap likelihood -74868.016278, best rearrangement setting 11 -Bootstrap[27]: Time 2.598391 seconds, bootstrap likelihood -77135.663040, best rearrangement setting 11 -Bootstrap[28]: Time 2.713763 seconds, bootstrap likelihood -74282.268325, best rearrangement setting 8 -Bootstrap[29]: Time 2.875335 seconds, bootstrap likelihood -76303.714027, best rearrangement setting 13 -Bootstrap[30]: Time 2.897037 seconds, bootstrap likelihood -77047.341575, best rearrangement setting 6 -Bootstrap[31]: Time 2.762513 seconds, bootstrap likelihood -76890.228702, best rearrangement setting 9 -Bootstrap[32]: Time 2.758115 seconds, bootstrap likelihood -75231.999227, best rearrangement setting 13 -Bootstrap[33]: Time 2.848642 seconds, bootstrap likelihood -74310.324400, best rearrangement setting 8 -Bootstrap[34]: Time 2.850801 seconds, bootstrap likelihood -74057.460243, best rearrangement setting 8 -Bootstrap[35]: Time 2.842190 seconds, bootstrap likelihood -76889.097344, best rearrangement setting 12 -Bootstrap[36]: Time 2.693162 seconds, bootstrap likelihood -72288.074882, best rearrangement setting 5 -Bootstrap[37]: Time 2.721867 seconds, bootstrap likelihood -72214.897833, best rearrangement setting 8 -Bootstrap[38]: Time 2.746011 seconds, bootstrap likelihood -79858.362103, best rearrangement setting 12 -Bootstrap[39]: Time 2.701599 seconds, bootstrap likelihood -76003.871644, best rearrangement setting 13 -Bootstrap[40]: Time 2.940543 seconds, bootstrap likelihood -73830.857312, best rearrangement setting 14 -Bootstrap[41]: Time 2.665834 seconds, bootstrap likelihood -75052.748018, best rearrangement setting 13 -Bootstrap[42]: Time 2.832848 seconds, bootstrap likelihood -73832.743609, best rearrangement setting 10 -Bootstrap[43]: Time 2.791044 seconds, bootstrap likelihood -76784.398417, best rearrangement setting 13 -Bootstrap[44]: Time 2.934724 seconds, bootstrap likelihood -72855.508133, best rearrangement setting 7 -Bootstrap[45]: Time 2.642106 seconds, bootstrap likelihood -75501.667158, best rearrangement setting 14 -Bootstrap[46]: Time 2.615179 seconds, bootstrap likelihood -77131.871440, best rearrangement setting 14 -Bootstrap[47]: Time 2.792766 seconds, bootstrap likelihood -75247.220567, best rearrangement setting 11 -Bootstrap[48]: Time 2.900219 seconds, bootstrap likelihood -74163.285113, best rearrangement setting 11 -Bootstrap[49]: Time 2.864223 seconds, bootstrap likelihood -77604.775494, best rearrangement setting 15 -Bootstrap[50]: Time 2.786153 seconds, bootstrap likelihood -76515.975539, best rearrangement setting 8 -Bootstrap[51]: Time 2.818712 seconds, bootstrap likelihood -76977.812201, best rearrangement setting 5 -Bootstrap[52]: Time 2.790959 seconds, bootstrap likelihood -78377.652343, best rearrangement setting 7 -Bootstrap[53]: Time 2.784077 seconds, bootstrap likelihood -71766.787886, best rearrangement setting 10 -Bootstrap[54]: Time 2.677011 seconds, bootstrap likelihood -75973.200232, best rearrangement setting 7 -Bootstrap[55]: Time 2.729044 seconds, bootstrap likelihood -75724.499984, best rearrangement setting 8 -Bootstrap[56]: Time 2.729286 seconds, bootstrap likelihood -74888.001582, best rearrangement setting 5 -Bootstrap[57]: Time 2.851877 seconds, bootstrap likelihood -79652.708518, best rearrangement setting 12 -Bootstrap[58]: Time 2.792531 seconds, bootstrap likelihood -75964.690632, best rearrangement setting 15 -Bootstrap[59]: Time 2.798732 seconds, bootstrap likelihood -76742.838934, best rearrangement setting 6 -Bootstrap[60]: Time 3.020606 seconds, bootstrap likelihood -74747.910682, best rearrangement setting 9 -Bootstrap[61]: Time 2.812696 seconds, bootstrap likelihood -75865.927451, best rearrangement setting 9 -Bootstrap[62]: Time 2.901127 seconds, bootstrap likelihood -76123.007373, best rearrangement setting 10 -Bootstrap[63]: Time 2.864416 seconds, bootstrap likelihood -76587.113230, best rearrangement setting 12 -Bootstrap[64]: Time 2.899098 seconds, bootstrap likelihood -76942.463640, best rearrangement setting 11 -Bootstrap[65]: Time 2.784283 seconds, bootstrap likelihood -75986.725459, best rearrangement setting 8 -Bootstrap[66]: Time 2.704422 seconds, bootstrap likelihood -74022.760235, best rearrangement setting 13 -Bootstrap[67]: Time 2.789476 seconds, bootstrap likelihood -73645.645693, best rearrangement setting 15 -Bootstrap[68]: Time 2.776784 seconds, bootstrap likelihood -77333.259622, best rearrangement setting 10 -Bootstrap[69]: Time 2.768058 seconds, bootstrap likelihood -74276.085077, best rearrangement setting 13 -Bootstrap[70]: Time 2.863719 seconds, bootstrap likelihood -74543.721711, best rearrangement setting 11 -Bootstrap[71]: Time 2.712924 seconds, bootstrap likelihood -74674.083552, best rearrangement setting 11 -Bootstrap[72]: Time 2.820370 seconds, bootstrap likelihood -78340.751173, best rearrangement setting 13 -Bootstrap[73]: Time 2.790599 seconds, bootstrap likelihood -77601.131316, best rearrangement setting 5 -Bootstrap[74]: Time 2.778625 seconds, bootstrap likelihood -75849.707899, best rearrangement setting 6 -Bootstrap[75]: Time 2.751258 seconds, bootstrap likelihood -76734.985357, best rearrangement setting 11 -Bootstrap[76]: Time 3.001420 seconds, bootstrap likelihood -75929.712488, best rearrangement setting 6 -Bootstrap[77]: Time 2.936729 seconds, bootstrap likelihood -76003.356537, best rearrangement setting 8 -Bootstrap[78]: Time 2.726102 seconds, bootstrap likelihood -75427.659661, best rearrangement setting 13 -Bootstrap[79]: Time 2.854278 seconds, bootstrap likelihood -74403.801286, best rearrangement setting 13 -Bootstrap[80]: Time 2.932036 seconds, bootstrap likelihood -77528.948929, best rearrangement setting 9 -Bootstrap[81]: Time 2.862943 seconds, bootstrap likelihood -77222.989909, best rearrangement setting 10 -Bootstrap[82]: Time 2.785410 seconds, bootstrap likelihood -75812.368570, best rearrangement setting 7 -Bootstrap[83]: Time 2.775612 seconds, bootstrap likelihood -78151.460391, best rearrangement setting 6 -Bootstrap[84]: Time 2.780776 seconds, bootstrap likelihood -75949.438281, best rearrangement setting 15 -Bootstrap[85]: Time 2.873042 seconds, bootstrap likelihood -75937.261665, best rearrangement setting 10 -Bootstrap[86]: Time 2.779905 seconds, bootstrap likelihood -78273.082126, best rearrangement setting 9 -Bootstrap[87]: Time 2.682864 seconds, bootstrap likelihood -80080.144193, best rearrangement setting 5 -Bootstrap[88]: Time 2.820337 seconds, bootstrap likelihood -74737.458630, best rearrangement setting 12 -Bootstrap[89]: Time 2.685485 seconds, bootstrap likelihood -75303.912997, best rearrangement setting 6 -Bootstrap[90]: Time 3.036829 seconds, bootstrap likelihood -76905.246932, best rearrangement setting 13 -Bootstrap[91]: Time 2.760195 seconds, bootstrap likelihood -79653.636750, best rearrangement setting 8 -Bootstrap[92]: Time 2.739485 seconds, bootstrap likelihood -76693.109057, best rearrangement setting 7 -Bootstrap[93]: Time 2.833615 seconds, bootstrap likelihood -74497.658518, best rearrangement setting 11 -Bootstrap[94]: Time 2.816307 seconds, bootstrap likelihood -77134.348437, best rearrangement setting 15 -Bootstrap[95]: Time 2.802382 seconds, bootstrap likelihood -75483.518060, best rearrangement setting 15 -Bootstrap[96]: Time 2.640518 seconds, bootstrap likelihood -74528.094785, best rearrangement setting 5 -Bootstrap[97]: Time 2.780421 seconds, bootstrap likelihood -73237.919062, best rearrangement setting 14 -Bootstrap[98]: Time 2.724797 seconds, bootstrap likelihood -75401.187043, best rearrangement setting 7 -Bootstrap[99]: Time 2.912125 seconds, bootstrap likelihood -74969.185954, best rearrangement setting 10 - - -Overall Time for 100 Rapid Bootstraps 281.389323 seconds -Average Time per Rapid Bootstrap 2.813893 seconds - -Starting ML Search ... - -Fast ML optimization finished - -Fast ML search Time: 756.295974 seconds - -Slow ML Search 0 Likelihood: -74928.461521 -Slow ML Search 1 Likelihood: -74928.461521 -Slow ML Search 2 Likelihood: -74928.461521 -Slow ML Search 3 Likelihood: -74928.461521 -Slow ML Search 4 Likelihood: -74928.461521 -Slow ML Search 5 Likelihood: -74928.461521 -Slow ML Search 6 Likelihood: -74928.461521 -Slow ML Search 7 Likelihood: -74928.461521 -Slow ML Search 8 Likelihood: -74928.461521 -Slow ML Search 9 Likelihood: -74928.461521 -Slow ML optimization finished - -Slow ML search Time: 602.354747 seconds -Thorough ML search Time: 73.895558 seconds - -Final ML Optimization Likelihood: -74928.461530 - -Model Information: - -Model Parameters of Partition 0, Name: No Name Provided, Type of Data: AA -alpha: 2.776473 -Tree-Length: 55.515763 -rate A <-> R: 0.399182 -rate A <-> N: 0.259945 -rate A <-> D: 0.371058 -rate A <-> C: 2.337364 -rate A <-> Q: 0.910775 -rate A <-> E: 0.975241 -rate A <-> G: 1.940106 -rate A <-> H: 0.336984 -rate A <-> I: 0.140697 -rate A <-> L: 0.371240 -rate A <-> K: 0.503815 -rate A <-> M: 1.055520 -rate A <-> F: 0.238237 -rate A <-> P: 1.105868 -rate A <-> S: 4.439041 -rate A <-> T: 2.009090 -rate A <-> W: 0.169702 -rate A <-> Y: 0.205613 -rate A <-> V: 2.392567 -rate R <-> N: 0.706048 -rate R <-> D: 0.116398 -rate R <-> C: 0.501968 -rate R <-> Q: 2.636754 -rate R <-> E: 0.341785 -rate R <-> G: 0.366408 -rate R <-> H: 2.278690 -rate R <-> I: 0.119250 -rate R <-> L: 0.283449 -rate R <-> K: 5.940467 -rate R <-> M: 0.454623 -rate R <-> F: 0.049508 -rate R <-> P: 0.312264 -rate R <-> S: 0.805843 -rate R <-> T: 0.543695 -rate R <-> W: 0.557424 -rate R <-> Y: 0.295274 -rate R <-> V: 0.160471 -rate N <-> D: 4.766737 -rate N <-> C: 0.496537 -rate N <-> Q: 1.592389 -rate N <-> E: 0.508692 -rate N <-> G: 1.350015 -rate N <-> H: 4.234381 -rate N <-> I: 0.179830 -rate N <-> L: 0.064256 -rate N <-> K: 2.014327 -rate N <-> M: 0.348390 -rate N <-> F: 0.084068 -rate N <-> P: 0.151925 -rate N <-> S: 3.764032 -rate N <-> T: 1.878729 -rate N <-> W: 0.042610 -rate N <-> Y: 0.574720 -rate N <-> V: 0.078587 -rate D <-> C: 0.058743 -rate D <-> Q: 0.491483 -rate D <-> E: 4.924234 -rate D <-> G: 0.793424 -rate D <-> H: 0.870603 -rate D <-> I: 0.010038 -rate D <-> L: 0.014157 -rate D <-> K: 0.265711 -rate D <-> M: 0.023991 -rate D <-> F: 0.016354 -rate D <-> P: 0.370412 -rate D <-> S: 1.164675 -rate D <-> T: 0.399902 -rate D <-> W: 0.028068 -rate D <-> Y: 0.126872 -rate D <-> V: 0.035653 -rate C <-> Q: 0.079639 -rate C <-> E: 0.003286 -rate C <-> G: 0.534566 -rate C <-> H: 0.601499 -rate C <-> I: 0.301083 -rate C <-> L: 0.557800 -rate C <-> K: 0.012457 -rate C <-> M: 0.839207 -rate C <-> F: 1.037881 -rate C <-> P: 0.070787 -rate C <-> S: 2.614753 -rate C <-> T: 1.073780 -rate C <-> W: 0.629281 -rate C <-> Y: 1.094488 -rate C <-> V: 1.839864 -rate Q <-> E: 3.876936 -rate Q <-> G: 0.251626 -rate Q <-> H: 4.520102 -rate Q <-> I: 0.068413 -rate Q <-> L: 0.546954 -rate Q <-> K: 3.037150 -rate Q <-> M: 1.570619 -rate Q <-> F: 0.033669 -rate Q <-> P: 0.586241 -rate Q <-> S: 1.149231 -rate Q <-> T: 1.014297 -rate Q <-> W: 0.221802 -rate Q <-> Y: 0.241650 -rate Q <-> V: 0.197511 -rate E <-> G: 0.327583 -rate E <-> H: 0.398044 -rate E <-> I: 0.041567 -rate E <-> L: 0.065426 -rate E <-> K: 1.697022 -rate E <-> M: 0.163145 -rate E <-> F: 0.017664 -rate E <-> P: 0.393844 -rate E <-> S: 0.574671 -rate E <-> T: 0.567695 -rate E <-> W: 0.073107 -rate E <-> Y: 0.112720 -rate E <-> V: 0.230098 -rate G <-> H: 0.292498 -rate G <-> I: 0.008174 -rate G <-> L: 0.041563 -rate G <-> K: 0.278555 -rate G <-> M: 0.131033 -rate G <-> F: 0.084125 -rate G <-> P: 0.184955 -rate G <-> S: 1.633930 -rate G <-> T: 0.121922 -rate G <-> W: 0.252125 -rate G <-> Y: 0.051346 -rate G <-> V: 0.072026 -rate H <-> I: 0.102245 -rate H <-> L: 0.343988 -rate H <-> K: 0.654763 -rate H <-> M: 0.415502 -rate H <-> F: 0.640560 -rate H <-> P: 0.477834 -rate H <-> S: 0.929667 -rate H <-> T: 0.548649 -rate H <-> W: 0.560661 -rate H <-> Y: 4.983361 -rate H <-> V: 0.111759 -rate I <-> L: 3.892408 -rate I <-> K: 0.149373 -rate I <-> M: 4.013113 -rate I <-> F: 1.044902 -rate I <-> P: 0.073509 -rate I <-> S: 0.060198 -rate I <-> T: 0.970728 -rate I <-> W: 0.104854 -rate I <-> Y: 0.218350 -rate I <-> V: 10.000000 -rate L <-> K: 0.129119 -rate L <-> M: 5.927594 -rate L <-> F: 2.434657 -rate L <-> P: 0.233879 -rate L <-> S: 0.171176 -rate L <-> T: 0.284471 -rate L <-> W: 0.581863 -rate L <-> Y: 0.281383 -rate L <-> V: 1.598956 -rate K <-> M: 0.616581 -rate K <-> F: 0.022460 -rate K <-> P: 0.366530 -rate K <-> S: 0.703048 -rate K <-> T: 1.067567 -rate K <-> W: 0.046864 -rate K <-> Y: 0.123890 -rate K <-> V: 0.173913 -rate M <-> F: 1.689205 -rate M <-> P: 0.093763 -rate M <-> S: 0.325811 -rate M <-> T: 1.897216 -rate M <-> W: 0.653740 -rate M <-> Y: 0.451968 -rate M <-> V: 1.782983 -rate F <-> P: 0.088706 -rate F <-> S: 0.339765 -rate F <-> T: 0.154944 -rate F <-> W: 2.307349 -rate F <-> Y: 7.328222 -rate F <-> V: 0.614777 -rate P <-> S: 1.256567 -rate P <-> T: 0.536635 -rate P <-> W: 0.089332 -rate P <-> Y: 0.084151 -rate P <-> V: 0.278428 -rate S <-> T: 6.077767 -rate S <-> W: 0.233693 -rate S <-> Y: 0.376132 -rate S <-> V: 0.092373 -rate T <-> W: 0.132241 -rate T <-> Y: 0.230856 -rate T <-> V: 2.054781 -rate W <-> Y: 2.959699 -rate W <-> V: 0.177959 -rate Y <-> V: 0.234116 - -freq pi(A): 0.079066 -freq pi(R): 0.055941 -freq pi(N): 0.041977 -freq pi(D): 0.053052 -freq pi(C): 0.012937 -freq pi(Q): 0.040767 -freq pi(E): 0.071586 -freq pi(G): 0.057337 -freq pi(H): 0.022355 -freq pi(I): 0.062157 -freq pi(L): 0.099081 -freq pi(K): 0.064600 -freq pi(M): 0.022951 -freq pi(F): 0.042302 -freq pi(P): 0.044040 -freq pi(S): 0.061197 -freq pi(T): 0.053287 -freq pi(W): 0.012066 -freq pi(Y): 0.034155 -freq pi(V): 0.069146 - - -ML search took 1433.381314 secs or 0.398161 hours - -Combined Bootstrap and ML search took 1714.774499 secs or 0.476326 hours - -Drawing Bootstrap Support Values on best-scoring ML tree ... - - - -Found 1 tree in File /home/projects-wrighton-2/Pipeline_Development/DRAM2-Nextflow/DRAM2-Trees-Development/dmso/RAxML_bestTree.dmso_refs.fasta - - - -Found 1 tree in File /home/projects-wrighton-2/Pipeline_Development/DRAM2-Nextflow/DRAM2-Trees-Development/dmso/RAxML_bestTree.dmso_refs.fasta - -Program execution info written to /home/projects-wrighton-2/Pipeline_Development/DRAM2-Nextflow/DRAM2-Trees-Development/dmso/RAxML_info.dmso_refs.fasta -All 100 bootstrapped trees written to: /home/projects-wrighton-2/Pipeline_Development/DRAM2-Nextflow/DRAM2-Trees-Development/dmso/RAxML_bootstrap.dmso_refs.fasta - -Best-scoring ML tree written to: /home/projects-wrighton-2/Pipeline_Development/DRAM2-Nextflow/DRAM2-Trees-Development/dmso/RAxML_bestTree.dmso_refs.fasta - -Best-scoring ML tree with support values written to: /home/projects-wrighton-2/Pipeline_Development/DRAM2-Nextflow/DRAM2-Trees-Development/dmso/RAxML_bipartitions.dmso_refs.fasta - -Best-scoring ML tree with support values as branch labels written to: /home/projects-wrighton-2/Pipeline_Development/DRAM2-Nextflow/DRAM2-Trees-Development/dmso/RAxML_bipartitionsBranchLabels.dmso_refs.fasta - -Overall execution time for full ML analysis: 1714.841682 secs or 0.476345 hours or 0.019848 days diff --git a/assets/trees/dmso/dmso.refpkg/Untitled 1.csv b/assets/trees/dmso/dmso.refpkg/Untitled 1.csv deleted file mode 100644 index 1ed57cf6..00000000 --- a/assets/trees/dmso/dmso.refpkg/Untitled 1.csv +++ /dev/null @@ -1,87 +0,0 @@ -gene call notes info -A_Nitrobacter_hamburgensis_YP_578638 NxrA Cytoplasmic Nitrite oxidoreductase -Acidovorax delafieldii_NARG NarG Nitrogen reductase -ACTB1_Anaeromyxobacter_dehalogenans_YP_002491266 ACTB1 Not sure if we want this -ACTB1_Bdellovibrio_bacteriovorus_NP_96849 ACTB1 Not sure if we want this -ACTB1_Candidatus_Koribacter_versatilis_Ellin345_YP_592078 ACTB1 Not sure if we want this -ACTB1_Candidatus_Solibacter_usitatus_YP_821785 ACTB1 Not sure if we want this -ACTB1_Chloroflexus_aggregans_YP_002464666 ACTB1 Not sure if we want this -ACTB1_Cytophaga_hutchinsonii_YP_678817 ACTB1 Not sure if we want this -ACTB1_Flavobacterium_psychrophilum_YP_001295304 ACTB1 Not sure if we want this -ACTB1_Gallionella_capsiferriformans_ES_2_YP_003846257 ACTB1 Not sure if we want this -ACTB1_Geobacter_metallireducens_GS_15_YP_384764 ACTB1 Not sure if we want this -ACTB1_Geobacter_sp_M18_YP_004200644 ACTB1 Not sure if we want this -ACTB1_Geobacter_uraniireducens_Rf4_YP_001231524 ACTB1 Not sure if we want this -ACTB1_Gluconacetobacter_diazotrophicus_YP_001602862 ACTB1 Not sure if we want this -ACTB1_Leptospira_interrogans_serovar_NP_713447 ACTB1 Not sure if we want this -ACTB1_Mariprofundus_ferrooxydans_ZP_01451016 ACTB1 Not sure if we want this -ACTB1_Methylobacterium_sp_4_YP_001772545 ACTB1 Not sure if we want this -ACTB1_Nitrosococcus_oceani_YP_343269 ACTB1 Not sure if we want this -ACTB1_Opitutus_terrae_gb_ACB77208 ACTB1 Not sure if we want this -ACTB1_Ralstonia_eutropha_YP_298623 ACTB1 Not sure if we want this -ACTB1_Rhodothermus_marinus_gb_ABV55245 ACTB1 Not sure if we want this -ACTB1_Salinibacter_ruber_emb_CBH25246 ACTB1 Not sure if we want this -ACTB1_Sideroxydans_lithotrophicus_ES_1_YP_003523268 ACTB1 Not sure if we want this -Alkalilimnicola_ehrlichii_ABI55571 ArxA Anaerobic arsenite oxidase -ArrA_Bacillus_selenitireducens_gb_AAQ19491 ArrA Arsenate reductase -ArrA_Chrysiogenes_arsenatis_gb_AAU11839 ArrA Arsenate reductase -ArrA_Halarsenatibacter_silvermanii_gb_ACF74513 ArrA Arsenate reductase -ArrA_Sulfurospirillum_barnesii_gb_AAU11840 ArrA Arsenate reductase -ArrA_Wolinella_succinogenes_NP_906980 ArrA Arsenate reductase -ArxA_Ectothiorhodospira_sp_PHS_1_ZP_09695308 ArxA Anaerobic arsenite oxidase -B_Caldithrix_abyssi_ZP_09550397 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase double check -B_Nitrobacter_hamburgensis_YP_578186 NxrA Cytoplasmic Nitrite oxidoreductase -Beggiatoa_sp_PS_ZP_02000390 Unknown Function -DmsA_Actinobacillus_succinogenes_130Z gi|75429943|ref|ZP_00732527.1| DmsA Dimethl sulphoxide reductase -DmsA_E_coli_sp_P18775 DmsA Dimethl sulphoxide reductase -DmsA_Haemophilus_influenza_sp_P45004 DmsA Dimethl sulphoxide reductase -Gemmatimonas_aurantiaca_YP_002761548 Alternative complex III -Halorhodospira_halophila_YP_001001949 ArxA Anaerobic arsenite oxidase -Hydrogenobacter_thermophilus_YP_003433365 Unknown Function -Hydrogenobaculum_sp_Y04AAS1_YP_002121006 Unknown Function -I_OP1_uncultured_candidate_division_bacterium_BAL57377 Unknown Function -II_OP1_uncultured_candidate_division_UNIPROT_TREMBL_H5SSA4 Unknown Function -NarG_Escherichia_coli_NP_415742 NarG Nitrogen reductase -NarG_Halomonas_maura_gb_AAT47523 NarG Nitrogen reductase -NarG_Pseudomonas_fluorescens_gb_AEV63780 NarG Nitrogen reductase -NarG_Pseudomonas_stutzeri_gb_AAZ43099 NarG Nitrogen reductase -Natrinema_pellirubrum_YP_007282293 Unknown Function double check -Nitrobacter_sp_Nb_311A_ZP_01048070 NxrA Cytoplasmic Nitrite oxidoreductase -Nitrobacter_winogradskyi_gb_ABA05326 NxrA Cytoplasmic Nitrite oxidoreductase -Nitrococcus_mobi_EAR23355 NxrA Cytoplasmic Nitrite oxidoreductase -NxrA_Candidatus_K_stuttgartiensis_CAJ72445 NxrA Periplasmic Nitrite oxidoreductase -NxrA_planctomycete_KSU_1_ZP_10101005 NxrA Periplasmic Nitrite oxidoreductase -NxrA1_Nitrospira_defluvii_YP_003798853 NxrA Periplasmic Nitrite oxidoreductase -NxrA2_Nitrospira_defluvii_YP_003798871 NxrA Periplasmic Nitrite oxidoreductase -PhsA_Wolinella_succinogenes_NP_906934 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_Carboxydothermus_hydrogenoformans_YP_361367 Psra Thiosulphate reductase -PsrA_PhsA_Acidiphilium_cryptum_YP_001233491 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Archaeoglobus_fulgidus_NP_071207 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Geobacter_lovleyi_ZP_01593406 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Moorella_thermoacetica_ATCC_YP_429324 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Thermosinus_carboxydivorans_ZP_01667237 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Thermus_thermophilus_YP_004130 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_Wolinella_succinogenes_NP_906381 Psra Thiosulphate reductase -QrcB_delta_proteobacterium_NaphS2_ZP_07200609 QrcB Not sure if we want this -QrcB_Desulfatibacillum_alkenivorans_YP_002430439 QrcB Not sure if we want this -QrcB_Desulfococcus_oleovorans_YP_001530428 QrcB Not sure if we want this -QrcB_Desulfomicrobium_baculatum_YP_003159879 QrcB Not sure if we want this -QrcB_Desulfovibrio_magneticus_YP_002953179 QrcB Not sure if we want this -QrcB_Desulfovibrio_vulgaris_YP_967712 QrcB Not sure if we want this -QrcB_Syntrophobacter_fumaroxidans_YP_844744 QrcB Not sure if we want this -RBG1_10 Not sure if we want this -RBG1_1305 Not sure if we want this -RBG1_855 Not sure if we want this -TMAO_Citrobacter_youngae_ZP_06352135 TMAO No info on tree -TMAO_E_coli_CAA52095 TMAO No info on tree -TMAO_Photobacterium_profundum_YP_129680 TMAO No info on tree -TMAO_Salmonella_enterica_gb_AEZ47489 TMAO No info on tree -TMAO_Shewanella_massilia_CAA06851 TMAO No info on tree -TMAO_Vibrio_vulnificus_YP_004189064 TMAO No info on tree -TtrA_Aeropyrum_pernix_NP_148724 TrtA Tetrathionate reductase -TtrA_Haemophilus_somnus_gb_ABI25172 TrtA Tetrathionate reductase -TtrA_Photobacterium_profundum_YP_133039 TrtA Tetrathionate reductase -TtrA_Pyrobaculum_aerophilum_NP_559177 TrtA Tetrathionate reductase -TtrA_Pyrobaculum_arsenaticum_YP_001152643 TrtA Tetrathionate reductase -TtrA_Wolinella_succinogenes_NP_907142 TrtA Tetrathionate reductase -TtrA_Yersinia_enterocolitica_YP_001005907 TrtA Tetrathionate reductase diff --git a/assets/trees/dmso/dmso.refpkg/bipartitionsBranchLabels.dmso_refs.fasta_mode_low.renamed b/assets/trees/dmso/dmso.refpkg/bipartitionsBranchLabels.dmso_refs.fasta_mode_low.renamed deleted file mode 100644 index 2f537895..00000000 --- a/assets/trees/dmso/dmso.refpkg/bipartitionsBranchLabels.dmso_refs.fasta_mode_low.renamed +++ /dev/null @@ -1 +0,0 @@ -(Beggiatoa_sp_PS_ZP_02000390:0.31018678994441711838,(Natrinema_pellirubrum_YP_007282293:0.62627241139953637727,((Hydrogenobaculum_sp_Y04AAS1_YP_002121006:0.25202562736528244525,Hydrogenobacter_thermophilus_YP_003433365:0.22525561709713604053):0.30165783563945486323[100],((((Acidovorax:0.13667246099892554900,((NarG_Pseudomonas_stutzeri_gb_AAZ43099:0.03393658559446594003,NarG_Pseudomonas_fluorescens_gb_AEV63780:0.04907565545382640976):0.11325289427816984111[100],(NarG_Halomonas_maura_gb_AAT47523:0.14646439078919698540,NarG_Escherichia_coli_NP_415742:0.14944442674389668557):0.04669707032807739883[63]):0.08860689645843677908[81]):0.28323472060421345242[100],(Nitrococcus_mobi_EAR23355:0.17092574999759441168,(Nitrobacter_sp_Nb_311A_ZP_01048070:0.01046015345712418033,((A_Nitrobacter_hamburgensis_YP_578638:0.00851203468703114544,B_Nitrobacter_hamburgensis_YP_578186:0.02695906079380491413):0.02171289090283912496[94],Nitrobacter_winogradskyi_gb_ABA05326:0.03093192783563805323):0.01026905465586188879[78]):0.17248328026687961834[100]):0.33751197543721728200[100]):0.99152762326621168842[100],(((((TMAO_Vibrio_vulnificus_YP_004189064:0.08824900046563541323,TMAO_Photobacterium_profundum_YP_129680:0.08590352010876725619):0.18306761819681807713[100],TMAO_Shewanella_massilia_CAA06851:0.20825829024465955519):0.17862368552796076271[100],(TMAO_Citrobacter_youngae_ZP_06352135:0.41133442915839824039,(TMAO_Salmonella_enterica_gb_AEZ47489:0.06565565202990467086,TMAO_E_coli_CAA52095:0.06018585519821552376):0.23462434322473377235[100]):0.10347742396753679961[75]):0.92112695451955228787[100],(DmsA_E_coli_sp_P18775:0.23322212943307793487,(DmsA_Haemophilus_influenza_sp_P45004:0.08081484463360698312,DmsA_Actinobacillus_succinogenes_130Z:0.10868685038622999395):0.12598399783029093357[100]):0.57382198141086615539[100]):0.26440844330547474961[90],(((((TtrA_Haemophilus_somnus_gb_ABI25172:0.30384068025070881669,TtrA_Yersinia_enterocolitica_YP_001005907:0.36541021578513749324):0.18490699160553386582[91],(TtrA_Wolinella_succinogenes_NP_907142:0.64153003857806889521,TtrA_Photobacterium_profundum_YP_133039:0.94160881467741908146):0.14870581556773784793[62]):0.74286956410734672485[100],((TtrA_Pyrobaculum_arsenaticum_YP_001152643:0.16132115694270368622,TtrA_Pyrobaculum_aerophilum_NP_559177:0.08788089082126224194):0.28471506447190164657[100],TtrA_Aeropyrum_pernix_NP_148724:0.19811327077554555243):0.99152820694335630503[100]):0.56849048977295146834[100],((((((QrcB_Desulfatibacillum_alkenivorans_YP_002430439:0.69062666806863026725,QrcB_Desulfococcus_oleovorans_YP_001530428:0.52799062697662879629):0.21107589090264863851[97],(QrcB_delta_proteobacterium_NaphS2_ZP_07200609:0.60046780137077260253,QrcB_Syntrophobacter_fumaroxidans_YP_844744:0.80694048976353893732):0.09044026801852970976[32]):0.09373951901508625895[37],(QrcB_Desulfomicrobium_baculatum_YP_003159879:0.54928820408861156466,(QrcB_Desulfovibrio_magneticus_YP_002953179:0.54930955444688378542,QrcB_Desulfovibrio_vulgaris_YP_967712:0.47778813401120456827):0.12147059864301178178[49]):0.51927964796344860954[100]):0.27886064724177378471[100],((ACTB1_Geobacter_uraniireducens_Rf4_YP_001231524:0.11021967570082565058,(ACTB1_Geobacter_sp_M18_YP_004200644:0.22414922514809035303,ACTB1_Geobacter_metallireducens_GS_15_YP_384764:0.19478125699568066276):0.02772326548080589897[21]):0.58363416355970954008[100],((ACTB1_Mariprofundus_ferrooxydans_ZP_01451016:0.49055905401768445939,(ACTB1_Sideroxydans_lithotrophicus_ES_1_YP_003523268:0.21080659146162344930,ACTB1_Gallionella_capsiferriformans_ES_2_YP_003846257:0.26440906971492933453):0.35237320222753865107[100]):0.27523086952627628943[100],(((ACTB1_Leptospira_interrogans_serovar_NP_713447:0.79307148795825910259,(ACTB1_Bdellovibrio_bacteriovorus_NP_96849:0.69991229166566804043,RBG1_1305:0.89737144652423395108):0.09288663579756109567[60]):0.16716761244359509830[71],((ACTB1_Flavobacterium_psychrophilum_YP_001295304:1.02606743524938170964,ACTB1_Cytophaga_hutchinsonii_YP_678817:0.50283093158201408457):0.28799005578471925659[99],(ACTB1_Gluconacetobacter_diazotrophicus_YP_001602862:0.96646104346107775118,((ACTB1_Methylobacterium_sp_4_YP_001772545:0.63567467187472281864,ACTB1_Ralstonia_eutropha_YP_298623:0.82860248741955488949):0.13581998044218268618[33],(((ACTB1_Rhodothermus_marinus_gb_ABV55245:0.38865363015662424129,ACTB1_Salinibacter_ruber_emb_CBH25246:0.59233821425909760627):0.40688523208875704285[100],(ACTB1_Anaeromyxobacter_dehalogenans_YP_002491266:0.68381691055352000763,ACTB1_Opitutus_terrae_gb_ACB77208:0.83025728066530646299):0.14219255226486615662[50]):0.12468269714690130567[49],(ACTB1_Chloroflexus_aggregans_YP_002464666:0.46873659447195903383,((ACTB1_Candidatus_Koribacter_versatilis_Ellin345_YP_592078:0.50464784810003238125,ACTB1_Candidatus_Solibacter_usitatus_YP_821785:0.54245637379061018013):0.13733595525661521086[61],ACTB1_Nitrosococcus_oceani_YP_343269:0.49410400734252379884):0.10917412309064457310[21]):0.08450438372508251028[17]):0.12072458219781251332[16]):0.15098607158503560277[24]):0.59860089891352907809[100]):0.08727823617340259299[29]):0.69877093272090162746[100],Gemmatimonas_aurantiaca_YP_002761548:0.84260059047056301562):0.13752307751231809818[65]):0.28006707903346222954[100]):0.23466558402636081282[100]):0.17614184128090995540[87],((II_OP1_uncultured_candidate_division_UNIPROT_TREMBL_H5SSA4:0.33467215681677725536,RBG1_855:0.82161967860182749668):0.12971199868024066437[76],(Alkalilimnicola_ehrlichii_ABI55571:0.16927440252820141753,(Halorhodospira_halophila_YP_001001949:0.15823128010931214460,ArxA_Ectothiorhodospira_sp_PHS_1_ZP_09695308:0.31283575163699722799):0.07568817065129679333[35]):0.71169409868301625188[100]):0.10732618473035443474[35]):0.18919835836582774014[53],(ArrA_Chrysiogenes_arsenatis_gb_AAU11839:0.55861722570644156693,((ArrA_Bacillus_selenitireducens_gb_AAQ19491:0.57862013020904345950,(ArrA_Wolinella_succinogenes_NP_906980:0.11656277792250165082,ArrA_Sulfurospirillum_barnesii_gb_AAU11840:0.25535586149819144985):0.25704715855239179678[100]):0.10824894176711383209[52],ArrA_Halarsenatibacter_silvermanii_gb_ACF74513:0.46929511501429799214):0.04484475421107837756[41]):0.55088216920711008395[100]):0.17320965912547314769[100]):0.19386424023928239269[96],((PsrA_PhsA_Moorella_thermoacetica_ATCC_YP_429324:0.46895807528927402341,PsrA_Carboxydothermus_hydrogenoformans_YP_361367:0.36278131760523796290):0.30501332134095587856[100],((PhsA_Wolinella_succinogenes_NP_906934:0.83556313083303890288,(PsrA_PhsA_Archaeoglobus_fulgidus_NP_071207:1.02028532974974517344,(PsrA_PhsA_Thermosinus_carboxydivorans_ZP_01667237:0.39406116350918174440,PsrA_Wolinella_succinogenes_NP_906381:0.56906242612948243487):0.37309846673540075779[100]):0.07083616780588812556[32]):0.10606547837054894345[26],(PsrA_PhsA_Thermus_thermophilus_YP_004130:0.52048385599284674452,((B_Caldithrix_abyssi_ZP_09550397:0.29162331030389027076,PsrA_PhsA_Acidiphilium_cryptum_YP_001233491:0.47229408641539760705):0.21497328944652449589[99],PsrA_PhsA_Geobacter_lovleyi_ZP_01593406:0.42362772298653567082):0.09681557138376449545[35]):0.48200494710375846319[100]):0.06133241697114610869[45]):0.32256472661171109451[100]):0.43399518039056000918[100]):0.42841990737161983471[100]):0.57877135424072545522[100],(((NxrA_planctomycete_KSU_1_ZP_10101005:0.07351303248959742409,NxrA_Candidatus_K_stuttgartiensis_CAJ72445:0.10665101974941076923):0.18189417316903719324[100],(NxrA1_Nitrospira_defluvii_YP_003798853:0.06498836035058985772,NxrA2_Nitrospira_defluvii_YP_003798871:0.07400335506604591163):0.28809352956461248274[100]):0.24410407282623491909[100],RBG1_10:0.21737233260787308664):0.28017652615537430583[100]):0.25972423664656024700[100]):0.04838674611379127632[31]):0.04397292308026813645[52],I_OP1_uncultured_candidate_division_bacterium_BAL57377:0.26884323213695593413); diff --git a/assets/trees/dmso/dmso.refpkg/dmso-tree-mapping.tsv b/assets/trees/dmso/dmso.refpkg/dmso-tree-mapping.tsv deleted file mode 100644 index 1ed57cf6..00000000 --- a/assets/trees/dmso/dmso.refpkg/dmso-tree-mapping.tsv +++ /dev/null @@ -1,87 +0,0 @@ -gene call notes info -A_Nitrobacter_hamburgensis_YP_578638 NxrA Cytoplasmic Nitrite oxidoreductase -Acidovorax delafieldii_NARG NarG Nitrogen reductase -ACTB1_Anaeromyxobacter_dehalogenans_YP_002491266 ACTB1 Not sure if we want this -ACTB1_Bdellovibrio_bacteriovorus_NP_96849 ACTB1 Not sure if we want this -ACTB1_Candidatus_Koribacter_versatilis_Ellin345_YP_592078 ACTB1 Not sure if we want this -ACTB1_Candidatus_Solibacter_usitatus_YP_821785 ACTB1 Not sure if we want this -ACTB1_Chloroflexus_aggregans_YP_002464666 ACTB1 Not sure if we want this -ACTB1_Cytophaga_hutchinsonii_YP_678817 ACTB1 Not sure if we want this -ACTB1_Flavobacterium_psychrophilum_YP_001295304 ACTB1 Not sure if we want this -ACTB1_Gallionella_capsiferriformans_ES_2_YP_003846257 ACTB1 Not sure if we want this -ACTB1_Geobacter_metallireducens_GS_15_YP_384764 ACTB1 Not sure if we want this -ACTB1_Geobacter_sp_M18_YP_004200644 ACTB1 Not sure if we want this -ACTB1_Geobacter_uraniireducens_Rf4_YP_001231524 ACTB1 Not sure if we want this -ACTB1_Gluconacetobacter_diazotrophicus_YP_001602862 ACTB1 Not sure if we want this -ACTB1_Leptospira_interrogans_serovar_NP_713447 ACTB1 Not sure if we want this -ACTB1_Mariprofundus_ferrooxydans_ZP_01451016 ACTB1 Not sure if we want this -ACTB1_Methylobacterium_sp_4_YP_001772545 ACTB1 Not sure if we want this -ACTB1_Nitrosococcus_oceani_YP_343269 ACTB1 Not sure if we want this -ACTB1_Opitutus_terrae_gb_ACB77208 ACTB1 Not sure if we want this -ACTB1_Ralstonia_eutropha_YP_298623 ACTB1 Not sure if we want this -ACTB1_Rhodothermus_marinus_gb_ABV55245 ACTB1 Not sure if we want this -ACTB1_Salinibacter_ruber_emb_CBH25246 ACTB1 Not sure if we want this -ACTB1_Sideroxydans_lithotrophicus_ES_1_YP_003523268 ACTB1 Not sure if we want this -Alkalilimnicola_ehrlichii_ABI55571 ArxA Anaerobic arsenite oxidase -ArrA_Bacillus_selenitireducens_gb_AAQ19491 ArrA Arsenate reductase -ArrA_Chrysiogenes_arsenatis_gb_AAU11839 ArrA Arsenate reductase -ArrA_Halarsenatibacter_silvermanii_gb_ACF74513 ArrA Arsenate reductase -ArrA_Sulfurospirillum_barnesii_gb_AAU11840 ArrA Arsenate reductase -ArrA_Wolinella_succinogenes_NP_906980 ArrA Arsenate reductase -ArxA_Ectothiorhodospira_sp_PHS_1_ZP_09695308 ArxA Anaerobic arsenite oxidase -B_Caldithrix_abyssi_ZP_09550397 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase double check -B_Nitrobacter_hamburgensis_YP_578186 NxrA Cytoplasmic Nitrite oxidoreductase -Beggiatoa_sp_PS_ZP_02000390 Unknown Function -DmsA_Actinobacillus_succinogenes_130Z gi|75429943|ref|ZP_00732527.1| DmsA Dimethl sulphoxide reductase -DmsA_E_coli_sp_P18775 DmsA Dimethl sulphoxide reductase -DmsA_Haemophilus_influenza_sp_P45004 DmsA Dimethl sulphoxide reductase -Gemmatimonas_aurantiaca_YP_002761548 Alternative complex III -Halorhodospira_halophila_YP_001001949 ArxA Anaerobic arsenite oxidase -Hydrogenobacter_thermophilus_YP_003433365 Unknown Function -Hydrogenobaculum_sp_Y04AAS1_YP_002121006 Unknown Function -I_OP1_uncultured_candidate_division_bacterium_BAL57377 Unknown Function -II_OP1_uncultured_candidate_division_UNIPROT_TREMBL_H5SSA4 Unknown Function -NarG_Escherichia_coli_NP_415742 NarG Nitrogen reductase -NarG_Halomonas_maura_gb_AAT47523 NarG Nitrogen reductase -NarG_Pseudomonas_fluorescens_gb_AEV63780 NarG Nitrogen reductase -NarG_Pseudomonas_stutzeri_gb_AAZ43099 NarG Nitrogen reductase -Natrinema_pellirubrum_YP_007282293 Unknown Function double check -Nitrobacter_sp_Nb_311A_ZP_01048070 NxrA Cytoplasmic Nitrite oxidoreductase -Nitrobacter_winogradskyi_gb_ABA05326 NxrA Cytoplasmic Nitrite oxidoreductase -Nitrococcus_mobi_EAR23355 NxrA Cytoplasmic Nitrite oxidoreductase -NxrA_Candidatus_K_stuttgartiensis_CAJ72445 NxrA Periplasmic Nitrite oxidoreductase -NxrA_planctomycete_KSU_1_ZP_10101005 NxrA Periplasmic Nitrite oxidoreductase -NxrA1_Nitrospira_defluvii_YP_003798853 NxrA Periplasmic Nitrite oxidoreductase -NxrA2_Nitrospira_defluvii_YP_003798871 NxrA Periplasmic Nitrite oxidoreductase -PhsA_Wolinella_succinogenes_NP_906934 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_Carboxydothermus_hydrogenoformans_YP_361367 Psra Thiosulphate reductase -PsrA_PhsA_Acidiphilium_cryptum_YP_001233491 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Archaeoglobus_fulgidus_NP_071207 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Geobacter_lovleyi_ZP_01593406 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Moorella_thermoacetica_ATCC_YP_429324 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Thermosinus_carboxydivorans_ZP_01667237 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_PhsA_Thermus_thermophilus_YP_004130 PsrA;PhsA Thiosulphate reductase;Thiosulphide reductase -PsrA_Wolinella_succinogenes_NP_906381 Psra Thiosulphate reductase -QrcB_delta_proteobacterium_NaphS2_ZP_07200609 QrcB Not sure if we want this -QrcB_Desulfatibacillum_alkenivorans_YP_002430439 QrcB Not sure if we want this -QrcB_Desulfococcus_oleovorans_YP_001530428 QrcB Not sure if we want this -QrcB_Desulfomicrobium_baculatum_YP_003159879 QrcB Not sure if we want this -QrcB_Desulfovibrio_magneticus_YP_002953179 QrcB Not sure if we want this -QrcB_Desulfovibrio_vulgaris_YP_967712 QrcB Not sure if we want this -QrcB_Syntrophobacter_fumaroxidans_YP_844744 QrcB Not sure if we want this -RBG1_10 Not sure if we want this -RBG1_1305 Not sure if we want this -RBG1_855 Not sure if we want this -TMAO_Citrobacter_youngae_ZP_06352135 TMAO No info on tree -TMAO_E_coli_CAA52095 TMAO No info on tree -TMAO_Photobacterium_profundum_YP_129680 TMAO No info on tree -TMAO_Salmonella_enterica_gb_AEZ47489 TMAO No info on tree -TMAO_Shewanella_massilia_CAA06851 TMAO No info on tree -TMAO_Vibrio_vulnificus_YP_004189064 TMAO No info on tree -TtrA_Aeropyrum_pernix_NP_148724 TrtA Tetrathionate reductase -TtrA_Haemophilus_somnus_gb_ABI25172 TrtA Tetrathionate reductase -TtrA_Photobacterium_profundum_YP_133039 TrtA Tetrathionate reductase -TtrA_Pyrobaculum_aerophilum_NP_559177 TrtA Tetrathionate reductase -TtrA_Pyrobaculum_arsenaticum_YP_001152643 TrtA Tetrathionate reductase -TtrA_Wolinella_succinogenes_NP_907142 TrtA Tetrathionate reductase -TtrA_Yersinia_enterocolitica_YP_001005907 TrtA Tetrathionate reductase diff --git a/assets/trees/dmso/dmso.refpkg/dmso.aln b/assets/trees/dmso/dmso.refpkg/dmso.aln deleted file mode 100644 index 22bfa700..00000000 --- a/assets/trees/dmso/dmso.refpkg/dmso.aln +++ /dev/null @@ -1,2838 +0,0 @@ ->Natrinema_pellirubrum_YP_007282293 ------------------------------------------------------------- -------------MANRDRSVDSANERSAEGTSVSRRTLLGGAGAAGV--AGFAGCLRLFT -DD-GEGNGNGTSTASKLNPLTEYPNREWESHYRDVWDV----------DDTYYLACRPND -THNCYLEANVK-NGV----VTRLGP--------SMNYGEAE------------------- ----DLYGNQASDRWDPRVCQKGLSMVERFYGER-RVTSPMIRQGFKDWVDEGFPREEDG- ----------SMPEEYA--KRGEDS-WYEASWD-EAYEYA--------AKTFLELADHYSG -A-DAQELLLEQGYDDRVVEEMQGVGTR--------------------------------- --------------------------TMKFRGGMPMLSTIGLFGEYRFAN-SMALVDHHVR -DVGEDEALGGVG-GDNYT-FHTDLPPGHPMVTGQQ---TVDFD-LANV-EYADNIVLAGI -----------NWMCTKMADSHWLTEARM---------NGAN----VTGIFTDYNATSSKC -D----ELVIIRPATDSALFLGVAQQIIATDGYDA----------EFVRSNTDLPLLVRMD -TGDHLRASDVFEDYDPADLERTQVAPADEHPAPTTVDTADQWITPDQR--EDWDDFVVYD -DAAGGVRAVDREAVGEEFDVDAALEGSWELELAD-------------------------- -------GDIVEVRPVFDLVKEYLDTT---------------------------------- -------------WDPESTAEVTGTEP---------EAVTNLAEQFADN----KESTLLLT -GMGP---NQYFNGDLKDRAAFLVASLTSNVGTHSGNVGSYAGNY---------------- -----RAAMLNGIPHYHLEDPFDPELDPDADSRVDSRITMES------------------- ------------------------MHFYSNLDKPLKIEGEYHMGDSHMNTP----TKSLWV -AGSNSILGN------------------------------AKGSYKIIEGLLR---TGKLE -AFFCNEWWWTMTCEY--SDIVFPA-DSWAEQNVHDLTASVTN----------PFLMVFPE -TGIDRVY-D---T--------RHD------CQIYQGVA-EKLAEKLDE------------ -------------PRLEQMWE--FIDE--------------------DEYRGKPYVQRILD -N---SNMTKGYDAETLIEKAERGEPALM--------MSTTYPKKIGTRQANDD------- -------------EPWYTKTGRLEFLREEETWTEVGETLPVHREAVDGTIYKPNVIVDDGD -HPLIDPETPDDLGWDDDNIEDA--------------------SARQVRNEVVSTDALVNS -SHPLQDVDPGFKYSFMTPKYRHGAHTFCNALP-----------NIAVWWG-PFGDRDRKD -DRKPYFG-----EGYVEMNPEDAKE-EGF-------------E-------------DGDY -VWVDADPND-RPYPSANGDPDEY--SR---A--L-MRVRYQPAMPRGVTRSWHN-LNQAS -HGTTEATPDR-TGMAK-------NEETDYVSLYRRGGHQSMTR-SWLRPTILTDEMNR-- ------KGLMGQSIGKGFAPD----VHCANGAPRESFVKFEKEGDAGEDGEGLWRPAEMGL -RPGYETETMQRYLDGDFTSTEGD------------------------------------- -- ->RBG1_10 ------------------------------------------------------------- -------------------------------MTLSRRRFLK---------ISSLSAAGALV -DL-PELKF-LQFLETVENPLEYYPNRDWEKIYRDQYRY----------DSSFTFVCTPND -THACRLRAYVR-NGI----VIRVEQ--------AYDVQNYT------------------- ----DLYGNKASVMWSPRGCNKGYNLPRRVYGPY-RVKHPMVRKGWKEWAEAGFPDPTLP- ----------ENQQKYF--RRGEDS-WVKVSWD-EGFELV--------AKGLLHTMEKYSG -E-KGAEILRKQGYPEEMIEAMHGSGAQ--------------------------------- --------------------------TIKIRGAMPLLGATRIFGFYR----FANMLGLYD- -G-----KLGARG-WSNFS-WHGDLPPGHPMVTGVK---CSDPE-LNDF-RHSKLLVFLGK -----------NMVESKMADAHWWIETIE---------RGGK----VVNISPEYSATSSKS -D----YWIPIRPGTDTALLLGVTQIIIQEKLYDQ----------DFIKKHTDLPLLIRMD -NLKLLRPTDIIKGYKNQILTGYSVKVQKIKPELR----------------EKWGDFVVWD -LKTKKPQTVTREDLGEKIERKGLNPALEGNYKIKL------------------------- -----VNGKEIEVKTVFQLYKELLSE----------------------------------- -------------YDLETVSQITGSPK---------NLIYQLAQDLATI----KP-ASIHT -GEGV---NHFFHCDLVTRAVWLPLALTGNIGKPGANVGHWAGNY---------------- -----KGEVFDGLGVYLNEDPFNPNLDPSAKLEDIKLKKYYKGEE---------------- ------------------------VCYWNYEDRPLIVKGKCFTGKTHMPTP----TKAEWV -GNGNLLNN-------------------------------AKWAHNMIANVEG-----KVE -MIVYNEIEWTASCEY--ADVVFPV-HSWMELTLPDMTASCSN----------PFLQV-WK -GGIKPIF-D---T--------KQD------NEVLAGVA-AKLSELTHD------------ -------------NRYKDYWK--FVLE----------------------GNNEVYLQRILD -A---CSTTKGYKIDELLKSDRGWLMNFRTYP-----RIPFWE-QIQ----ESK------- --------------PFYTKTGRMEFYREEDEFIDYGENLIVHREPVEATPYLPNVILGTHK -AIRPNSYGISPESINADER-----------------------QVRNLKMSWKQ-VKLSKN -P----LWEKGFRFYCLTPKSRHTVHSSWSVLD-----------WNMIWQS-NFGDPYRMD -NRTPGVG-----EHQMHMNPLDAKE-LGI-------------N-------------DGDY -AYVDANPED-RPYTGWKEEDPFYKVSR---L--M-VRVKYNPAYPRGITMIKHASFIATH -KSVKAHESRPDKRAV--------SEDTGYQSSFRYGSQQSITR-GWLQPTMMTDSLVR-- ------KNYMGQEIGEGYEID----VNAPNTCPKETLVKIIKAEDGGMGGKGKWEPARTGY -TPAGENKDMKKFLEGGFILKV--------------------------------------- -- ->NxrA1_Nitrospira_defluvii_YP_003798853 ------------------------------------------------------------- ------------------------------MMQLSRRQFLKVS-------AGTVAVAAVAD -K--ALALTALQPVVEVNNPLGEYPDRSWERVYHDQYRY----------DSSFTWVCSPND -THACRIRAFVR-NGV----VMRVEQ--------NYDHQTYE------------------- ----DLYGNRGTFAHNPRMCLKGFTFHRRVYGPY-RLKGPLMRKGWKQWMDDGSPELTS-- ----------DVKRKYKFDSRFLDD-MVRVSWD-TAFTYV--------AKGLIVIGTRYSG -EAGARRLREQG-YAPEMIEMMKGAGVR--------------------------------- --------------------------TFKHRAGMPILGMMGKHANTRFNNCVLPLLDSWIR -KVNPDQAQGGRY-WNNYT-WHGDQDPSQPWWNGTQ---NCDVD-LSDM-RFTKLNTSWGK -----------NFVENKMPEAHWKLESME---------RGAR----LVIITPEYNPTASRA -D----YWIPVRPETDGALFLGASKIILDENYQDI----------DFIKGFTDMPLLVRTD -TLQYLDPHEVLKDYQVPDF--------------TKSYSGRVQGLSQDQV-QRLGGMMVWD -LAKGKAVPLHREQVGVHLAQSGIDPALTGTYRIKL------------------------- -----LNGREVDVMPIYQLYTIHLQ-D---------------------------------- -------------YDLDTVHQVNRAPK---------DLIVRWARDCGTV----KPAA-IHN -GEGV---CHYFHMTSMGRAAALVMMLTGNIGKFGTGCHTWSGNYKVGIWQA--------- -----APWSGAGASVYLGEDPWNLNLRDDVHGKEIKYRKYYYGEEPGYWNHG--------- ------------------------DNALIVNTPKYG--RKVFTGKTHMPSP----SKVRWV -VNVNILNN-------------------------------AKHHYDMVKNVDP-----NIE -MLVTQDIEMTSDVNH--ADVAFAV-NSWMEFTYPEMTATVSN----------PWVQI-WK -GGIRPLY-D---T--------RND------LDSFAGVA-AKLKEMTGE------------ -------------QRMADTYK--FVYH----------------------NRVDIYVQRILD -A---STTFFGYSADVMLKSEKG-----WMVMCRTYPRHPLWE-ETN----ESK------- --------------PHWTRSGRLETYRIEPEAIEYGENFISHREGPECTPYMPNAIMTTNP -YVRPEDYGIPVTAQHHDDK-----------------------TVRNIKLPWSE-IKQHPN -P----LWEKGYQFYCVTPKTRHRVHSQWSVND-----------WVQIYES-NFGDPYRMD -KRTPGVG-----EHQIHINPQAAKD-RGI-------------N-------------DGDY -CYVDGNPVD-RPYRGWKPSDPFYKVAR---L--M-IRAKYNPSYPYHVTMAKHAPYVSTA -KSVKGHETRPDGRAI--------AVDTGYQSNFRYGAQQSFTR-SWLMPMHQTDSLPG-- ------KQANALKFKWGFEID----HHAVNTVPKECLIRITKAEDGGIGARGPWEPVRTGF -TPGQENEFMVKWLKGEHIKIKV-------------------------------------- -- ->NxrA2_Nitrospira_defluvii_YP_003798871 ------------------------------------------------------------- -----------------------------MQVSVSRRQFLK-I-------SAGTVAAVAVA -DK-VLALTALQPVIEVGNPLGEYPDRSWERVYHDQYRY----------DSSFTWCCSPND -THGCRVRAFVR-NGV----VMRVEQ--------NYDHQTYE------------------- ----DLYGNRGTFAHNPRMCLKGFTFHRRVYGPY-RLKGPLMRKGWKQWMDDGSPELT-P- ----------DVKRKYKFDSRFLDD-LNRVSWD-TAFTYV--------AKAAVLIATRYSG -EAGARRLREQG-YAPEMIEMMKGAGVR--------------------------------- --------------------------TFKHRAGMPVLGIVGKMMNTRFNGGCLPLLDSWIR -KVDAEKAQGGKY-YSNYT-WHGDQDPSHPFWNGTQ---NCDVD-LSDM-RFSKLNTSWGK -----------NFVENKMPEAHWKLESIE---------RGAR----IVVITPEYNPTAYRA -D----YWIPVRPETDGANFLGAAKIIFDENLQDI----------DYIKEFTDLPLLVRTD -TLQYLDPRDVIADYKFPDF--------------SKSYSGRIQSLKPEQV-ERLGGMMVWD -LAKGKAVPLHREQVGFHFKESGIDPALTGTFRVKL------------------------- -----LNSREIDVMPIYQMYQVHLQ-D---------------------------------- -------------YDLDTTHQITRAPK---------DLIVRWARDSGTI----KPAA-MHN -GEGV---CHYFHMTEMGRAAAFIMTITGNIGKFGTGCHTWSGNYKAGIWNA--------- -----VPWSGAGLAVHTGEDPFNLTLDPNAHGKEIKTRSYYYGEEVGYWNHG--------- ------------------------DTALIVNTPKYG--RKVFTGKTHMPSP----SKVRWV -TNVNILNN-------------------------------AKHHYDMVKNVDP-----NIE -MIVTQDIEMTSDVNH--ADVAFAC-NSWMEFTYPEMTGTVSN----------PWIQI-WK -GGIRPLY-D---T--------RND------ADTFAGVA-AKLAEMTGD------------ -------------ARFRGVFH--FVYM----------------------NRVDVYPQRMLD -A---SATCYGYSADVMLKSEKG-----WMVMGRTYPRHPLWE-ETN----ESK------- --------------PQWTRSGRIETYRIEPEAIEYGENFISHREGPECTPYLPNAIFSNNP -FIRPDDYGIPITAQHHD--DK---------------------HVRNIKLPWAE-IKRHPN -P----LWEKGYQFYCVTPKTRHRVHSQWSVND-----------WVQIYES-NFGDPYRMD -KRTPGVG-----EHQLHINPQAAKD-RGI-------------N-------------DGDY -VFVDGNPVD-RPYRGWKPSDPFYKVAR---L--M-IRAKYNPAYPYHVTMAKHAPYVATA -KSVKGHETRPDGRAI--------AVDTGYQSNFRYGAQQSFTR-NWLMPMHQTDSLPG-- ------KHTIAWKFKWGYAID----HHGINTVPKECLIRITKAEDGGIGARGPWEPVRTGF -TPGQENEFMIKWLKGEHIKIKV-------------------------------------- -- ->NxrA_Candidatus_K_stuttgartiensis_CAJ72445 ------------------------------------------------------------- -------------------------------MKLTRRAFLQ-V-------AGATGATLTLA -KN-AMAFRLLKPAVVVDNPLDTYPDRRWESVYRDQYQY----------DRTFTYCCSPND -THACRIRAFVR-NNV----MMRVEQ--------NYDHQNYS------------------- ----DLYGNKATRNWNPRMCLKGYTFHRRVYGPY-RLRYPLIRKGWKRWADDGFPELT-P- ----------ENKTKYMFDNRGNDE-LLRASWD-EAFTYA--------SKGIIHITKKYSG -PEGAQKLIDQG-YPKEMVDRMQGAGTR--------------------------------- --------------------------TFKGRGGMGLLGVIGKYGMYRFNN-CLAIVDAHNR -GVGPDQALGGRN-WSNYT-WHGDQAPGHPFSHGLQ---TSDVD-MNDV-RFSKLLIQTGK -----------NLIENKMPEAHWVTEVME---------RGGK----IVVITPEYSPSAQKA -D----YWIPIRNNTDTALFLGITKILIDNKWYDA----------DYVKKFTDFPLLIRTD -TLKRVSPKDIIPNYKLQDI--------------SDGPSYHIQGLKDEQR-EIIGDFVVWD -AKSKGPKAITRDDVGETLVKKGIDPVLEGSFKLKT------------------------- -----IDGKEIEVMTLLEMYKIHLR-D---------------------------------- -------------YDIDSVVSMTNSPK---------DLIERLAKDIATI----KPVA-IHY -GEGV---NHYFHATLMNRSYYLPVMLTGNVGYFGSGSHTWAGNYKAGNFQA--------- -----SKWSGPGFYGWVAEDVFKPNLDPYASAKDLNIKGRALDEEVAYWNHS--------- ------------------------ERPLIVNTPKYG--RKVFTGKTHMPSP----TKVLWF -TNVNLINN-------------------------------AKHVYQMLKNVNP-----NIE -QIMSTDIEITGSIEY--ADFAFPA-NSWVEFQEFEITNSCSN----------PFIQIWGK -TGITPVY-E---S--------KDD------VKILAGMA-SKLGELLRD------------ -------------KRFEDNWK--FAIE----------------------GRASVYINRLLD -G---STTMKGYTCEDILN-GKYGEPGVAMLLFRTYPRHPFWE-QVH----ESL------- --------------PFYTPTGRLQAYNDEPEIIEYGENFIVHREGPEATPYLPNAIVSTNP -YIRPDDYGIPENAEYWEDR-----------------------TVRNIKKSWEE-TKKTKN -F----LWEKGYHFYCVTPKSRHTVHSQWAVTD-----------WNFIWNN-NFGDPYRMD -KRMPGVG-----EHQIHIHPQAARD-LGI-------------E-------------DGDY -VYVDANPAD-RPYEGWKPNDSFYKVSR---L--M-LRAKYNPAYPYNCTMMKHSAWISSD -KTVQAHETRPDGRA---------LSPSGYQSSFRYGSQQSITR-DWSMPMHQLDSLFH-- ------KAKIGMKFIFGFEAD----NHCINTVPKETLVKITKAENGGMGGKGVWDPVKTGY -TAGNENDFMKKFLNGELIKVDA-------------------------------------- -- ->NxrA_planctomycete_KSU_1_ZP_10101005 ------------------------------------------------------------- -------------------------------MKLTRRTFLQ-V-------TGATGATFTLA -NK-AMAFRLLKPAVEVGNPLDAYPDRAWESVYREQYRY----------DRTFTYCCSPND -THACRVRAFVR-NEV----LMRVEQ--------NYDHQNYA------------------- ----DLYGNKATRNWNPRMCLKGYTFHRRVYGPY-RLRYPLIRKGWKQWADDGFPELT-P- ----------ENKSKYMFDARGQDE-LLKASWD-DAWTYA--------AKGIIHITKKYSG -E-EGARKLLDQGYPKEMVDAMKGAGTR--------------------------------- --------------------------TFKGRGGMGLLGVIGKYGMYRFNN-SLALVDSHNR -GVGPDKALGGRN-WSNYT-WHGDQAPGHPFSHGLQ---TSDVD-MNDV-RFSKLVIQTGK -----------NLIENKMPEAHWLTQVFE---------RGGK----LVVITPEYSPSAQKA -D----YWIPIKCNTDTALFLGITRILMDEKLYDA----------DYVKKFTDFPLLVRTD -TLKRLQAKDIFPDYKLEDISHGASYKIHGLHDDQR---------------EIIGDFVVWD -AKTKSPKAITRDDVGDKLVAKGIDPALDGTFKVKT------------------------- -----VDGKEIEVMPLFEMYKIHL-KD---------------------------------- -------------YDIDSVVEMTNSPK---------ELIVRLAHDIATI----KP-VAIHY -GEGI---NHWFHATLFNRSTYLPLMLTGNIGYPGSGSHTWSGNYKAGNFQA--------- -----SKWSGPGFYGWVAEDVFNPNLDPDAPAMDLKVKGRAYDEEVAYWNHN--------- ------------------------DRPLIVDTPKYG--RKCFTGKTHMPTP----TKIMWF -TNVNLVNN-------------------------------AKHVYQMLKNVNP-----NIE -QIMSNDIEMTGSIEY--ADFAFPA-NSWAEFETHEITTSCSN----------PFIQI-WK -GGIKPVN-D---S--------KDD------VMILAGMA-AKLGELLRD------------ -------------MRFHDVWK--FALE----------------------GRPEVYIQRLLD -G---STTTKGYSFVDIIN-GKYGEPGVALLLYRTYPRHPFWE-QVH----ESI------- --------------PFYTPTGRLQGYNDESEIIEYGENFIVHREGPEATQYLPNVIVSTNP -YIRPDDYGIPEDAEHWD--ER---------------------TVRNIKKSWAE-TKKTKN -F----LWEKGYKFYCVTPKSRHTVHSQWAVTD-----------WNFIWNN-NFGDPYRMD -KRMPGVG-----EHQIHMNPEAAKD-LGI-------------N-------------DGDY -VYVDANPAD-RPYEGWKPSDPFYKVAR---L--M-LRCKYNPAYPYGVTMMKHSAWISTE -RSVKAHETRPDGRAL--------SAGTGYQSSFRYGSQQSITR-NWSMPMHQLDNLFH-- ------KSKTSMKFVFGYEAD----NHGINTTPKETLVKITKAEDGGIGGKGLWDPAKTGY -TAGNENDFMKKYLNGELIKVEKA------------------------------------- -- ->Hydrogenobaculum_sp_Y04AAS1_YP_002121006 ------------------------------------------------------------- --------------------------------MISRRDFLKN--------GSVFLAALSTP -GF-GKKLF--EPLVIVGNPLASYPNRGWEKIYRDIYKP----------DETTVILCNPND -THGCYLNAYVK-NGI----ITRLEP--------TYKYGDAT------------------- ----DIYGIKASHRWEPRCCNKGLALVRRFYGDR-RIRGPFVRKGYYEWYKADFPRDEN-- ----------GKPPSKYFINRGKDE-WLKVSWE-EVSDII--------AKSLINIAKTYSG -EKGKAYLKAQG-YPEEMIDTMAGAGTR--------------------------------- --------------------------TLKFRGSMPWLAVLRYVGQYRMSN-MMALLDSNIR -KVEPDKALGGVG-WDNYS-EHTDLPPAHTLVTGQQ---TVDFD-LVTW-EHAKLIVLWGM -----------NPYGTKMPDSHWLTEAQI---------KGIK----VIVISNDFMATARTA -D----KVVITRTATDGALALSMAYVIMKEKLYDE----------NFVKSFTDLPLLVRMD -NAKLLRASDIIPNYIPKAL-NQAVVYNPSKQMPPPPMKQEKQYIPIQLRDQDINDFVVWD -VKTNSPKVVTRDEVGKYFDMSSLDPALTGEYEVEL------------------------- -----VNGEKVKVKPNFQAYIELLEEN---------------------------------- -------------YTPETVEEITGVPA---------NVIRELALEIANH----KGTTKITT -GMGV---NQYFHGDLIVRAIFLVAALTGNVGRESGNIGSYAGNY---------------- -----RLAVFNGVGQWNAEDPFNIELDPSKLAKVKFYWKGES------------------- ------------------------QHYFADGDRPLKVGDKMLTGKTHMPVP----TKFMWM -ADNNSGLGN------------------------------QKWAYNVMFNVLP-----NVE -CVVTNDWWWSLSCEY--SDIILGV-DAWDENRFWDISGSCTN----------PFFLVWPR -TKQKRLF-D---T--------KND------IETYALVA-KRLSELTGD------------ -------------KRFKEYWH--FVFE----------------------EKPEVYIQRIIN -A---SSNLKGYKIEEVAAKAEQGIPSLVMTRFYP--KFIGYD-QTV----DGK------- --------------PWYTKTGRLEFYREEDTFINVGENLIVHREAIDSTPYEPNTIVIAKK -HPLLRPLDPKSYGLSSEEMLKDT-------------------ELRQARAVFIS-PAKLKD -TKHPLRVSFGATHIVHTPKFRHTTHSATGDVD-----------IVALLFG-PYGDMYRHD -KRTPYVV-----DAFIEINTHDLQK-LGI-------------N-------------DGDY -VWVDADPQD-RPFIGWQNKPEEYEVAR---L--L-LRVRGSFSTPPGLAKIWFNMYGSSH -GSVKGTKVNKNGLAE--------NPVTGYQSFYRRGSQQSVTR-GWLNPTLMGDTLVR-- ------KDLFGQTLNKGFMLD----VYCPTGAPREGFAKITKAENGGIGNVGLWRPLSIGF -RPQNPNKYFKKYLEAGYVIFV--------------------------------------- -- ->Hydrogenobacter_thermophilus_YP_003433365 ------------------------------------------------------------- ------------------------------MSDLTRRDLLK-M-------GGLSLTAMLSP -SF-AFRVMEPVVRV--ENPLAYYPNRDWERFYRDIFKS----------EATFTFLCAPND -THNCLLTAHVK-NGV----ITRIEP--------TYKFGEAT------------------- ----DIYGLKASHRWDPRCCNKGLALMRRFYGDR-RVKGPMVRRGFYEWYKAGFPRDPIT- ----------GKPLEKYF-QRGKDK-FIKVTWD-EVADII--------AKTLINIATTYSG -EEGRKRLEAQGHYPKPMLDAMEGAGTR--------------------------------- --------------------------VLKFRGSMPFLAVVRYTSPYRFAN-MMALLDSHIR -GVGPDKALGGRG-WDNYA-FHTDLAPGHPMVSGQQ---NVEFD-LCMW-EHSKLIILWGM -----------NPFTTKMPDCHWLTEARI---------KGSK----VIVISNDYSPTARAS -D----ELIVVRTGTDTALALSIAYVIMKEKLYQE----------RFVKSFTDMPLLVRMD -NGKVLRARDIIPNYQPQPLQKAVVFKP--GETLPPFYKQDKQYIPEPIRKGDMDDFVVWD -TKSNSPKVITRDHVGEDFWKLGIDPALYGTYRVKT------------------------- -----VEGKEVEVKPLFQVYLEFFEKS---------------------------------- -------------YTPKQAEVITGVPA---------KKIEKLAREIASH----PRNMKLAQ -GMGV---NQYQHADLKDRAMYMICALTDNIGHATGNIGSYAGNF---------------- -----RLALFNGAPQYLAEDPFNIELDPEKPA---KVKFYWKPESAHYYSH---------- ----------------------------DDHPQYMG--EHLITGKTHMPTP----TKFVWF -VDANSALGN------------------------------AKWQYNIIMNTLP-----KIE -CIVTNEWWWSMTCEY--SDIVLGV-DAWNENKYWDIAGSVTN----------PFVYVWPK -TGHRRFF-D---T--------KND------AEAFAIVA-NRLSELTGD------------ -------------ERFRNYWK--FVLE---------------------GKQDVVYVQRVIN -A---SSNLRGYRLEEIAKKAHEGIPSLI--------MTRSYPKYVGEDQTKEG------- -------------MPWYTKSGRLEFYREEPEFMDAGENLPVYREPIDSTHHEPNVIVARPH -PLLRPKKPEDYGLSAKDALLST--------------------EWRQARNVLVS-PEKLPN -TKHPLMVTVGATHIVHTPKYRHSAHTTTGDTD-----------IIVLLFG-PFGDIYRHD -KRMPFVS-----EAYIDINPKDLKK-MGI-------------Q-------------DGDY -VWVDADPQD-RPFAGWQKRPEDYEVGR---L--L-LRARASNNTPPGCAKIWFNMYGSSH -GSVRGTKENPNGLAK--------NPNTGYQSLYRRGSHQSITR-GWFKPTYQTDTLVR-- ------KNLMGQIIGKGFELD----VHGLIGAPREGFCKIAKAEDGGIGGKGVWRPVRLGY -RPMTANEMLKKYLKGEYVK----------------------------------------- -- ->I_OP1_uncultured_candidate_division_bacterium_BAL57377 ------------------------------------------------------------- -------------------------------MAVSRRRFVKAT-------AALTGAALVTD -TL-GLQGF-KFVP-EIKNPLEFYPNRDWEKIYRDQFRY----------DSSFTFLCAPND -THNCLLRAYVR-NGV----IVRIGP--------TYGYNEAR------------------- ----DLYGNKVSARWEPRCCQKGLALGRRFYGDR-RVNGVWVRKGFFDWVRAGFPRDPHT- ----------GAPPKEYF-NRGQDS-WLKLSFD-EAYGIV--------AQALFNIVQTYSG -PEGAARLKAQN-YDPTMLEAMHEAGTQ--------------------------------- --------------------------TVKVRGGMPFLGATRIYGLARFAN-MLALLDAHIR -NVSPDQALGGRV-WDSYS-WHTDLPPGHPMVTGQQ---TVEFD-LFTA-ENAKLITLWGM -----------NWICTKMPDAHWLTEARQ---------RGAK----VITIATEYQATANKA -D----EVIIIRPGTDAAFALGVASVIINEKLYDE----------EYVKTFTDLPLLVRMD -TLKLLRASDIIRDYQPAELTNYAKVLKPDEKPGPPL-AQRVQYIPERAR-QAWGDFVVWD -STKNAPEVITRDHVGQFFAARGIDPALEGSFTVQT------------------------- -----TDHQEITVRPVFDLIKEYLK-E---------------------------------- -------------FTPPKVAEMSWAPS---------EAIVNLARQIAAN----KASTLLSH -GMGP---NHFFNADLKDRALFLIAALTKNIGHFGGSPGSYAGNY---------------- -----RVALFNGLPQYIAEDPFNIELDPTKPATVKSYAKSES------------------- ------------------------AHYYNYGDRPLRVGKKLFTGKTHTPTP----TKFMWF -ANSNSLLGN------------------------------SKWGYDVIHNTLP-----KIE -AIVVNEWWWTMSCEY--ADVVFGV-DSWGELKYPDMCGSVTN----------PFVQVFPR -TPLPRIF-D---T--------RSD------IETYMGVA-EKFAELTGD------------ -------------ARFRDYWH--FVRE----------------------NRVDVYLQRICD -A---SSSLRGYKFTDLEEQARQGTPMLKLLRTYP--KIVGWE-QTQ----ESK------- --------------PWYTKTGRLEFYREEDEFIEYGENLPVYREPVDATPHEPNVIVAPKT -LSALKPAPPEQYGLKRDDLS----------------------TETRQVRNVIK-TPEEVV -RSQHPRTKDGLKFIFITPKYRHGAHTTPVDLD-----------VLAVYFG-PFGDIYRRD -KRSPWVG-----EVYADINPQDAKE-LGI-------------E-------------DGDY -IWIDADPED-RPYRGAKPSDPDYKIAR---L--M-GRARYYNGTPRGVVRMWFNMYQATH -GTVNAHETRPDKLAK--------DPQTNYQAMFRYGGHQSCTR-AWLRPTLMTDSLVR-- ------KDVFGQTIGQGFAPD----IHCPVGAPKESFVKITRAEPGGADLKSLWRPAQLGY -RPTYESDEMKQYLAGGFIEVT--------------------------------------- -- ->Beggiatoa_sp_PS_ZP_02000390 ------------------------------------------------------------- --------------------------------------------------MAVTGAGAAVI -SQQAISATQLLTPVAIDNPLSNYPNRDWEKTYRDLYHY----------DSSFTFLCAPND -THNCLLRGYVK-NGV----VTRIAP--------TYGYQKAK------------------- ----DLDGNQSTQRWDPRCCQKGLALVRRFYGDR-RCKRPMIRKGFKDWVEAGFPRLPET- ----------GAVDQKYL-QRGRDS-WVGASWD-EAFELA--------GKALTNIAQTYTG -EEGQKKLLAQG-YDPLMVEATEGAGTQ--------------------------------- --------------------------VLKFRGGMPPLGMTRVFAQYREAN-AMALLDDKIR -GKGTD-SLGGRG-FDNYS-WHTDLPPGHPMVTGQQ---TVDFD-LCNV-ERTNLLIVWGM -----------NWITTKMPDSHWMTEARM---------KGTK----VVVIAAEYSATSSKA -D----EVFVVRPGTTPALALGIAQVLISENLYDA----------PYVKANTDLPLLVRMD -TAEMLRAGDVFKDYQLAKLENNTLVV-PTGEKGPPMHQQKGPILDEKQR-ADWGDFVYWD -ASESKPVAMNHDQVGKHFSG---NPQLTGEFAVPL------------------------- -----ASGETVQCRTVFDVTKEMLDGS---------------------------------- -------------YTPEDVAKLTWTSA---------DGIRGLARQIAAN----QSNTLFTV -GMGP---NQFFNSDLKDRNIFLVAALTQNIGKIGGNVGSYAGNY---------------- -----RASFFNGLAQFIGEDPFNPELDPTKPA---KLRKRWKAESVHYFNHGD-------- ------------------------------TILRMG--KAVLTGKTHIPTP----TKAFHV -SNSNSLIGN------------------------------VKGHYDFVINTLS-----RVE -FIAQNEWWWTASCEY--ADIVFAV-DSWAELKYPDMTISVTN----------PFLYTFPA -TPLPRIH-D---T--------RSD------LEVAAGIC-GAIGKVTND------------ -------------SRHKDYWH--FINK----------------------GEVRPHIQRVLD -H---SNATRGYKIEDLEKLANEGIP--AILQTRTYPKVGAWE-QGN----ENK------- --------------PWYTKTGRLEFYREEPEFRDSGENIVVHREPIDSTRFEPNVIVAKSH -PLLRPKTPEDYGVPSSD--MS---------------------GDTRQARHVVK-TVDEVL -NSEHPLHKEGYDFVFHTPKYRHGAHTTAVDTD-----------IVAAWFG-PFGDMLRRD -RRMPFVA-----EAYVDINPDDAKG-LGI-------------E-------------DGDY -VYIDADPHD-RPFKGWQKYPEGYKVAR---L--L-VRARYYPGTPRGVTRMWHNMFGATF -SSVRGQETNPTGLAK--------SPETGYQSLYRGGSHQSCTR-GWLKPTWMTDSLYV-- ------KGLMGQKITQGFVPD----VHCPTGAPREALVRIIKAENGGIDGKGLWSPAARGL -RPTYENDILKQFMAGKFVELA--------------------------------------- -- ->Nitrococcus_mobi_EAR23355 ------------------------------------------------------------- --------------------------------------------------MGWIQD---LI -NP-KTRRW-EEF-----------YRNRWQH------------------DNIFRSTHGVNC -TGGCSWAIYVK-DGIITWEMQQTDYPLLGRGEGGRGIPPYE------------------- ----------------PRGCQRGISASWYVYSPI-RVKYPYGKGVLLDFWREARSSHNNPV -EAWSSIVTDENKRKRWQKARGKGG-YRRTTWD-ELLELI----------ASACLYTAQKY -G-------------PDRVM----------------------------------------- --------------------------GFSPIPAMSM---------------LSYAAGSRFL -Q-----LFGGVN-MSFYD-WYADLPNSFPEIWGDQ---TDVCE-SADW-YNSKFIVSMAS -----------NLNMTRTPDVHFISEARH---------EGAK----FVVLAPDFSQVSKYA -D----WWIPVKKGEDLGLWMAAGHVIYTEFYVKR----QVPYFIDYVTRYTDMPFLVKLE -K----DGDG----YRPGRYLTSEEVKKYKKQENA-AWKQLVFDRKSNEA-RCPKGQIGHR -HGK-HGQ-----WNLKMEDGLDNSPIEPVLSFLGE---SDDVAMVQFYEFA--------- -------SQTVYKRGVPAKKIDTGSGS----VLVATVYDLNMGQYAVNRGL--------PG -DYPESYDDLK-PYTPAWQEQFSGIGR---------QTVIRFAREFAGTAEKTKGRSMVIV -GASA---NHWYHNNHIYRAAINCLIACGCCGRNGGGMNHYVGQEKLAIVAPWNALALAGD -WGIKPRLQQSPVWHYVNSDSWRYEGSFEEYAPS-PPNAKWAKGHSVDLVAKSVRMGWMPH -YPQFNRSPLEVAREAEKAGAKDDKGMADYVVQALK--KKNLSFSVDDPDAPENWPRVWFI -WRGNAMQSSAKGAEFFLRHYLGTHDNAVAEERAKP----HVKHVKFREPAPR----GKFD -LVVDINFRMDSTALY--SDIVLPT-AFWYE-KNDLNSTDLH-----------SFIHP-LG -QAVPPVW-E---S--------KSD------WDIFKAFA-KKISEMAPSVFSEPFKDVVAA -PLTHDTPDEIAQRDVKD-WL--EGECEPIPGKTMPHFRVVERDYSLLYNKYISLGSAIRE -N---GISGNGCSFPITKQYDELTNQPVGGSPDPRHRRAVEWGGKRYPCVEDALDAANVLL -YLAPETNGEVAYQAFKSEQEHCGVPLTDLAEPYRGHQVTFYDLTRQPRRLLCSPVWTGNC -GDGRAYSAWTLQIDRLV--PFRTLTGRQHIYIDHPWYMDFGEHLCTYRPKLDY-KKIHDL -DN-SPIDDKTLILNYITPHGKWNIHSTYKDNH-----------RMLTLSR--GMDP---- ------VW----------INDKDAAR-VGL-------------K-------------DNDW -VEVY---ND-N--------------GV---I--V-TRANVSRRVQSGMCLYYHA-VERTI -Y----------------------IPKSQIRGGRRAGGHNSVTR-TRINPVYLAG-GNA-- ------QFTYL-------FNY----WGPTGIMTRDTHVAVRKLEKLEW------------- ------------------------------------------------------------- -- ->A_Nitrobacter_hamburgensis_YP_578638 ------------------------------------------------------------- --------------------------------------------------MSWILD---LV -NP-RERKW-EEF-----------YRNRWSH------------------DNVFRSTHGVNC -TGGCSWAIYVK-DGIITWEMQQTDYPLL-----ERSLPPYE------------------- ----------------PRGCQRGISASWYVYSPI-RVKYPYIRGPLLDMWREAKASSADPV -QAWGALIGDEQKRSRIQKARGKGG-FRRAKWE-ELVELI----------AAASLHTARKH -G-------------PDRIM----------------------------------------- --------------------------GFSPIPAMSM---------------LSFAAGTRFL -S-----LMGGSL-MSFYD-WYADLPTSFPEIWGDQ---TDVCE-SADW-YNSKFIVSMAS -----------NMNMTRTPDVHFISEART---------EGTK----FVVLSPDFSQIAKYC -D----EWIPIQAGQDTALWMAANHVILKEYYVDR----QVPYFVDYIKRYTDLPFLVELE -S----NGNT----YKTGRLLRSNRVPRYKDVENG-DWKMLLLDANSGEL-RAPKGQVGDR -WGSVHGK-----WNLSGEDTLDNSPLDPVLSFIDR---SDDVVQVGFDDFA--------- -------NGRIVSRGVPVKRVATDKGE----ILCATGFDIMMSQFGISRGL--------EG -AFATSYDDEDAPYTPAWQERHTGIGR---------ETAIRFAREFATNAELTNGKSMVIV -GASA---NHWYYNNLCYRSATVALILCGCCGVNGGGINHYVGQEKLAPVAPWATVALALD -WAKPPRLVQSSTWHYAHSCQWRYEQEFTEYGLT-APNPKWAKGHAIDLEAKAVHNGWMPF -TPHFNRNPIEVAAEAERSGAKNVQDIETYVVDQVV--SKKLQMAIDDPDAAENWPRMWFI -WRGNAIQSSAKGHEFFLRHYLGAHDNAIAEDRAKG----KAQVVKYHETAPR----GKYD -LVIDLNFRMNTTSLY--SDIVLPT-AFWYE-KNDLNTTDLH-----------SFLHV-LG -QAVPPVW-E---S--------KTD------WEIFKLIG-KKVSELAPLAFSKPVRDVVLQ -PLMHDTPDELAQPEILD-WS--LGECKAVPGKSFPHVRVVERDYANLYNKFISFGPKARE -D---GISAVGVQIPIKKQYDQMLDNPIMPMPDPRHMRCVEWGGKRYPSLEDVLDACNTVL -LCAPEANGEVCYQAFHNEEHHVGLPLVDLAEPNRNVAATFYDLTRQPRRIITSPCWTGMV -NDGRAYSAWCMNVERLV--PWRTLTGRQSLYLDHQWYLDFGEHIPTYKPRLNP-RKTGDI -VKSR-VDDRSLVLNYITPHGKWNIHSTYKDNH-----------RMLMLSR--GMDP---- ------VW----------INDRDAEK-VGI-------------E-------------DNDW -VEVY---ND-N--------------GV---V--V-TRANVSRRIQPGTCMYYHA-VERTV ------------------------YIPKSQERKWRGGGHNSLTR-TRINPLFLAG-GYA-- ------QFTYG-------WNY----WGPTGILTRDTHVVVRKMEKLEW------------- ------------------------------------------------------------- -- ->B_Nitrobacter_hamburgensis_YP_578186 ------------------------------------------------------------- --------------------------MTTGLAAGQRTEETQ---------MSWILD---LV -NP-RERKW-EEF-----------YRNRWSH------------------DNVFRSTHGVNC -TGGCSWAIYVK-DGIITWEMQQTDYPLL-----ERSLPPYE------------------- ----------------PRGCQRGISASWYVYSPI-RIKYPYVRGPLLDMWREAKASSADPV -QAWGALVGDEQKRARMQKARGKGG-YRRAKWE-ELVELI----------AAASLHTARKH -G-------------PDRIM----------------------------------------- --------------------------GFSPIPAMSM---------------LSFAAGTRFL -S-----LMGGSL-LSFYD-WYADLPTSFPEIWGDQ---TDVCE-SADW-YNSKFIVSMAS -----------NLNMTRTPDVHFIAEART---------EGTK----FVVLSPDFSQIAKYC -D----EWIPIQAGQDTALWMAANHVILKEYYVDR----QVPYFIDYVKRYTDLPFLVELE -P----NGTT----YKTGRLLRARHVPRYKDVENG-DWKMLLLDANSGEL-RAPKGQVGDR -WGSVHGK-----WNLSGEDTLDNSPLDPVLSFIDR---SDDVVQVGFDDFA--------- -------NGRIVSRGVPVRRIATDKGE----ILCATGFDIMMSQFGISRGL--------EG -AFATSYDDEDAPYTPAWQERHTGIGR---------ETAIRFAREFATTAEYTNGKSMVIV -GASA---NHWYYNNLCYRSATVALILCGCCGVNGGGINHYVGQEKLAPVAPWASIALALD -WSKPPRVVQSSTWHYAHSCQWRYEQEFTEYGLT-APNPRWAKGHAIDLEAKAVRSGWMPF -TPHFNRNPIEVAAEAERAGAKSTEDIATHVIDQVA--SKKLNLAIEDPDAAENWPRLWFI -WRGNAIQSSAKGHEFFLRHYLGTHDNAIAEDRAKG----KTHTVKYHDTAPR----GKYD -LVVDLNFRMDTSSLY--SDIVLPT-AFWYE-KNDLNTTDLH-----------SFLHV-LG -QAVPPVW-E---S--------KTD------WDIFKLIA-KKVSELAPLAFSKPVRDVVLQ -PLMHDTPDELAQPEILD-WA--EGECKPVPGKSFPHVRVVERDYANLYNKFISFGPKARE -D---GVSAVGVNVPIKKQYDQMLDNPIMPMPDPRHMRCVEWGGKRYPSLEDVLDGCNTVL -LCAPEANGEVCYQAFHNEEHHVGLPLVDLAEPTRNVATTFYDLTRQPRRLLTSPCWTGMM -NDGRAYSAWCMNVERLV--PWRTLTGRQTLYIDHQWYLDFGEHIPTYKPRLNP-RKTGDI -VKSR-VDDRSLVLNYITPHGKWNIHSTYKDNH-----------RMLMLSR--GMDP---- ------VW----------INDRDAEK-VGI-------------E-------------DNDW -VEVY---ND-N--------------GV---V--V-TRANVSRRIQPGTCMYYHA-VERTV ------------------------YIPKSQERKWRGGGHNSLTR-TRINPLFLAG-GYA-- ------QFTYG-------WNY----WGPTGILTRDTHVVVRKMEKLEW------------- ------------------------------------------------------------- -- ->Nitrobacter_winogradskyi_gb_ABA05326 ------------------------------------------------------------- --------------------------------------------------MSWILD---LV -NP-RERKW-EEF-----------YRNRWSH------------------DNVFRSTHGVNC -TGGCSWAIYVK-DGIITWEMQQTDYPLL-----ERSLPPYE------------------- ----------------PRGCQRGISASWYVYSPI-RVKYPYIRGPLADLWHEAKASYPDPV -QAWASLVEDEEKRNRIQKARGKGG-FRRAKWE-ELIELI----------AASCLYTARKH -G-------------PDRVM----------------------------------------- --------------------------GFSPIPAMSM---------------LSFAAGTRFL -S-----LFGGGL-MSFYD-WYADLPTSFPEIWGDQ---TDVCE-SADW-YNSKFIVSMAS -----------NMNMTRTPDVHFISEART---------EGTK----FVVLSPDFSQIAKYC -D----EWIPIQAGQDTALWMAANHVILKEYYIDR----QVPYFIDYVKRYTDLPFLVELE -P----NGNT----YKTGRLLRSNRVARYKDVENG-EWKMLVLDTATGEP-RAFKGQVGDR -WGSTHGK-----WNLSAEDTLDNSPIDPVLSFIDQ---SDGVVQVGFDDFV--------- -------NGSVVSRGVPVKRIATDKGE----VLVTTGFDIMMSQFGHSRGL--------EG -SFATSYDDEDAPYTPAWQERHTGIGR---------ETAIRFAREFATNAELTNGKSMVIV -GASA---NHWYYNNLCYRSATVALILCGCCGVNGGGINHYVGQEKLAPVAPWSTVAMALD -WNKPPRVVQSSTWHYAHSCQWRYEQEFTEYGLT-APNPRWAKGHAIDLEAKSVRCGWMPF -TPNFHRNPIEVVAEAERAGAKSTADIATYVADQVA--SKKLDLAINDPDAEENWPRVWFI -WRANAIQSSAKGHEFFLRHYLGAHDNVIAEERAKG----KTTTVKYRDTAPQ----GKYD -LVVDINFRMNTTGLY--SDIILPT-AFWYE-KNDLNTTDLH-----------SFLHV-LG -QAVPPVW-E---S--------KTD------WEIFKLIA-KKVSELSPLAFSKPVRDIVLQ -PLMHDTPDELAQPEILD-WA--EGECKLVPGKSFPHVRVVERDYANLYNKFISFGPKARE -D---GISAVGVNIPIKKQYDQMLENPIMPMPDSRHMRCVEWGGKRYPSLEDVLDACNVVL -LCAPVANGEVSYQGFVNEEQHVGLPLADIAEPTRGVSSTFYDLTRQPRRILTSPCWTGLV -NDGRAYSAWCMNIERLV--PWRTLTGRQSLYLDHQWYLDFGEHIPTYKPRLNP-RKTGDI -VKSR-VDDRSLVLNYITPHGKWNIHSTYKDNH-----------RLLMLSR--GMDP---- ------VW----------INDRDAEK-VGI-------------E-------------DNDW -VEVY---ND-N--------------GV---V--V-TRANVSRRIQPGTCMYYHA-VERTV ------------------------YIPKSQERKWRGGGHNSLTR-IRINPLFLAG-GYA-- ------QFTYG-------WNY----WGPTGIFTRDTHVVVRKMEKVEW------------- ------------------------------------------------------------- -- ->Nitrobacter_sp_Nb_311A_ZP_01048070 ------------------------------------------------------------- --------------------------------------------------MSWILD---LV -NP-RERKW-EEF-----------YRNRWSH------------------DNVFRSTHGVNC -TGGCSWAIYVK-DGIITWEMQQTDYPLL-----ERSLPPYE------------------- ----------------PRGCQRGISASWYVYSPI-RVKYPYIRGPLYDLWREAKASHPDPV -QAWASLVGDEQKRLRMQKARGKGG-FRRAKWE-ELVELI----------AAAALYTARKW -G-------------PDRVM----------------------------------------- --------------------------GFSPIPAMSM---------------LSYAAGSRFL -Q-----LFGGVN-MSFYD-WYADLPTSFPEIWGDQ---TDVCE-SADW-YNSKFIVSMAA -----------NMNMTRTPDVHFIAEART---------EGTK----FVVLSPDFSQIAKYC -D----EWIPIQAGQDTALWMAANHVILKEYYIDR----QVPYFIDYVKRYTDLPFLVELE -P----NGNT----YKTGRLLRAKRVARYQDVENG-DWKMLVLDSKTGEP-RAFKGQVGDR -WGSTHGK-----WNLSAEDTLDNSPIDPVLSFIDQ---SDGVVQVGFDDFV--------- -------NGSVVSRGVPVKRIATDKGE----VLVTTGFDIMMSQFGHSRGL--------EG -SFATSYDDENAPYTPAWQERHTGIGR---------ETAIRFAREFATNAELTNGKSMVIV -GASA---NHWYYNNLCYRSATVALILCGCCGVNGGGINHYVGQEKLAPVAPWNTIAMALD -WTKPPRVVQSSTWHYAHSCQWRYEQEFTEYGLT-APNPRWAKGHAIDLQAKAVRSGWMPF -TPHFNRNPIELAAEAERAGAKSTDDIVTHVVDQVA--SKKVNFAIDDPDAEESWPRMWFI -WRGNAIQSSAKGHEFFLRHYLGAHDNSIAEDRAKG----KTQRVKYRDTAPR----GKYD -LVVDLNFRMNTTSLY--SDIVLPT-AFWYE-KNDLNTTDLH-----------SFLHV-LG -QAVPPVW-E---S--------KTD------WEIFKLIA-KKVSELSPLAFSKPVRDVVVQ -PLMHDTPDELAQPEILD-WA--EGECKPVPGKSFPHVRVVERDYANLYNKFISFGPKARE -D---GVSAVGVQIPIKKQYDQMLDNPIMPMPDPRHMRCVEWGGKRYPSLEDVLDACNTLL -MCAPEANGEVCYQGFHNEEHHVGLPLVDIAEPTRGVSSTFYDLTRQPRRILTSPCWTGMT -NDGRAYSAWCMNVERLV--PWRTLTGRQTLYIDSQWYLDFGEHIPTYKPRLNP-RKTGDI -VKSR-VDDRSLVLNYITPHGKWNIHSTYKDNH-----------RMLMLSR--GMDP---- ------VW----------INDRDAEK-VGI-------------E-------------DNDW -VEVY---ND-N--------------GV---V--V-TRANVSRRIQPGTCMYYHA-VERTV ------------------------YIPKSQERKWRGGGHNSLTR-TRINPLFLAG-GYA-- ------QFTYG-------FNY----WGPTGIFTRDTHVVVRKMEKLEW------------- ------------------------------------------------------------- -- ->Acidovorax delafieldii_NARG ------------------------------------------------------------- -----------------------------MSHFLDRLSYFSQP-------RENFAQGHGQT -NG-EDRTW-EDA-----------YRDRWAH------------------DKIVRSTHGVNC -TGSCSWKIYVK-GGIVTWETQQTDYPRT-----RPDLPNHE------------------- ----------------PRGCARGASYSWYLYSAN-RVKYPMVRGRLLKHWRAAMALAKSPV -DAWASIVENDASRSEWQKQRGLGG-FVRSTWD-EVNQMI----------AAANVYTIKKH -G-------------PDRII----------------------------------------- --------------------------GFSPIPAMSM---------------ISYAAGSRYL -S-----LIGGVC-MSFYD-WYCDLPPSSPQVWGEQ---TDVPE-SADW-YNSSYIIAWGS -----------NVPQTRTPDAHFLTEVRY---------KGTK----VVSITPDYSEVAKLG -D----LWMHPKQGTDAAVAMAMGHVILKEFYFKDGGKGRSAYFDDYARRYTDLPLLVVLK -EKTLPDGRTV---MVPDRYVRASDFPGQLDQSNNPDWKTVGYD-ELGQV-TLPNGSIGFR -WGA-DGRADQGLWNLENKEARTGNTVKLKLSVIEDGVQAHDVADVAFPYFGGVQTPNFTA -NEQ---GGDVIVRRVPVSHLELAGHEAQGRVMVATVFDLLAGNYGIDRGL-------PGE -EPGGSYDADR-PYTPAWQEKITGVPR---------DQIITVARQFADNADKTHGKSMVII -GAAM---NHWYHCDMNYRGIINMLMLCGCIGQSGGGWAHYVGQEKLRPQTGWTALAFALD -WIRPPRQMNSTSFFYAHTDQWRYEKLGMEEILSPLADKKSYSGSMIDYNVRAERMGWLPS -APQLKTSPLQVAKDAAAKG----MDAKDYVVQSLK--NGSLTMSCEDPDHPDNWPRNMFV -WRSNILGSSGKGHEYFLKHLLGTTHGVQGKDLGQDEA--KPEEVQWHAKAPE----GKLD -LLVTLDFRMSTTCLY--SDIVLPT-ATWYE-KNDLNTSDMH-----------PFIHP-LS -TAVDPAW-Q---A--------KSD------WEIYKGFA-KAVSEVSVGHLGVE-KDVVLT -PIMHDTAGEMAQPYGVRDWK--RGECELIPGKTAPQVTVVERDYPNLYKRFTALGPLMDK -A---GNGGKGIGWNTQTEVGQLGDLNGRV-------KEEGVT-QGMPRIVTDIDATEVVM -MLAPETNGHVACKAWEALGKQTGRDHVHLALHREDEKIRFRDIQAQPRKIISSPTWSGLE -SEKVSYNAGYTNVHEYI--PWRTLTGRQQFYQDHPWMRDFGEGFVSYRPPVHL-KALHEV -EGKKPNGNREIALNFITPHQKWGIHSTYSDNL-----------IMLTLNR--GGSV---- ------VW----------LSEDDAAR-AGI-------------V-------------DNDW -VELF---NA-N--------------GA---I--A-ARAVVSQRVNPGMVMMYHS-QEKII -N----------------------TPGSEIT-GTRGGIHNSVTR-VVLKPTHMIG-GYA-- ------QYSYG-------FNY----YGTIGT-NRDEFVLVRKMDRVDWLDDDVSDAPAHA- ------------------------------------------------------------- -- ->NarG_Pseudomonas_stutzeri_gb_AAZ43099 ------------------------------------------------------------- -----------------------------MSHLLDQLRFFNRK-------QGEFADGHGET -RI-ESRDW-ENV-----------YRSRWQY------------------DKIVRSTHGVNC -TGSCSWKIYVK-NGLITWETQQTDYPRT-----RNDLPNHE------------------- ----------------PRGCPRGASYSWYIYSAN-RLKYPKVRKPLLKLWREARRNMT-PV -DAWASIVEDKAKAESYKSKRGMGG-FIRSSWD-EVNEII----------AAANVYTVKQY -G-------------PDRVI----------------------------------------- --------------------------GFSPIPAMSM---------------VSYAAGSRYL -S-----LIGGVC-LSFYD-WYCDLPPASPQIWGEQ---TDVPE-SADW-YNSNYIIAWGS -----------NVPQTRTPDAHFFTEVRY---------KGTK----TVAITPDYAEVAKLT -D----LWLNPKQGTDAALAQAFAHVIFKEFHLEK----PSEYFRDYAKRYTDLPVLVRLN -EK---DGS-----YIADRFLRASDLADNLGQENNPEWKTIAVDGSTGEL-VSPLGSIGYR -WGE-KGK-----WNIEAREGKDGRDVDLSLTQIEG----GETAEVAFPYFGGILHEHFQH -AE----GESIQLRRVPVRTITLADGST---TKVATVFDLMAANLGIDRGL-------GGG -NVASSYDDASVPGTPAWQEVITGVSR---------EKAIQIAREFADNADKTHGRSMIIV -GAAM---NHWYHMDMNYRGLINMLMLCGCVGQTGGGWAHYVGQEKLRPQCGWLPLAFGLD -WSRPPRQMNGTSFFYNHSSQWRHEKMSIHEVLSPLADKSQFPEHMLDYNIRAERAGWLPS -APQLNRNPLQICRDAEAAG----MSPVDYVTQSLK--DGSLKFACEQPDNPDNFPRNMFV -WRSNLLGSSGKGHEYMLKYLLGTKNGVMNEDLGKRADGFKPTEAEWQDEGAI----GKLD -LVTTLDFRMSSTCVY--SDIVLPT-ATWYE-KDDMNTSDMH-----------PFIHP-LS -AAIDPAW-E---A--------KSD------WEIYKGIA-KAFSKMAEGQLGVE-KDLVTV -PLLHDSPGELAQPFGGTDWK--TAGVDPQPGKNCPNMAVVERDYPATYKKFTSLGPLLDK -L---GNGGKGINWNTQDEVDFLGELNYKV-------RDEGVS-QGRPQIESAIDAAEVIL -SLAPETNGHVAVKAWAALSEFTGRDHSHLALPKEHEAIRFRDIQAQPRKIISSPTWSGLE -DEHVSYNAGYTNVHEYI--PWRTITGRQQFFQDHPWMQAFGEQLMSYRPPINT-RTIDYV -KGKKSNGNPEIVLNWITPHQKWGIHSTYSDNL-----------IMLTLSR--GGPI---- ------VW----------MSEVDAKK-AGI-------------E-------------DNDW -IECF---NA-N--------------GA---L--T-ARAVVSQRVMEGMVMMYHA-QERIV -N----------------------VPGAEST-KTRGGHHNSVTR-VVLKPTHMIG-GYA-- ------QQAYG-------FNY----YGTVGC-NRDEFVVVRKMAKVDWLDGPNGNDLPQPL -PQDI-------------------------------------------------------- -- ->NarG_Pseudomonas_fluorescens_gb_AEV63780 ------------------------------------------------------------- -----------------------------MSHLLDQLRFFNRK-------QGEFSDGHGET -RK-ESRDW-ENV-----------YRSRWQY------------------DKIVRSTHGVNC -TGSCSWKIYVK-NGLITWETQQTDYPRT-----RNDLPNHE------------------- ----------------PRGCPRGASYSWYIYSAN-RLKYPKIRKPLLKLWREARQTLP-PV -EAWASIVEDKAKADSYKSKRGMGG-FIRSNWE-EVNEII----------AAANVYTVKEH -G-------------PDRVV----------------------------------------- --------------------------GFSPIPAMSM---------------VSYAAGSRYL -S-----LIGGVC-LSFYD-WYCDLPPASPMVWGEQ---TDVPE-SADW-YNSNYIIAWGS -----------NVPQTRTPDAHFFTEVRY---------KGTK----TVAITPDYSEVAKLT -D----LWLNPKQGTDAALAQAFNHVIFKEFHLDK----PSAYFTEYAKRYTDLPVLVMLK -PM---LGAAPGAGYQPDRFLRASDLTDNLGQDNNPEWKTIALD-AAGEL-VSPQGSIGYR -WGE-KGK-----WNILPREGGEGREIDLKLSLI-G----GDVAEVAFPYFAGEAQEYFQH -VA----GDAVQFRRVPVHSVVLADGSV---AKVATVFDLSAANLAIDRGL-------GGA -NVAKDYNDASVPGTPAWQEQITGVSR---------EKAIQIAREFADNADKTRGRSMIIV -GAAM---NHWYHMDMNYRGLINMLMLCGCVGQTGGGWAHYVGQEKLRPQCGWLPLAFGLD -WNRPPRQMNGTSFFYGHSSQWRHEKMSMHDVLSPLADKSQFPEHALDYNIRAERAGWLPS -APQLNTNPLHICRDAAAAG----MEPKDYVVKSLQ--DGSLRFACEQPDSPVNFPRNMFI -WRSNLLGSSGKGHEYMLKYLLGTKNGVMNEDIGHSTEC-KPTEAEWVDEGAI----GKLD -LVTTLDFRMSSTCVY--SDIVLPT-ATWYE-KDDMNTSDMH-----------PFIHP-LS -AAIDPAW-E---S--------RSD------WEIYKGIA-KAFSAMSVGHLGVE-KDLVTV -PLMHDSVGELAQPFGGTDWK--SAGVAPVPGKNAPNLQVVERDYPNIYKQFTSLGPMLEK -L---GNGGKGINWNTDTEVKFLGELNHKE-------VEAGIS-QGRPKIDSAIDAAEVIL -SLAPETNGHVAVKAWAALSEFTGIDHSHLAISKEHEAIRFRDIQAQPRKIISSPTWSGLE -DDHVSYNAGYTNVHESI--PWRTITGRQQFYQDHPWMQAFGEQLMSYRPPVNT-RTIAGV -KGKRSNGETEIVLNWITPHQKWGIHSTYSDNL-----------LMLTLSR--GGPI---- ------VW----------LSEIDAKR-AGI-------------E-------------DNDW -IECF---NV-N--------------GA---L--T-ARAVVSQRVKEGMVMMYHA-QERIV -N----------------------VPGSETT-KTRGGHHNSVTR-VVLKPTHMIG-GYA-- ------QQAYG-------FNY----YGTVGC-NRDEFVVVRKMVKVDWLDGSSGDDLPRPL -PTDIEEN----------------------------------------------------- -- ->NarG_Halomonas_maura_gb_AAT47523 ------------------------------------------------------------- -----------------------------MSHFIDRLNFFRKA-------REPFANDHGEV -RD-ESRGW-EDG-----------YRQRWQH------------------DKVVRSTHGVNC -TGSCSWKIYVK-NGLVTWETQQTDYPRT-----RPDLPNHE------------------- ----------------PRGCPRGASYSWYLYSAN-RLKHPLVRKPLLKLWREALEEKGDPV -DAWASIVEDPAKTKQYKRARGMGG-FVRADWN-ELNELI----------AASNVYTAKQY -G-------------PDRII----------------------------------------- --------------------------GFSPIPAMSM---------------VSYAAGSRYL -S-----LIGGVC-MSFYD-WYCDLPPASPMTWGEQ---TDVPE-SADW-YNSGYIIAWGS -----------NVPQTRTPDAHFFTEVRY---------KGTK----TVSVTPDYAEVSKLT -D----EWLSAKQGTDAALAMAMGHVILKEFHLDR----PSAYFTDYVRRYTDMPCLVELE -ARE--DGS-----YVPGKQLRASDFEASLGQDNNPEWKTVAWDETRDQL-VVPRGSIGFR -WGE-EGK-----WNLEPRDAE-GAEIKTRLSLAEA---HDDVARVAFPYFGGIAHEHFDH -VKSGGASDELLFHSLPAKRLTLADGRE---ILAVTVFDLMCANYGIDRGFRSQEGKEGED -DGATAYDQVK-PYTPAWQEKITGVPA---------EQCLRIAREFADNADKTHGRSMIIV -GAGM---NHWYHMDMNYRGLINMLVMCGCIGQSGGGWSHYVGQEKLRPQTGWLPLAFGLD -WQRPPRHMNSTSFFYNHSSQWRYXKLEIKEILSPLAKPADYSGSLIDFNVRSERMGWLPS -APQLATNPLSLAGKAAEAG----QSTADYVVDQLK--AGGLRFAAEDPDDPQNFPRNMFI -WRSNLLGSSGKGHEYLLKYLLGTRHGIQGKDLGEDGGQ-KPEEVVWHEAAPE----GKLD -LLVTLDFRMSTTCLY--SDIVLPT-ATWYE-KDDLNTSDMH-----------PFIHP-LT -AATDPAW-E---S--------RSD------WDIYKGIA-RAFSKACVGHLGEE-TDLVTL -PLQHDSPAELAQPEVKD-WK--RGECEPIPGKTMPALVEVKRDYPATYERFTSVGPLLDS -L---GNGGKGIGWKTEKEVELLGKLNY---------VKTEGPAKGRPRIESAIDAAEVIL -TLAPETNGQVSVKAWEALSKITGRDHRHLAEPKEEEKIRFRDVVAQPRKIISSPTWSGLE -DEHVSYNAGYTNVHELI--PWRTVSGRQQFYQDHAWMRAFGESLLVYRPPIDT-KAAVSL -ADDKGNGNPEIALNWITPHQKWGIHSTYSDNL-----------LMQTLSR--GGPI---- ------VW----------LSKDDARS-IGV-------------E-------------DNDW -IELY---NA-N--------------GA---I--A-ARAVVSQRVKNGMAMMYHA-QERIL -N----------------------MPGSEVT-GTRGGIHNSVTR-VCPKPTHMIG-GYA-- ------QLAYS-------FNY----YGTVGS-NRDEFVIVRKMKKIDWLDGEGNDYEQEAV -K----------------------------------------------------------- -- ->NarG_Escherichia_coli_NP_415742 ------------------------------------------------------------- ------------------------------SKFLDRFRYFKQK-------GETFADGHGQL -LN-TNRDW-EDG-----------YRQRWQH------------------DKIVRSTHGVNC -TGSCSWKIYVK-NGLVTWETQQTDYPRT-----RPDLPNHE------------------- ----------------PRGCPRGASYSWYLYSAN-RLKYPMMRKRLMKMWREAKALHSDPV -EAWASIIEDADKAKSFKQARGRGG-FVRSSWQ-EVNELI----------AASNVYTIKNY -G-------------PDRVA----------------------------------------- --------------------------GFSPIPAMSM---------------VSYASGARYL -S-----LIGGTC-LSFYD-WYCDLPPASPQTWGEQ---TDVPE-SADW-YNSSYIIAWGS -----------NVPQTRTPDAHFFTEVRY---------KGTK----TVAVTPDYAEIAKLC -D----LWLAPKQGTDAAMALAMGHVMLREFHLDN----PSQYFTDYVRRYTDMPMLVMLE -ER---DGY-----YAAGRMLRAADLVDALGQENNPEWKTVAFN-TNGEM-VAPNGSIGFR -WGE-KGK-----WNLEQRDGKTGEETELQLSLLGS---QDEIAEVGFPYFGGDGTEHFNK -VE----LENVLLHKLPVKRLQLADGST---ALVTTVYDLTLANYGLERGL-------NDV -NCATSYDDVK-AYTPAWAEQITGVSR---------SQIIRIAREFADNADKTHGRSMIIV -GAGL---NHWYHLDMNYRGLINMLIFCGCVGQSGGGWAHYVGQEKLRPQTGWQPLAFALD -WQRPARHMNSTSYFYNHSSQWRYETVTAEELLSPMADKSRYTGHLIDFNVRAERMGWLPS -APQLGTNPLTIAGEAEKAG----MNPVDYTVKSLK--EGSIRFAAEQPENGKNHPRNLFI -WRSNLLGSSGKGHEFMLKYLLGTEHGIQGKDLGQQGGV-KPEEVDWQDNGLE----GKLD -LVVTLDFRLSSTCLY--SDIILPT-ATWYE-KDDMNTSDMH-----------PFIHP-LS -AAVDPAW-E---A--------KSD------WEIYKAIA-KKFSEVCVGHLGKE-TDIVTL -PIQHDSAAELAQPLDVKDWK--KGECDLIPGKTAPHIMVVERDYPATYERFTSIGPLMEK -I---GNGGKGIAWNTQSEMDLLRKLNY---------TKAEGPAKGQPMLNTAIDAAEMIL -TLAPETNGQVAVKAWAALSEFTGRDHTHLALNKEDEKIRFRDIQAQPRKIISSPTWSGLE -DEHVSYNAGYTNVHELI--PWRTLSGRQQLYQDHQWMRDFGESLLVYRPPIDT-RSVKEV -IGQKSNGNQEKALNFLTPHQKWGIHSTYSDNL-----------LMLTLGR--GGPV---- ------VW----------LSEADAKD-LGI-------------A-------------DNDW -IEVF---NS-N--------------GA---L--T-ARAVVSQRVPAGMTMMYHA-QERIV -N----------------------LPGSEIT-QQRGGIHNSVTR-ITPKPTHMIG-GYA-- ------HLAYG-------FNY----YGTVGS-NRDEFVVVRKMKNIDWLDGEGNDQVQESV -K----------------------------------------------------------- -- ->TtrA_Photobacterium_profundum_YP_133039 ------------------------------------------------------------- ----------------------------MAALIMDRRQFLK-MGAATTFTGGMAGISKATA -GD-SNQDISRYAPLSAEPEFILGPDNKLTN----------------NPNQRFAFTKCFGC -YNVCGARIRID-NNT--DQILRVCG--------NPYALSTQ-----SGNPVAME--VSPQ -EAMLQLVGEQGNENRATLCGRGNAVPDAITDSR-RVTQCLKRVG---------------- -------------------KRGENH-WQSISYE-QLIKEVVEGGNLFGEGHVEGLSDIYDD -KTVANPAYPDFGPKKNQL------------------------------------------ --------------------------LMTGCSEDPA---------------RWGFYKRFSE -A-----SWGTPN-IGNKD-SYCGHQQVAGCALGVEDGANSGALPTTDF-EHCEFAIFIGT -NPGLSG-------ISLNSASKRLADART-------QNPNFK----YVVIDPILRSLTSSS -TPENCEWVPIRSSGDTALMHAMMQYIINNERYNK----------SYLASCSQ-------- ---------------------EGAYKVSEINYTNAPYLVVTDKKHPLYRKFLTAAACGKGD -ADTKMVIDAKSQQLTTSDSSEPCNIKFSGKVTTED------------------------- -------GQAVKVETAFSLLAKRVNE----------------------------------- -------------HSMADYAAECQVPE---------AKIIELAKEFTSH-----GRRVSIE -TNTG---CNASDGSQFAFAMIMLTTLVGAHNAKGGMLHTGSMGFE--------------- -----NTSPLYDMMAFEHAHLSGFNAERSGDYRQSNEFKEKVKNGINPYPSEM-------- ------------------------PWNETFIQDNAG--ELLVAHANGNPFK----FKAWIA -WANNPLYA-------------------------------CSGLKDQVEASIKDPK--QLG -LIIASDPYFNETNVY--ADYFVPD-LAQYE-QWGASRQWGSE----------LMGDVVSF -PIITP---K---TPLNAEGNRVCM------EQFLIDVA-KQIKLNGFGENAFKDTAGNAK -AI----------NTPEDYYI--PVLA-------------------NLAHSDEVLPTPTEE -DVKFTSVDRIYSQLKERL------------------KAEEIG-PTMFLFTRGG------- --------------RYLTVNSRYEGEF-----------------------FNEMMRWDAQF -QVYNEGLAHITNFHSG--------------------------EYLDGLPVFDKQRFWDGT -AIRDLWSENEYPFYFSTFKHQLRSP------------------YSVALKS--ITAL---- ------GV-----SNFIQMNENDAKK-YGL-------------T-------------TGDK -ARIA---TPKG--------------AA---I--E-GIVQADTTVAKGCIAVPLG-YGHTA -FGASDITIDGKT-----------LTGIPERKGGMAVNAFNAV-----DPTRKGASLYR-- ------DVTFG-------STA----RH--GI-----PMKIEKV------------------ ------------------------------------------------------------- -- ->TtrA_Wolinella_succinogenes_NP_907142 ------------------------------------------------------------- -------------------------------MEEGRRRFLLGS-------GVVAGSAAVVG -YKETLGAVALLKDKGERAKDSIYGEAAEPEVRFESGRT------LINPKYSIRPSVCNGC -TTHCGIRVKINQESG---AVERVFGNPYSLLSSDPWLPYNT------------P--LKES -LEVLSAQKESGLHHRSTACARGNAVYDKLNDSF-RVTKPLKRVG---------------- -------------------KRGENA-WVEISPE-QLIQEILEGGNLFGEGEVEGLRSIRQL -DKLIDEENPEYGSSANRLC----------------------------------------- --------------------------VLGTADEGR----------------QVVMVQRFV- -Q-----SFGTVN-FMGHT-SICGLSMRAGEAAYLNDFVGYPHL-KPDF-KNCKFLLNIGT ---APAH----AG-NPFKRQAKLLAQART--------TGECR----YVTVTPILANSDNIA -VGERSRWLPVAPSGDLALVMGMIRLIIEEKRYLA----------DYLAIPSL-------- -------------------------ESQKALEEVSFTNATHLIIQKGEKEGQILKDSQGSP -W----VIDVKEGVLRDSKSVLRGELDFAGEVTLE-------------------------- -------GVSYEVKSAFLLLKESALA----------------------------------- -------------YTLEEYASFSGIDS---------KEIVHLAREFTSY-----GRSVGVD -CHGG---TMHTTGFYATYAVMMLGALVGNLNHKGGMSMGGGKFEDFNG------------ -----EAYNLIAYPNKPKPQGARIDRARMAYEKTSEFKRKVAQGENPYPAK---------- ------------------------APWYGLANALES--DVITNSEEGYPYK----LGALIS -WCANFIYG-------------------------------QSGSEHLLE-SLKDPKR-AIP -LFIAIDPFINETSRW--ADYIVPD-SVMYE-TWGVVSPWGASLT--------KASHL-RY -PILPSPNAK---WSNGEP---VSM------DSFIIELG-KALGLPGFGKNGIVAKSGEKF -PF----------DRPEELYL--RAFE-------------------NIALSG-KAVPEISD -EEIELAGLKEYASKLQ-AI-----------------NGENWR-RVAYVMARGG------- --------------RFAPIEDAYKGDS-----------------------LSR--AYPKAI -SIYNEALGTSKNSLTG--------------------------ERYSGVPRFYAPRFTDGR -ALEEAGLGDSRSFLAFSYKSNVLSA------------------PTTASRH--LKEL---- ------RY-----TTFVDMNSQSAKA-LGI-------------V-------------HGER -VRVV---SK-G--------------GF---V--I-GICRLREGIHPRSIGIEHG-AGREG -EGAIDLLINGNV-----------IRGEIARRSGVNINKLGLK-----DASKGKVGTLS-- ------DFVIG-------SNA----RQ--GI-----PVWIEKLS----------------- ------------------------------------------------------------- -- ->TtrA_Haemophilus_somnus_gb_ABI25172 ------------------------------------------------------------- -------------------------------MNKQRRNLIKGA-------LATTAATAFVA -GY-SPKVK-EIAKGVIEGSSGQKTQDNINGNSLLPEYQVKEGNLLTNSQQVVCNTQCMGC -WTLCGLRVRIDLEKN---KVLRING--------NPYHPLSS------DHYLDYN--QSIK -QAELSVSGENGLQQRSTACARGAAFLDGINSPY-RITQPLKRVG---------------- -------------------KRGEGK-WKTISFE-QLIDEVVNGGDLFGEGHVDGLKAIRDL -QTPVNAQHPDFGAKVNQLM----------------------------------------- --------------------------VTFAGPEG-----------------RQPLLKRFAN -N-----SFGTIN-FASHG-SFCGLSYRAGSGAFMNDFANNSHA-KPDW-DHVEFILFMGT ---SPAQ----SG-NPFKRQSRQLAKKRT--------EDNFE----YVVIAPRLELTSTAA -Q-DKNRWVPIIPGKDLSLALAMLRWIIENERYNE----------DYLSIPSE-------- --------------IAMQQANGVSFCNATHLFIADPNHKQYGQAIRNFHI-EDLSEPEKLS -DSDILVKDRQTGKFIAAKDCQSAVLFVEDRISLKD------------------------- -------GSQVLAKSALQLFKESCFS----------------------------------- -------------YSIEEYSEQCGVPV---------DTIIQLAKKFTSH----GPRAAVIT -HGGT----MHSNGFYTAWAILLLNAMIGNMNKKGGMSMSGGKFKDFSAG----------- -----PRYNLANFPNMVKPKGTNLARSKKDYEKSSEFKQKVAQGISPYPAK---------- ------------------------AAWYPFVGGQMS--EMITSALQGYPYS----LKAWIN -HMGNPIYG-------------------------------MTGIHHITQQKLKDPK--ILP -LFISIDAFMNETTAL--ADYIVPD-THNFE-SWGFSTPWAGVPT--------KTSTA-RW -PVIASPN-E---K--------TSQGDTICMESFVIEIA-KMMQLPGFGDNAILDKQNHSY -PL----------NRSEDFFL--RAAA-------------------NIAYDGKQPVQDATQ -EDLLLTGVQRLMPSLQQVL-----------------KPEEIK-KVATIYCKGG------- --------------RFAPHSSAWQEDN-------------------------MQARWKNCL -QIWNENVAKAKHAQTG--------------------------KNYHGCPTYFEDQFADNS -TVESHYPKIQWPFKLISFKSNLMSS------------------ITAPLLR--LHSI---- ------KP-----NGIVAINQQDATE-YGL-------------Q-------------HGDL -VELN---TP-G--------------GK---A--V-VQLVVMNGVIKGTIAIEHG-YGHKQ -LGATGYTINGKL-----------IEGNAQIGSGVNINDLGLL-----DSTKEIASPWV-- ------DWVCG-------SAV----RQ--GI-----PAKLVKLA----------------- ------------------------------------------------------------- -- ->TtrA_Yersinia_enterocolitica_YP_001005907 ------------------------------------------------------------- ------------------------------MAKSTRRQWLKGS-------LALGGVVAFGA -SY-HAVAR-KTLAGLVDGSAGKLTLDPISGNALPTEGRVGP-QWQANPQQAVSMTQCFGC -WTLCGLRVRVDTQQN---KILRIAG--------NPYHPLSH------DHHFPYQ--LPVG -EALQHLGGEQGMTGRSTACARGATLLEGVDSPY-RITEPMKRVG---------------- -------------------PRGSGK-WQRISFE-QLVAEVTEGGDLFGEGPVEGLRAIRDL -DTPIDAKQPSLGPKANQLL----------------------------------------- --------------------------VTNAGDDG-----------------RDAFIQRFAN -Q-----AFGTKN-LGSHG-AYCGLAYRAGSGALMGDLDKNAHV-KPDW-DNVRFALFLGT ---SPAQ----SG-NPFKRQGRQLANARQ--------RDDFN----YVVVAPALPLTTTLA -N-QHNRWVPVLPGTDAALAMGIIRWIIEQHRFNH----------AYLAIPGE-------- --------------MAMQAAGERSWTNASHLVITTETHPLAGQFLRANML---SGETVAEG -EESPVLAQAIDGALQPAAQMLQAELFVTQDLTLHD------------------------- -------GQNVQVQSGMTCLQQAAAR----------------------------------- -------------FTLAEYSQQCGVPE---------ATIIGLAREFTAY----QRQAAVIS -HGGM----MGGNGFYTTWAVMMLNAMIGNLNLKGGVSVGGGKFDGFADG----------- -----PRYQLATFVGMVKPKGLPLSRSKQPYEKSEEYQQKIQQGQSGYPAR---------- ------------------------GPWYPFVGGQLT--EQLAPALAGYPYP----LKAWIS -HMTNPLYG-------------------------------VAGLRNLIEERLQDPR--QLP -LFIAIDAFMNETTAL--ADYIVPD-THNFE-SWGFSAPWAGVLV--------KASTA-RW -PVVEPRTAR---TAQGEP---VAM------ESFLIAVA-KAMKLPGFGANAMQDSEGNSL -SL----------DRAEDYYL--RAAA-------------------NIAYGGEKPLPAAVD -DELRLTGVDRLWPALQRSL-----------------YPDEQR-RVAYLLARGG------- --------------RFAPYEKSWNGDA-------------------------TGSQWKKPL -QIWNENVAKHHHAITG--------------------------ERYSGCPTWYPPRLADGS -DVFQHYPVSDWPLRLMSFKSHLMSS------------------STAMIER--LRAV---- ------KS-----TNLVAINPQDAQR-NGI-------------Q-------------HGDI -VRLM---TP-G--------------GQ---M--E-VQVSLLDGVMPGVVAIEHG-YGHRE -MGSRAHT----------------LDGVVMASDPRIGQGSNLNDLGFTDPTREIPNTWL-- ------DWVSG-------AAV----RQ--GL-----PAKLQRIS----------------- ------------------------------------------------------------- -- ->DmsA_E_coli_sp_P18775 ------------------------------------------------------------- --------------------MKTKIPDAVLAAEVSRRGLVK---------TTAIGGLAMAS ----SALTL---------------PFSRIAHAVDSAIPT-------KSDEKVIWSACTVNC -GSRCPLRMHVV-DGE----IKYVETDNTGD---DNYDGLHQ------------------- ----------------VRACLRGRSMRRRVYNPD-RLKYPMKRVG---------------- -------------------ARGEGK-FERISWE-EAYDII--------ATNMQRL--IKEY -G-------------NESIYLNYGTGTL--------------------------------- --------------------------GGTMTRSWPP---------------GNTLVARLM- -N-----CCGGYLNHYGDY-SSAQIAEGLNYTYGGW---ADGNS-PSDI-ENSKLVVLFGN ---NPGE----TR-MSGGGVTYYLEQARQ--------KSNAR----MIIIDPRYTDTGAGR -E---DEWIPIRPGTDAALVNGLAYVMITENLVDQ----------AFLDKYCV-------- ----------------------------------------------------------GYD -EKTLPASAPKNGHYKAYILGEGPDGVA--------------------------------- ------------------------------------------------------------- -------------KTPEWASQITGVPA---------DKIIKLAREIGST----KP-AFISQ -GWGP---QRHANGEIATRAISMLAILTGNVGINGGNSGAREGSYSL-------------- -----PFVRMPTLENPIQTSISMFMWTD--------------------------------- ------------------------AIERGPEMTALR--DGV-RGKDKLDVP----IKMIWN -YAGNCLIN-------------------------------QHSEINRTHEILQDDK--KCE -LIVVIDCHMTSSAKY--ADILLPD-CTASE-QMDFALDASCGNM--------SYVIF-ND -QVIKPRF-E---C--------KTI------YEMTSELA-KRLGVEQQFTE---------- -------------GRTQEEWMR-HLYA-------------------QSREAIPELPT---- -------------------------------------FEEFRKQGIFKKRDPQG------- --------------HHVAYKAFREDPQ-----------------------ANPLTTPSGKI -EIYSQALADIAATWELP-------------------------EGDVIDPLPIY-TP--GF -ESYQDPLNKQYPLQLTGFHYKSRVHSTYGNVD-----------VLKAACRQE-------- ------MW----------INPLDAQK-RGI-------------H-------------NGDK -VRIF---ND-R--------------GE---V--H-IEAKVTPRMMPGVVAL--G-EGAW- ------------------------YDPDAKRV------DKGG------CINVLTTQRPS-- ------PLAKG-------NPS----HTN--------LVQVEKV------------------ ------------------------------------------------------------- -- ->DmsA_Actinobacillus_succinogenes_130Z gi|75429943|ref|ZP_00732527.1| ------------------------------------------------------------- ------------------------MNHLDLNSNTTRRRFIKTTG------LTAFAASAGIS -IPFATKAG---------------NQSITST--------------AGADEKVVWSACTVNC -GSRCPLRMHVK-DDQ----IIYVETDNTGS---ETYNLDHQ------------------- ----------------VRACLRGRSMRRRVYNPD-RLKYPMKRIG---------------- -------------------KRGEGK-FKRISWD-EALTEI--------AQSLQKN--IAQY -G-------------NESIYLNYGTGTL--------------------------------- --------------------------GGTVTKSWPP---------------GSTLIARLM- -N-----CIGGYLNHYGDY-STAQISVGLDYTYGGGWVLGNGMA---DI-ENTKLVVLFGN ---NPAET---RMSGGGLTYCIQQAKAKS----------NAK----LIVIDPRYTDTGVGK -E---DEWIPIRPGTDAALVSALAYVMITEELVDQ----------PFLDKYCV-------- ----------------------------------------------------------GYD -ENTLPADAPQNGHYKAYILGQGEDGIA--------------------------------- ------------------------------------------------------------- -------------KTPEWAAKITGIPA---------ERIIRLAREIGST----KP-AYISQ -GWGP---QRRSNGEIISRAIAMLPILTGNVGISGGNTGARESSYGV-------------- -----PFVMMPTLTNPVKASIPMFLWT---------------------------------- ------------------------DAITRATEMTAK--TDGIRGVERLTAP----IKFIWN -YAGNCLTN-------------------------------QHADINRTHEILQDES--LCE -MIVTIDNHMTSTAKY--SDIVLPD-CMTSE-QMDFCLDGYVANM--------SYVIF-AD -QAVKPSF-E---C--------RNI------YDMLSDLS-EKLGVKQQFTE---------- -------------DRTQEEWLRYIYRQ--------------------SREQLPELPV---- -------------------------------------FDEFRTQGIFKKVDPKG------- --------------FYIPYKEFRDDPQ-----------------------ANPLKTPSGKI -EIYSSRLAEIARSWKLD-------------------------EDEVIHPLPIHVDSFEHY -GD---PLMEKYPLQLTGFHYKARTHSTYGNVD-----------ILKS----ANPQE---- ------IW----------INPFDAEK-RGI-------------K-------------NGDM -LRMF---ND-R--------------GE---V--R-IHAKVTPRIIPGVVAL--G-EGAW- ------------------------HAP-----------DNQGID-HSGCINVLTTQRP--- ------SPLAK-------GNP----QH--SN-----LVQVEKL------------------ ------------------------------------------------------------- -- ->DmsA_Haemophilus_influenza_sp_P45004 ------------------------------------------------------------- ---------------------------MSNFNQISRRDFVK---------ASSAGAALAV- ----SNLTL---------------PFNVMAKETQRLNEN--------NQERIVWSACTVNC -GSRCPLRMHVK-DNR----ITYVETDNTGT---ETYNLDHQ------------------- ----------------VRACLRGRSMRRRVYNPD-RLKYPMKRIG---------------- -------------------KRGEGK-FKRISWD-EALTEI--------ADALKRN--IKKY -G-------------NESIYLNYGTGTL--------------------------------- --------------------------GGTMAKSWPP---------------ASTMIARFM- -N-----CIGGYLNHYGDY-STAQIAVGLDYTYGGG--WALGNG-MADI-ENTKLIVLFGN ---NPAET---RMSGGGLTYCIEQAKARS----------NAK----MIIIDPRYNDTGAGR -E---DEWIPIRPGTDAALVAALAYVMIQENLVDQ----------PFLDKYCV-------- ----------------------------------------------------------GYD -EKTLPTDAPKNGHYKAYILGYGNDGIA--------------------------------- ------------------------------------------------------------- -------------KTPEWAAKITGIPA---------ERIIKLAREIGST----KP-AFISQ -GWGP---QRRSNGELISRAIAMLPILTGNVGIHGGNTGARESAYSI-------------- -----PFVRMPTLKNPVKASIPMFLWTD--------------------------------- ------------------------AIIRGTEMTALT--DGI-RGVDKLSSP----IKVIWN -YASNCLIN-------------------------------QHAQINRTHDILQDDT--QCE -MIITIDNHMTSTAKY--SDILLPD-CTTSE-QMDFALDAFVSNM--------AYVIF-AD -QVIKPSF-E---C--------RPI------YDMLSDLA-EKMGVKEKFTE---------- -------------GRTQEEWLR-HIYE-------------------QSREKLPELPT---- -------------------------------------FEEFRQQGIFKKVDPNG------- --------------FKVAYKDFRDNPE-----------------------AHPLKTPSGKI -EIYSSRLAEIAKTWKLA-------------------------EDDVIHPLPIHAQSFEHY -GD---PLMEKYPLQLSGFHYKARTHSTYGNVD-----------VLKA----ANPQE---- ------VW----------MNPIDAEP-RNI-------------K-------------NGDM -IRIF---ND-R--------------GE---V--H-INVKITPRIIPGVVAL--S-EGAW- ------------------------YAP-----------DKDRID-HSGCINVLTTQRP--- ------SPLAK-------GNP----QH--SN-----LVQVERL------------------ ------------------------------------------------------------- -- ->TMAO_Shewanella_massilia_CAA06851 ------------------------------------------------------------- ---------------------------------MNRRDFLK----------GIASSSFVVL -GG-SSVLT---------------PLNALAK--------------AGINEDEWLT----TG -SHFGAFKMKRK-NGV----IAEV----------KPFDLDKY------------------- ----------------PTDMINGIRGMV--YNPS-RVRYPMVRLDFLLKGHKSNTH----- -------------------QRGDFR-FVRVTWD-KALTLF--------KHSLDEV--QTQY -G-------------PSGLH----AGQT--------------------------------- --------------------------GWRATGQLHS---------------STSHMQRAV- -G-----MHGNYVKKIGDY-STGAGQTILPYVLGSTEVYAQGTS-WPLILEHSDTIVLWSN ---DPYKNLQVGW-NAETHESFAYLAQLK----EKVKQGKIR----VISIDPVVTKTQAYL -G---CEQLYVNPQTDVTLMLAIAHEMISKKLYDD----------KFIQGYSL-------- ----------------------------------------------------------GFE -E------------FVPYVMGTKDGVA---------------------------------- ------------------------------------------------------------- -------------KTPEWAAPICGVEA---------HVIRDLAKTLV------KGRTQFMM -GWCI---QRQQHGEQPYWMAAVLATMIGQIGLPGGGISYGHHYSSIGV------------ -----PSSGAAAPGAFPRNLDENQKP---------LFDSSDFKGASSTIPV---------- ------------------------ARWIDAILEPGK--TIDANGSKVVYPD----IKMMIF -SGNNPWNH-------------------------------HQDRNRMKQ-AFH-----KLE -CVVTVDVNWTATCRF--SDIVLPA-CTTYE-RNDIDVYGAYANR--------GILAM--Q -KMVEPLF-D---S--------LSD------FEIFTRFA-AVLGKEKEYTRNMGEM----- -------------EWLETLYN--ECKA-------------------ANAGKFEMPD----- -------------------------------------FATFWK-QGYVHFGDGE------- --------------VWTRHADFRNDPE-----------------------INPLGTPSGLI -EIFSRKIDQFGY------------------------------DDCKGHPTWME-KTERSH -GG---PGSDKHPIWLQSCHPDKRLHSQMCESR-----------EYRETYAVNGREP---- ------VY----------ISPVDAKA-RGI-------------K-------------DGDI -VRVF---ND-R--------------GQ---L--L-AGAVVSDNFPKGIVRI--H-EGAW- ------------------------YGPVGKDGSTEGGAEVGALC-SYGDPNTLTLDIGT-- ------SKLAQ-------ACS----AY--TC-----LVEFEKYQGKVPKVSSFDGPIEVEI ------------------------------------------------------------- -- ->TMAO_Photobacterium_profundum_YP_129680 ------------------------------------------------------------- -----------------------------MNMSVSRRSFLK---------GLATTSAVSVI -GP-SLLAS---------------SKAMAAE---------------------TTGTWKTSG -SHWGAFRAHVY-AGK----VQEI----------KPLEMDKY------------------- ----------------PTDMLNGIKGII--YSPS-RVRYPMVRLDWLKKHKYSGE------ -------------------TRGNNR-FIRMTWD-DALDLF--------YRELERV--QKDY -G-------------PWALH----AGQT--------------------------------- --------------------------GWRQTGQFHS---------------CTSHMQRAV- -G-----MHGNFITKVGDY-STGAGQTILPYVLGSTEVYAQGTS-WSEILDHSKNIVLWAT ---DPVKNLQVGW-NCETHESFAYLEQLK----EKVAKGEIN----VLSVDPVKNKTQRFL -G---NDHMYINPQTDVAFMLAVAHTLYTEDLYDK----------EFIKMYCL-------- ----------------------------------------------------------GFD -E------------FVPYFMGKSKDNIE--------------------------------- ------------------------------------------------------------- -------------KTPEWAAEICGLPA---------DEIRDFARMLVAE------RTQILF -GWCI---QRQEHGEQPYWMGAVIAAMVGQIGLPGGGVSYGHHYSSIGV------------ -----PSTGFAAPGGFPRNVDEGQKP---------KWDNNDFNGYSRTIPV---------- ------------------------ARWVDCLLEPGK--EIKYNGSKVILPD----YKMMII -SGNNPWHH-------------------------------HQDRNRMKQ-AFQ-----KLQ -TVVTIDFAWTATCRF--SDIVLPA-CTQFE-RNDIDVYGSYSGR--------GLVAM--H -KLVDPLY-Q---S--------KTD------FDIFTELS-RRFGRHKEYTRGMDEM----- -------------EWVRSLYS--DCRD-------------------ANKAKFDMPE----- -------------------------------------FDEFWA-KGVLDFGEGT------- --------------PWVRHADFREDPE-----------------------INALGTPSGFI -EISSRKIDRFGY------------------------------EHCQGHPMWFE-KSERSH -GG---PGSKKHPFWMQSCHPDKRLHSQMCESE-----------EMRATYAVKGREP---- ------VY----------INPKDAAE-KGI-------------K-------------DGDI -VRVF---ND-R--------------GQ---L--L-AGAVLSDSYARGVIRI--E-EGAW- ------------------------YGPLNE--------KVGAID-TYGDPNTLTQDIPS-- ------SELAQ-------ATS----AN--TC-----LVDFEKFKGEVPPVTSFGGPIEVS- ------------------------------------------------------------- -- ->TMAO_Vibrio_vulnificus_YP_004189064 ------------------------------------------------------------- -------------------------------MAITRRSFLK---------GVATTSAASVI -GP-SLLAS------------------------------------ASANAVETTGTWKVSG -SHWGAFRAHIY-AGK----VQEI----------KPIELDQN------------------- ----------------PTEMLNGIKGII--YSPS-RVRYPMVRLDWLKKHKYSAD------ -------------------TRGNNR-FVRVTWD-EALDLF--------YRELERV--QKEY -G-------------PWALH----AGQT--------------------------------- --------------------------GWNQTGSFNN---------------CTAHMQRAV- -G-----MHGNYITKVGDY-STGAGQTILPYVLGSTEVYAQGTS-WSEILENADNIILWAN ---DPVKNLQVGW-NCETHESYAYLAQLK----EKVAKGEIN----VISVDPVKNKTQRYL -E---NDHLYVNPMTDVPFMLAIAHVLYTENLYDK----------KFIETYCL-------- ----------------------------------------------------------GFE -E------------FINYVQGKTKDKVE--------------------------------- ------------------------------------------------------------- -------------KTPEWAAPICGVKA---------DKIREFARMLV------KGRTQILM -GWCI---QRQEHGEQPYWAAAVVAAMIGQIGLPGGGISYGHHYSSIGV------------ -----PSTGFAGPGGFPRNLDAGMKP---------KWDNNDFNGYSRTIPV---------- ------------------------ARWIDCLLEPGK--EINYNGGKVKLPD----FKMMVI -SGCNPWHH-------------------------------HQDRNRMKQ-AFQ-----KLQ -TVVTIDFAWTATCRF--SDIVLPA-CTQWE-RNDIDVYGSYSSR--------GLIAM--H -RLVDPLF-Q---S--------KPD------FQIMKELT-ERFGRSEEYSRGMSEM----- -------------DWIRSLYN--DCKK-------------------SNEGKFEMPE----- -------------------------------------FDEFWE-KSVLDFGQGQ------- --------------PWVRHADFRQDPE-----------------------INPLGTPSGFI -EITSRKIGRYGY------------------------------EHCQEHPMWFE-KSERSH -GG---PGSDKHPFWLQSCHPDKRLHSQMCESE-----------EFRATYAVKGREP---- ------VY----------INPLDAKA-KGI-------------K-------------EGDL -VRVF---ND-R--------------GQ---L--L-AGAVLTDSYPRGVIRI--E-EGAW- ------------------------YGPLSE--------KVGAIC-TYGDPNTLTQDIGS-- ------SELAQ-------ATS----AN--TC-----IVDFEKFTGKVPPVTSFGGPIEVA- ------------------------------------------------------------- -- ->TMAO_Citrobacter_youngae_ZP_06352135 ------------------------------------------------------------- --------------------------------------------------MLAVGAASAL- ----APNPL---------------ISKVWAA-------------------GENPEQWIQSG -SHFGAFEAKVV-NGE------WLET--------RPFKHDKY------------------- ------------------PCDMLNAVREVVYNPS-RVRYPMVRLDWLRKREKSDRS----- -------------------QRGDNR-FVRVSWD-QALDLF--------YEELERV--QKTY -G-------------SSGVF----TGLA--------------------------------- --------------------------DWQMVGKYHK---------------AGGAMDRGL- -G-----LHGSYVTTVGDY-SAAAAQVILPHVIGSLEVYEQQTS-LPLVIQNSNTIVLWGC ---DPIKNLQIEFLVPDHDAFGYWQQIKE-----AVAQGKMR----VISVDPVRSKSQNYL -G---CEQLALRPQTDVALMLALAHTLYEEKLYDT----------AFINDYTV-------- ----------------------------------------------------------GFE -Q------------FLPYLLGESDKQP---------------------------------- ------------------------------------------------------------- -------------KNAEWAAEICGLTA---------EQIRDFARLLV------KGRTQFMG -GWCA---QRMHHGEQYPWMLVVLASMVGQIGLPGGGVGFGWHYNGGGTVTS--------- -----AGPVLSGLGGIANPPPAKY--------------KADFRGASEHIPT---------- ------------------------SRIVDCLLEPGK--KVAFNGETLTWPD----IKMAIY -SAANPFHA-------------------------------QQDRNRMIE-AWK-----KLE -TVVVLDHQWTASCRF--ADIVLPV-TTRFE-RNDIEQFGTHSNK--------GLMAL--H -QVVKPQY-E---A--------RHD------FDVFAGLC-KRFDKEAVYRE---------- -------------NRDEMQWIQALYDE--------------------GVKMGASLGVSLPD -------------------------------------FTTFWQGEGYIEYPAGQ------- --------------PWVRHGEFRDQPD-----------------------LNPLGTPSGLI -EIYSKTIAGFAY------------------------------EDCPGHPVWME-PFERNH -SA----KKNKYPLHLQSCHPDKRLHSQLCSSD-----------AFRNTYAVAGREP---- ------LY----------ISAQDAAA-RGL-------------K-------------AGDI -ARVF---ND-R--------------GQ---V--L-AGVVISPDFTPGVIRI--H-EGAW- ------------------------YSP-------QEGGKAGTLC-TYGDPNVLSADIGT-- ------SQLAQ-------GPS----AH--TV-----LVEVERYQQKAPQVTAFGGPETV-- -------KEEGGSAA---------------------------------------------- -- ->TMAO_Salmonella_enterica_gb_AEZ47489 ------------------------------------------------------------- -------------------------MKNKDSLHVSRRRFLAQL-------GGLTVAGMLGP -SLLTPRSA---------------RAADAVA------------------PGAATKEGILTG -SHWGAIRATVV-DGR------FVAA--------KPFEQDKY------------------- ----------------PSKMIAGLPDHV--HNAA-RIRYPMVRVDWMRKGHQSDTS----- -------------------QRGDNR-FVRVSWD-EALDLF--------YQELERV--QKTY -G-------------PSALL-----TAS--------------------------------- --------------------------GWQSTGMFHN---------------ASGMLARAI- -A-----LHGNSVSTGGDY-STGAAQVILPRVVGSMEVYEQQTS-WPLVLQNSKTIVLWGS ---DMVKNQQANW-WCPDHDVYQYYEQLK----EKVASGAIS----VISIDPVVTSTHDYL -GRDKVKHIAINPQTDVPLQLALAHTLYSEKLYDK----------NFLDNYCV-------- ----------------------------------------------------------GFD -Q------------FLPYLLGEKDGQP---------------------------------- ------------------------------------------------------------- -------------KDAAWAEKLCGIDA---------DTIRALARQMA------GDRTQIIA -GWCV---QRMQHGEQWSWMVVVLAAMLGQIGLPGGGFGFGWHYNGAGT------------ -----PGRKGIILSGFSGSTTVPPVHDSTDYKGYSSTIPI--------------------- ------------------------ARFMDAILEPGK--IINWNGKSVKLPP----LKMCVF -AGTNPFHR-------------------------------HQQINRIIE-GWR-----KLE -TVIAIDNQWTSTCRF--ADIVLPA-TTQFE-RNDLDQFGNHSNR--------GIIAM--K -QVVSPQF-E---A--------RND------FDIFRDLC-RRFNREAAFTEGLDEM----- -------------GWLKRIWQ--EGSQ-------------------QGKGRGIHLPT---- -------------------------------------FEVFWNQQEYIEFDHPQ------- --------------MFVRHQAFREDPD-----------------------LEPLGTPSGLI -EIYSKTIADMQY------------------------------DDCQGHPMWFE-KIERSH -GG---PGSQRWPLHLQSVHPDFRLHSQLCESE-----------TLRQQYAVGGKEP---- ------VF----------INPQDASA-RGI-------------R-------------NGDI -VRVF---NA-R--------------GQ---V--L-AGAVVSDRYAPGVARI--H-EGAW- ------------------------YDP-------DKGGDLNALC-KYGNPNVLTLDTGT-- ------SQLAQ-------ATS----AH--TT-----LVEIEKYTGPMDNVTAFNGPAEMVA -QCEYVPASQGNPHD---------------------------------------------- -- ->TMAO_E_coli_CAA52095 ------------------------------------------------------------- -------------------------MNNNDLFQASRRRFLAQL-------GGLTVAGMLGP -SLLTPRRA---------------TAAQAAT------------------DAVISKEGILTG -SHWGAIRATVK-DGR------FVAA--------KPFELDKY------------------- ----------------PSKMIAGLPDHV--HNAA-RIRYPMVRVDWLRKRHLSDTS----- -------------------QRGDNR-FVRVSWD-EALDMF--------YEELERV--QKTH -G-------------PSALLTAS-------------------------------------- --------------------------GWQSTGMFHN---------------ASGMRAKRI- -A-----LHGNSVGTGGDY-STGAAQVILPRVVGSMEVYEQQTS-WPLVLQNSKTIVLWGS ---DLLKNQQANWWCPDHDVYEYYAQLKR-----KSAAGEIE----VISIDPVVTSTHEYL -GGEHVKHIAVNPQTDVPLQLALAHTLYSENLYDK----------NFLANYCV-------- ----------------------------------------------------------GFE -E------------FLPYLLGEKDGQP---------------------------------- ------------------------------------------------------------- -------------KDAAWAEKLSGIDA---------ETIRGLARQMAAN------RTQIIA -GWCV---QRMQHGEQWAWMIVVLAAMLGQIGLPGGGFGFGWHYNGAGT------------ -----PGRKGVILSGFSGSTSIPP-----------VHDNSDYKGYSSTIPI---------- ------------------------ARFIDAILEPGK--VINWNGKSVKLPP----LKMCIF -AGTNPFHR-------------------------------HQQINRIIE-GLR-----NVE -TVIAIDNQWTSTCRF--ADIVLPA-TTQFE-RNDLDQYGNHSNR--------GIIAM--K -QVVPPQF-E---A--------RND------FDIFRELC-RRFNREEAFTEGLDEM----- -------------GWLKRIWQ--EGVQ-------------------QGKGRGVHLPA---- -------------------------------------FDDFWNNKEYVEFDHPQ------- --------------MFVRHQAFREDPD-----------------------LEPLGTPSGLI -EIYSKTIADMNY------------------------------DDCQGHPMWFE-KIERSH -GG---PGSQKYPLHLQSVHPDFRLHSQLCESE-----------TLRHEYTVAGKEP---- ------VF----------INPQDASA-RGI-------------R-------------NGDV -VRVF---NA-R--------------GQ---V--M-AGAVVSDRYAPGVARI--H-EGAW- ------------------------YDP-------DKGGELGALC-KYGNPNVLTIDIGT-- ------SQLAQ-------ATS----AH--TT-----LVEIEKYNGTVEQVTAFNGPVEMVA -QCEYVPASQVKS------------------------------------------------ -- ->TtrA_Aeropyrum_pernix_NP_148724 ------------------------------------------------------------- --------------------------------MVSRRDFVK---------GSIAIASLLVA -GA-GLQPV--------------LSQLVRPKFERIAPDL------QMGANVRYVYSSCLGC -NVRCGIKARVVKVGDLEI-VERIEG--------NPYHPYNRAVSLNGNGKLGSQHLRFYH -LPYNTPVKEALTKWHGTLCPRGQDGIYYLYDPY-RVLVPLKRAG---------------- -------------------PRGSGK-WKPISWEQLIREVVEGGVIEETGERLPGLRDFFVY -G----KLREAGFEDPNAILSDMKKDVQEILEYAKKPETSYEDIVMKIEEFKEKWSKILGE -KGLKLDDILIDPDRPDLGTKANMVAYLRGRGQGH----------------TDYMSARWI- -A-----GFGSVN-WLRHT-SACQLGYYAANYLWAG---YHDIQ--PDP-VSSKVIIMAGA -SMGRLH-------PGTTGQGLLISRAGE---------GDLK----IYYVNPTAPRTDAGG -N---IVWIPIKPGYDAALAFALIRWIIENERYNK----------EFLEIPNE-------- ----------------------EAAERKGYPVHSNATWLVIMEEGHEKWGEYLKAKDVGLE -D-SDKPVVFTGEGLATYDSVDNAEIDWEGEVVLTT------------------------- -------GERVKVKTSFRILKDEALSR---------------------------------- -------------SIDQWLSVASPYEPGSSEFREWKEKVLEMARDFAEA----APMAGTYV -HRGV---GMHSNGEYAVWAYRALDTLVGNYHRKGGLLARAGHTKYNSY------------ -----VYHVDKKGFGEPVKWGPPIDRHKAKYEDTLEYWLKVKKGENPYPAKR--------- ------------------------PWYPHTPEESYT--EIFAGIAEEYPYK----MGALIL -FYANPVLS-------------------------------ANYGVKFIE-VLKDTK--KLP -LFIAITTTINETMLY--ADYIVPD-TTYLE-TGTLGMQYLYASSGGV-----LLAEAARS -PVVMPLT-----QKIGEPERYASF------WEFFIDTG-KALGMPGFGKG---------- -------------AIKGLKYH--EGKS-------------------YDLDSLWDYIMRVYA -NAAMHAKDMGIIPENVPEEEVKFVEENYPVAKFKHLIPDEWP-YVAYMLARGG------- --------------VFTSYEESFHPNGVSKRKV----------PSKRKKFKKTLMLWNEDL -AKTRNSVTG---------------------------------AKFWGGPKYIP-PSTYAP -VKGGSKSFYGTPLREIYPESEYPFHLVFTTGPLFTKHRSQFYYAIKQISP---------- -------------ENYLVVNPKDAEK-LGL-------------E-------------TGDV -VEVE---TP-T--------------GR---F--K-APVVVEPTVPPGVIMVPYG-MGRWA -DTVVKKPSYFE------------VKDSRLASLINELPEREEIPEEAVNPVKKLPELKK-- ------KVLFTKSTPAYYNQAEPDKWRFNGITPN--VAEMSDPSLGGWPLLSIIGAAQAYY -FNVARIRKTGEKHEFEKTYPYIVW------------------------------------ -- ->TtrA_Pyrobaculum_arsenaticum_YP_001152643 ------------------------------------------------------------- --------------------------------MTSRRTYLK---------AIAAAA---AL ----GVALW-GYWPVV--------DKIIKPKRNPYGPDP------QYGKNVRYVHTTCLGC -NVRCGIRVRVVKYGDVEV-IERIEG--------NPYHVYNRAVSFD----SQVK--RYKQ -LPYNTPVKEALERWSGTLCPRGVDGIHYVYDPY-RVLKPLKRAG---------------- -------------------PRGSGK-WKVITWEQLNNEVVNGGIIEETGERLPGLKDFFVY -G----KLKEAGFEDPNAVLSEMKADVDNIMKIARDPNKTYDELVKAIEGFKAKWSQKLGE -KGLKLEDVFIDPDRPDLGTKANMVMYLRGRGQPP----------------TDYFSQRWI- -Y-----AFGSVN-WTRHT-SACQLGFYTGNRIWAG---YTDIQ-A----DPVGAKVIIGA -----------GWSMGRLHPGATGQGLII----ERACEGDLK----LYYINPVAPRTPCNG -N---IIWIPVKPGEDATLAFAVIRWLIENKRYNE----------EFLSLPNR-------- ------------------------DSAKKAGYPVNTNATWLVITEGQRFGEYLKARDIGLE -N-SDKPVVWTGEKFATYDSVDKADLYYVGKVTLPT------------------------- -------GEAVAVKTAFMILREEAFSR---------------------------------- -------------SFEEWLAIASPYEPGTPEFRDYVKKVEQMARDFADA----APRAGTMI -HRGV---GMHPNGEYITWAYRAIDTLIGNFHRMGGLLGRAANTSYLSYVYNVGYSGFGEP -PRWGPPIDRHNYAYEATLEYWLRVKEAL------KEGKSWEDAVKAAFPTKR-------- ------------------------PWYPLTPEESYT--EIFAGIAEGYPYK----IGAFIM -FYANPVLA-------------------------------TNYGVKFVE-VLKDTS--KIP -LFIAITTTINETAMY--ADYIVPD-TTYLE-TGTMGVQFLYATSGGV-----TLAEPWRS -PAIMPLT-QRISDCPNGHPRYASF------WEFFIDTA-KALGMPGFGDRAVPGVKG--- -------------KKYEGRWF--PLHC-----------------------EWEYVMRVFAN -AALDAKDRGLIPEQVPEEEVKFVEENYPIAQFKDIIPPEEWK-YVAYGLARGG------- --------------VFTSYEQSFDERGV----------------------SKRSVPGRGTL -YLWDETLAKTRNSVTGEKFW----------------------GGPKYFPIATY-APAGPA -FQKADKWLHGTPLRQLYPEKDWPFMLVFYTGPIYTKHRSQFYYWIKQIAP---------- -------------ENFVLINPEDAAK-IGV-------------E-------------TGDV -VRVE---TP-V--------------GF---F--E-APAVVEPTVAPGVIMVPYG-MGRWA -DTVLVKPKYFELRDAKLKLTVDGLPEKMEVPEDAVNPVKGLPDVVKKILFTKSPAEYY-- ------EKGLA-------PDK----WRFNGVTPN--VVQMSDPSLGGWPLLSWLGASQAYF -DTPVRITKTGQKHKFETPYIVW-------------------------------------- -- ->TtrA_Pyrobaculum_aerophilum_NP_559177 ------------------------------------------------------------- --------------------------------MTSRRAYLK---------AIAAAA---TL ----GIALW-GYWPVV--------DKIIKPKRTPYGPDP------QFGTNVRYVFSSCLGC -NVRCGIVARVVKYGDVEV-IERIEG--------NPYHVYNRAVSFD----KQIK--RYAP -LPYNTPVKEALEKWSGTLCPRGADGIHYVYDPY-RVLKPLKRAG---------------- -------------------PRGSGK-WKAITWEQLINEVVNGGVIEETGERLPGLKEFFAY -G----KLKEAGFEDPNAILSEMKIDVDNIMKVARDPNKTYDDLIKAIEEFKAKWSQRLGE -KGLKLEDLLIDPDRPDLGTKANMVMYLRGRGQGHT----------------DYFSQRWI- -Y-----AFGSVN-WTRHT-SACQLGYYAGNSIWAG---YHDIQ-A----DPIGAKVIIGA -----------GWSMGRVHPGATGQGLMI----ERACEGELK----LYYVNPVAPRTTCNG -N---IIWIPVKPGEDAALAFAVIRWLIENKRYNE----------EFLSIPNR-------- ------------------------DSAKKLGYPVNTNATWLVITEGERFGEFLKARDVGIE -D-SDKPVVWTGERFATYDSVDKADLYYVGKVTLPS------------------------- -------GETVTVKTAFMIVRDEAFSK---------------------------------- -------------SFEDWLAIASPYERNTPEFADYVKKIEQMAKDFADA----APKAATTL -HRGV---GMHPNGEYIVWAYRTIDTLVGNFHRMGGLLARAAHTAYENYVYNVGRSGFGEP -VRWGPPIDRHRYAYENTLEYWLRVKKAL------KEGKSWDEAVKAAFPTKR-------- ------------------------PWYPHTPEESYT--EIFAGIAEGYPYR----IGALIL -FYANPVLA-------------------------------TNYGVKFIE-VLKDPA--KLP -LFIVITTTINETALY--ADYIVPD-TTYLE-TGTMGIQYLYATSGSV-----TLAESWRS -PVIMPLT-QRISDCPNGHPRYASF------WEFFIDTA-KALGMPGHGDKAIPGVKG--- -------------KKYEGKWF--SMHC-----------------------EWEYILRVFAN -AALDAKDKGLIPEDVPEEEVKFVEENYPIAQFRDILPPDEWK-YVAYGLARGG------- --------------VFTKYEESFDERGI----------------------SKRRVPGRGTL -YLWSEEVAKTRNNVTGEKFW----------------------GGPKYFPIATY-APAVPA -FQKADEWLHGTPLRQLYPEKEWPFILILYTGPLYTKHRSQFYYWIKQVVP---------- -------------ENFVLINPEDAAK-LGV-------------E-------------TGDV -IKVE---TP-V--------------GA---F--E-APAVVEPAVAPGVIMVPYG-MGRWA -DTVVVKPKYFE------------LKDARAKSLIDELPDKVEIPEDAVNPVKHLPDVVK-- ------KLLFTKSPAEYYEKGLAVDKWRFNGVTPN-VAEMADPSLGGWPLLSWLGAAQAYF -DTPARIVKTGQRHKFEVPYIVW-------------------------------------- -- ->ACTB1_Anaeromyxobacter_dehalogenans_YP_002491266 -----------------MPSLGLPIYGQK----------QGAGLDARRWRSVEEAA---EA -REVPPGEFPDDAAAVPE--G----------FT--RRGFLQ-V-------LGASVA---LA ----GLEAC--KPP----------RENVVSY--VRPPAG------VTPSLPSAYATVASRG -GYAVGVVVTSH-EGR----PTKIEG--------NREHPSSR------------------- ----------------GGSDAMLQASILDLYDPR-RLKG-FTRAG---------------- ---------------------------RPLGFA-TLLREV---------SALARSHAQDGG -A---------------RLR----------------------------------------- --------------------------FLVEPTSSPA---------------VADLRRRIL- -E-----RFPRAR-FDAWA-PVGADAGRAGAAIAFG---KPLDA-AASL-ADADVILSLES ---DFL-----ALEGDSLRLAREFGARRT-------AERMNR----LYVAESAYTVTGGAA -D----HRFRMRSADVLGFGRAVAAELAAKHGLAQ-------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------LAPLG-APAGGERA---------KAAAAVAADLARA----RGRSAVLA -GDRQ--------PAAVHALAAALNGALGNAGKTVAYR----------------------- -----PTALLDPAAG---------------------------------------------- ------------------------PDRLRALAGELE--AGK--------------VDALVV -TAWNPAHT-------------------------------APADVPLRK-LLP-----KAK -DTIALALREDDTVRL--ATWKIAA-THPLE-AWGDLRAAD------------GTASI-QQ -PLIAPLH-E---S--------LSE------LELLAAFL----DEGDHGTW---------- -------------RIVREGWR-------------------------RRAGEAG-------- -------------------------------------FDGRWD------------------ --------------GWLAAGVV--------------------------------------- -------------------------------------------AGSAVPPEPAQADLARVA -EAVRAVAAPGASLELGFAADYKVLDGRFLENA-----------WLQEYPH-PITKL---- ------TW-----DNAAQLSAATAKQ-LGV-------------E-------------SGDL -VELS---WR-G--------------RT---L--T-APALVVPGHADGSVLLTLG-YGQA- ------------------------LSGPVGK-------GVGH------DAYALRT------ -------------------SD----APWFGA-----GVEVRKTGKRHPL------------ ------------------------------------------------------------- -- ->ACTB1_Gluconacetobacter_diazotrophicus_YP_001602862 ------------------------------------------------------------- -----MPSLDGLPGDEREWIGRFPHLEQALAHPLDRRRTLK-------------LMALALA -GG-GLAGCDPGT-----------PDRGFVSAVRAAPGV-------IPGVPNVYASAHVRD -GYANGILVTHQ-MGR----PTKVEG--------NPGHPSSL------------------- ----------------GATDVFAQAAIQDFYDPD-RASGPL-------------------- ---------------------HDG---MPAAWQ-EV------------TTALQVLRAAPNG -GVPQG---------ASGLR----------------------------------------- --------------------------ILTGTVTSPT---------------LGAAIDALL- -A-----AYPGAI-WHRWD-AIGRDTVRQGAELAYG---RPAMV-IPDL-RQVDVALAVDS ---DLLD----SA-PGHLRHARAFAGRRN-----PVQGPMNR----LYAVEPTPSLTGVAA -D----HRFITAPAACDEIIGRLAAAVLRNEAPSG-------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------GPDW--------------------LGAVVADLRAH----PGRALIHL -GPDH--------GAQAQAAVHAMNEALGGRGRAFDVFDAPDHR----------------- -----PARPTSTLPA---------------------------------------------- ------------------------------LMDDME--NG----------R----VRALLI -LDVNPVYQ-------------------------------VP---RFAA-ALP-----RVP -LSVALADRPHETAQA--ARWHVPL-AHGFE-EWGDARADD------------GTATI-LQ -PQAMPLY-G---G--------VSA------ATILHLCA-GDVARPAR------------- -------------DLVRQTWR--QHLP---------------------------------- -------------------------------------SERDWRAALAAGVVPGT------- --------------ASARLDTPLA------------------------------------- -------------------------------------------PVMPPAPPPAP-PV---- ------------DLTLLLRPDPHLWDGREANNP-----------WLQELPR-PLSKI---- ------VW-----GNPLLIPPDLARS-MGL-------------R-------------NGDE -VALS---VG-A--------------RR---A--V-LPIWVQPGQASGCVVGLLG-SGRR- ------------------------RAG---------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -- ->ACTB1_Opitutus_terrae_gb_ACB77208 -------------------MKRKSDHSAP---------ANSEPTGPKYWRSLDELAATPGF -QEQLHREFPEGASELN---G----------VD--RRHFLK-I-------MAASFA---LG -GV-GLAGC-RR-P----------EKYVLPY--GKSVEG------MIPGLPLYFATAMPLR -RTAIPVLAETH-QGR----PTKIEG--------NPTYQQHG------------------- ----------------GSASLLAQASVLDLYDPE-RATQ---------------------- -------------------HTREGR---KLNVA-DLNEQL----------AQIGTSHAANG -G--------------AGLA----------------------------------------- --------------------------FLAEESSSPT---------------RARLLAQLR- -A-----RLPRAI-WAEYE-PVADEAPVSAATAAFG---QPVRP-LYRF-ARARRIVSLDA ---DFL-----RPDGAGLYYAREFAKGRR-VVNREDAQQMNR----LYVAESAFTITGSMA -D----HRLRLASSHMLALAAALAVKITGSAAFAP-------------------------- ------------------------------------------------------------- --------------LSAGLD----------------------------------------- ------------------------------------------------------------- -------------IDPKW--------------------IDECAADLLAH----RGTSVFVA -GAHL--------PEQVHAIAYAINAALGNIGATVDFVAP--------------------- -----PTNDAASIQT---------------------------------------------- ------------------------------LATAIR--DGA--------------IDTLVI -LGGNPVYN-------------------------------APADLDWAA-LQK-----SVK -NVVRLGYHTDETTVASPAGAHLAA-AHYLE-SWGDARTAD------------GTIVP-IQ -PMILPLF-G---G--------LTE------LEVLARIV----GANNPDPY---------- -------------ALVLETIT--ALAG---------------------GD----------- -------------------------------------AEKAFQ-QFL----HDG------- --------------LLANSAYPTVAVS---------------------------------- -------------------------------------------YNAAGVARLLG-AG--AG -NP---AALSKDNLEVRFVTDYKMDDGRFANNG-----------WLQELPD-PITKI---- ------SW-----DNAILVSPRLARE-LGV------------YP-------------DGST -LQVARVEMA-GFHQGKEQAFIGELTVNGRTV--R-APIHIQPGLSNYTVVLPLG-YGRT- ------------------------QSGHVGR-------GMGH------DFYPLRTSAGL-- ------HFTVGGKLVPTQDVKAMPNTQEHWSMEGRDIIREANVDEFLENPRFVAAFGMESH -SPSI-------------------------------------------------------- -- ->ACTB1_Ralstonia_eutropha_YP_298623 ------------------------------------------------------------- ------------MTRARVIPLVPVDEPSDAPRSPARRHFLRTT-------MAASAALAGAA -CS-GPP-----------------AEMIVPY--VQMPEG------IVPGRPLFYATALTRH -GYGMGVLVETN-MGR----PTKIEG--------NPRHPASL------------------- ----------------GATHPFDQAAVLQLWDPD-RSQAPYR------------------- -------------------GGALSG------WA-AFDAAL--------ATQRVQWRDRDGE -G----------------LR----------------------------------------- --------------------------LLTGNVGSPT---------------LSAQIAQWL- -D-----RYPKAV-WHVHD-PLYDEDPS--PRMAFG---DDVDL-LIDP-KPATTIVTLDA ---DLVG----HG-PAAVRHAHDFMADRR----GVAPMLACR----LYAIESSPTLTGEIS -D----NRLALPPHEIERLAWSLARKLGVPDVPVD-------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------TP---EPASDTAR---------HWIAVLARRLREAP---PGSSLLIA -GGAL--------SGPTRALVWRLNARLGNLGKSVRPVAGT-------------------- -----PRRPLGE------------------------------------------------- ------------------------AHSIGALTEAMR--AGA--------------VSALLM -IDVNPAYD-------------------------------APCGLGFDA-ALR-----HVP -WSSHMGVYRDETARL--TTWHAPM-AHDLE-RWSDARAWD------------GTASI-VQ -PVIAPLN-G---G--------RSA------HELLS----AAVDEHQSGY----------- -------------DLVRAHWRARQRDD---------------------------------- -------------------------------------FDAFWE-QAL----RTG------- --------------VIADTAAPP-------------------------------------- -------------------------------------------ATTDMRQPITP------- ------PSFAAPPLVARFMPDPATDAGELANNA-----------WLQELPR-ALTRH---- ------TW-----DNAALIGPLTARA-RRL-------------S-------------TGDI -VVIRRTDRQ-G--------------NP---I--E-APVWVLPRHAEGVVSLPLG-YGRRH ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -- ->ACTB1_Salinibacter_ruber_emb_CBH25246 -------------------MIELDVIDSETAARDEESGARDGSSEPTFWRHWSESDADEDG -DDLT--EFVPGDSEPPS--G----------AS--RRQFLQ-L-------MGAAMA---MA ----GLAGC-RR-P----------EEKILPY--AREPET------VTPGIEDHYATSMPFR -GVLRPVVAQSN-EGR----PTKIKG--------NSDHPSGQ------------------- ----------------SGTSPYEQASVLNLYDPD-RSRS---------------------- -------------------VRQEGR---AASWS-DFVSFC---------RQLGNEADQHQV -A----------------------------------------------------------- --------------------------VLAEKTSSPT---------------VQAMRQRMA- -D-----RFPNLQ-WVPYA-PTGTDPRRLGMQQAFG---RPLRP-RFEL-GEAEVIVSLDA ---NFLD----GRTHDFGYHTQGFAEGRR---LDDAEDTMSR----LYTVESRYSTTGGSS -D----HRLAMRAGRIPALAAALAAELGVGEAPDV-------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------SWSERER-------------LHVREMARDLQAA----GEHGVVMA -GEAQ--------PPEVHALAMAVNQRLGGLGTTVTLFDPGDDEIQ--------------- -----PQ------------------------------------------------------ ------------------------DEALADLTASMR--AGE--------------VDTLFM -LGVNPVYD-------------------------------APSELGFEE-ALS-----NVR -DTVHLGRLRNETAQA--ARWHLPR-THYLE-QWGDGRAYD------------GTKSI-VQ -PLIRPLYDD---A--------HSL------IEVLNLAA-TGVDASGH------------- -------------DLVREQWR--AQLP---------------------------------- -----------------------------------APFQERWR-KAL----HDG------- --------------YLEGSGYETAS------------------------------------ -------------------------------------------VGTATVPSIDA-PA--SD -PD---------EIEVVFRTDSKLLAGRFSNNP-----------WMQELPD-PISKI---- ------VW-----DNVAVMSRATADE-LGV-------------EVQRREGSF-----YADR -VELT---LD-G--------------QS---V--K-LPVWVQPGYPDGSIGVSMG-YGRTI -ASTRESESTP-------------FWDTSDQTNIYNGSPIAGGVDSSGEPVDVVGGNVAPM -RPNGGRVATGANVTQVGSGYLLATTQEEGSMQGRPIVRWATLDEFKENPEFVNESQPPVP -DLGHESGGHGDGGHGDGGGHGGGDGHSGDGAAGNVSGQGLEAGPGADAHGADEMPEQAAH -G ->ACTB1_Rhodothermus_marinus_gb_ABV55245 -------------------MIELPVVNPD--------GAETPGSGKRLWRSTADLRRDPEW -VKLAHDEFMPGVAEPPS--G----------TS--RRQFLQ-I-------MGASMA---LA ----GLTAC-RR-P----------VEKILPY--VRQPEE------IIPGIPLYYATAMPFR -GSVRPLLVESH-EGR----PTKIEG--------NPDHPLSR------------------- ----------------GATGVFEQASLLNLYDPD-RSQQVL-------------------- -------------------RKGEPA-----SWG-DFVQF---------ARSL-----AAEA -G-------------TKRLA----------------------------------------- --------------------------VLCEPSSSPT---------------LAALRRELE- -R-----RYAQVR-WVTYR-PEGDDHEALGLQQAFG---RPVRA-RYRF-SEARVIVSLDA ---DFLG----PTDRNFVENTREFAASRR---MERPEDEISR----LYVIESTYTVTGGMA -D----HRLRLRAGDIPAFAAALAAELGVGELREA-------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------GARFAGHPY-----------VVEIARDLRAA----GARGVVLA -GETQ--------PPAVHALCAVINDLLGSLGRTVILHALDEP------------------ -----ATAQHAALAE---------------------------------------------- ------------------------------LVQAMQ--AGA--------------VDALLL -LNVNPVYD-------------------------------APAALGFAE-ALA-----QVP -EVIHLGLHMDETARR--STWHLPS-THYLE-AWGDGRAYD------------GTLSV-IQ -PLIAPLYEA---A--------HSP------LEVLALLA---TGEEQSAY----------- -------------DLVRNTWR--RLLA----------------------GRGA-------- -------------------------------------FEQAWQ-RVL----HDG------- --------------FLPDSGYPTVSLR---------------------------------- -------------------------------------------PNRQALADWPQ------- --------AAEGGLEVVFRLDPTVLDGSFANNA-----------WAQELPD-PITKI---- ------VW-----DNVAILSPKTAAA-LGV-------------KAEYHKGVY-----IADV -IELS---LD----------------GR---A--VELPVWVLPGHPDDSITVYLG-YGREI -TSTRPERKTPFFDLDE-------YTDMYGHGAIATGVGPRTWPRCGGPDNTWVAYGAQ-- ------VRKTG-------RTYKIVTTQDHGSMVGRPLVRLSTVEEFRKNPDFAKEAEPPLE -GLEP-------------------------------------------------------- -- ->ACTB1_Methylobacterium_sp_4_YP_001772545 ------------------------------------------------------------- ------------------------MPPLSGPRTVSRREALR-----------AFAAGITLA -AG-ACAKP---------------DEEIVPY--VVQPER------VTGGVPLVFASTLPLA -GYGRGCRVRSV-DGR----PIKVEG--------NPRHPGSL------------------- ----------------GATDVFAEAAVLSLYDPD-RSKTLR-------------------- -------------------QGGDIG-----TWS-ALQRAL--------VAKVAAWRETRGE -G----------------MR----------------------------------------- --------------------------LLTGRVTSPT---------------LQRQIARLL- -D-----AYPRAA-WHAHE-PTEDASARAGAALAFG---RPLWP-VPHL-DRAAVIVSLDA ---DPLG----PG-PDQIRNGRGFGSRRV----PAAGEGFSR----LYAVEAAPTLTGAKA -D----HRLALPPHRIGEVAVALARALGADL------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------RAPTLPEEAARLAA-------------RAAQDLRAR----RGAALVLA -GPTL--------PPEIHALAHWIN---GVLGAPLDWIEP--------------------- -----PDLIGGRAPGTLSD------------------------------------------ ------------------------------LARDLA--AGG--------------VQDLVM -LGVNPVYD-------------------------------APADLALAE-RLG-----RAP -FRLHLGPAVDETAVL--ATWHVPE-THPLE-AWGDLRAVD------------GTASL-VQ -PLIRPLY-A---T--------RTA------EEVVCALL----GEGDAASY---------- -------------DLVRETWR--PGRE---------------------------------- -----------------------------------AGFEEWWR-RAL----HEG------- --------------VVQDSAAA--------------------------------------- -------------------------------------------PVATGSPRLPD-PGPPAA -AQ---------DLTLVLRPDPGTWDGRMANNA-----------WLQECPA-PLTKQ---- ------VW-----GNALALAPDEAAR-RGL-------------A-------------QGDL -VRVA---AG-G--------------RS---I--E-VPVATVPGHAAGVASLTLG-HGRS- ------------------------RAGAIGN-------GIGA------SAYALRREDAL-- ------------------------------------------------------------- ------------------------------------------------------------- -- ->ACTB1_Nitrosococcus_oceani_YP_343269 ------------MAGSSIKPLDLAPIRAR---------LAEAQ-GRAFWKSLEELAGSEEF -ERFLYQEFPF----FRELSQ----------ASLSRRDFMR-L-------MGASLA---LA ----GLSAC-STPP----------PEEILPY--IRAPEG------LVPGESLFFATAMPLD -GFATGVLVESR-MGR----PTKVEG--------NPLHPASL------------------- ----------------GGTDIFAQASVLQLWDPD-RAQVIS-------------------- -------------------HRGEIS-----TWQ-TFLAAM--------GEKMRTFEGNQGK -G----------------LY----------------------------------------- --------------------------LLTPTVSSPT---------------LISQLRTLG- -K-----RFPHAH-WHQYQ-PINQDNSYEGARLAFG---ESLET-RYHL-ERAEVILSLDG ---DFLG----SL-PGHLRYARDFAKKRR---VDSAQSTMNR----LYVAESSPTITGTMA -D----HGVSLRASQIEVLALQLARALGI-------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------GVPRREETASDLPE---------QWVRAVAEDLRQH----RGTSLVIT -GEKQ--------PPFVHGLVHAVNQALGNVGTTLTYSAPRAFN----------------- -----PRNQNESLNH---------------------------------------------- ------------------------------LVAQMD--AGK--------------VDTLIM -LGGNPAYN-------------------------------APADLAFSK-QLA-----KVK -SSIYLGLYEDETAAH--SHWHIPE-THYLE-RWGDARAYE------------GTVSL-LQ -PLIAPLY-Q---G--------KSD------YELLAVLL----GQTDRSDY---------- -------------DWVRGYWQ--KQWP---------------------------------- ----------------------------------KSDFKSIWN-QAL----QAG------- --------------FIEGTALRS-------------------------------------- -------------------------------------------KSVKLRDDWVA-HLSRGQ -SK----SKETSGMEIIFMPDPTIWDGQFTNNG-----------WLQELPK-PLTKL---- ------TW-----DNAALISPRTAEN-LGL-------------A-------------NEEV -VALR---YQ-E--------------RQ---V--Q-APIWIMPGHPEGAVTVTLG-YGRA- ------------------------KTGQVGA-------GTGF------NAYALRSSRAP-- -------------------------WFGWGLE----------------------------- ------------------------------------------------------------- -- ->ACTB1_Chloroflexus_aggregans_YP_002464666 ---------------MTQHQSDLEAIRAQ---------LRDAR-GPQFWRSLDQLADSPAF -RELVEREFPRGASEMSD--G----------MS--RRTFLK-L-------MGASLA---LA ----GVTAC-TYQP----------RQYIAPF--DRQPEG------RIPGVPQYFASTLTLG -GYGTGVLVRAN-EGR----PTKVEG--------NPRHPASL------------------- ----------------GSTDLFAQAEILTMYDPD-RSTTVLRQ------------------ --------------------------GVPSTWA-EFTTTL--------ANALTAAQATQGA -G----------------VR----------------------------------------- --------------------------LLTTTVTSPS---------------LAAQIEQFL- -Q-----AYPQAR-WYQYE-PVNRDNVVEGARLAFG---RDVTT-RYDL-AAAQVIVSLDA ---DFLA----PG-PGFIAYARAFADGRK---VRKDSTGMNR----LYVIEASPSTTGTAA -D----HRLALRADAIAAFAGALAHELGIGGAPAT-------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------LAAKAE---------EFLKAIAKDLEEH----RGRSVVIA -GDQQ--------PPIVHALAHLINAELGNVGKTVFYHEPVEAR----------------- -----PTNQTNELVT---------------------------------------------- ------------------------------LVSEMA--AGR--------------VELLVM -IGGNPVYN-------------------------------APGDLRFAE-RMA-----TVP -LTVHLSQFVDETSVQ--ATWHIPQ-AHPLE-SWGDARAFD------------GTASI-VQ -PLIEPLY-G---G--------KTA------NELLAAML----GQPDAESY---------- -------------DLVRGYWE--ERIG---------------------------------- --------------------------------------NTNWNVALATGVIADT------- ------------------------------------------------------------- -------------------------------------------SAPVINPTLNE-AAIRAT -A----IPQPGDGVEIVFRPDPSVFDGFYANNG-----------WLQELPR-PLTKL---- ------VW-----DNAALMSPRTAIKLLGLPFSADRLVGNEADDRERQRYLEQLSKVNGTI -ARIE---YR-G--------------GV---V--E-LPIWLLPGHAEDSITLNLG-YGRT- ------------------------NAGRVGN-------GVGI------NVYP--------- ------------------------------------------------------------- ------------------------------------------------------------- -- ->ACTB1_Candidatus_Koribacter_versatilis_Ellin345_YP_592078 -MDNGSKKNGADVCPSKKGKLELADVKQQ---------LAAAKDGPQYWRSLDELSNTDEF -QEMLHREFPRQASEWVDDGG----------SS--RRDFLK-L-------MSASLA---LA ----GLTAC-TKQP----------IEPIVPY--VRQPEE------LTLGKPLFFATANTVG -GYAVPVLAESH-EGR----PTKLEG--------NPQHPATL------------------- ----------------GGTDVFTQASVLTMYDPD-RSQVVMLD------------------ --------------------------NEIRTWG-SFVGAV--------ANPLAAQKAVQGA -G----------------LR----------------------------------------- --------------------------LLTRSTTSPT---------------LGAQIKQLL- -Q-----TYPQAK-LVQYD-PAGRDNARAGSQLAFG---QYVET-QYNL-DKADIILSLDG ---DFLS----SGFPGFHKYARNFSQRRQ----PDLKEKMVR----FYMAESTPTNTGGKA -D----HRIPMRASDVEQFGRAIAAGIGVAGAGGS-------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------AKQEWQ-----------------NQVAAIVSDLNKH----KGAAVVVV -GEHQ--------PPAVHALAHSMNAALGAVGTTVTYTEPIEQI----------------- -----PADQTAGLKE---------------------------------------------- ------------------------------LVADMN--SGK--------------VDLLVV -MGANPVYE-------------------------------APADLAFLD-AFK-----KVA -VRIHHGLYVDETAVL--SHWHING-THFLE-QWGDVRAFD------------GTVTI-QQ -PLIAPLY-N---G--------KSQ------YEFVAALN----GQGSTSGY---------- -------------ELVKGTWQ--KQHT----------------------GAD--------- -------------------------------------FEAWWR-KAV----HDG------- --------------LIAGTAAPAKT------------------------------------ -------------------------------------------VSAKGAPAATN------- -------AASDSAMELIFRRDPMIYDGEYSNNG-----------WLQEAPK-PITQL---- ------TW-----DNPIEMNVTQAEQ-MGI-------------K-------------TEDE -LEIT---VD-G--------------RK---I--V-GGAWLTPGHPKNSVTVFLG-YGRT- ------------------------RAGRVGT-------GTGY------NAYQARTSDKQ-- -------------------------W----------------------------------- ------------------------------------------------------------- -- ->ACTB1_Candidatus_Solibacter_usitatus_YP_821785 -------------MSDPRNQLDLAAVQKR---------LEGAR-GRDYWRSLDDLAATPEF -QDLLEREFPRQAVGWADDED----------ANEGRRNFLK-V-------MGASLA---LA ----GMTAC-TRQP----------TEHIMPY--VRQPEE------LIPGRPLFFATAMTVN -GVANGLLAESH-MGR----PTKMEG--------NPEHPATL------------------- ----------------GACDPYSQASVLQLYDPD-RSQALT-------------------- -------------------FNGEIR-----SWG-RFTGEL--------REALALQKTKNGS -G----------------IR----------------------------------------- --------------------------ILTETVTSPT---------------MAAQLRAIQ- -Q-----VYPSSK-WHQWD-PAGPHMARAGSVQAFG---QPTNT-YYDF-THANVVVSLDS ---DFLA----SG-PGYLRYARQFSARRR---IHEPSDSMNR----LYVAEPMPTPTGTKA -D----HRLQLRAGDIEEFAWGLAISL------------------GIAEGPKN-------- ----------------------------------------------------------GEN -H----------------------------------------------------------- ------------------------------------------------------------- -------------DIYKW--------------------LGPMARDLQSN----KGASLVIA -GAHQ--------PPIVHALAAIMNEKLGNVGKTVFYTDPIEAN----------------- -----PGDQLASLMD---------------------------------------------- ------------------------------LVKDLD--AGA--------------VDVLLI -LGGNPAFN-------------------------------SPVELGMRD-RLK-----KAK -LRIRLGLYADETTEV--CQWQVPE-AHFLE-TWGDARAFD------------GTITI-QQ -PLIQPLY-N---G--------RSA------LQLLQNFT----DQPESSPY---------- -------------DVVKGYWR--TQHQ----------------------GAD--------- -------------------------------------FENWWR-RAV----HDG------- --------------FVANSALPTKT------------------------------------ -------------------------------------------PTVRGEALSAR-AGARHL -GG---------KLEVIFRPDPTIFDGRFANNG-----------WLQEMPK-PVTKL---- ------TW-----DNAAILSPYDANR-FGV-------------Q-------------NGDM -LKLT---YD----------------GR---S--LNAPVFIQPGHVNGATTLHLG-YGRW- ------------------------AGGRAAK-------GMGF------DPYGLRTSKAL-- -------------------------WQDVGMDA---------------------------- ------------------------------------------------------------- -- ->RBG1_1305 ----------------------MNNKENP---------------HKKYWSTLSEFHQDAEF -KKLKKEEFLSKPQSFFESNG-------NNDTTFSRRDILK-L-------AGAAAV---FT ----AAACA--RRP----------VEKIVPY--LDPSEE------VIPGKAVWYSST-SGT -SDGCGMLVKTR-EGR----PIKLEG--------NPDHPLNK------------------- ----------------GTLSAREQAAILDLYDPD-RLKHPA-------------------- -------------------KISAGQ-VLKSDWK-SADTEI--------ARSLKSA------ ---------------KGKMV----------------------------------------- --------------------------LLTGTIHGPA---------------RKRLIREFLF -------SFSNAE-HITFD-ALSEEEILEAQELCYG---NRVLP-RYRF-DKAEALVFLGA ---DPLA----SG-HSKTEFAYGFGHQRK-----INSNQMSK----VISFEPALSLTGQNA -D----LHYLVKPQDLIKVGLALAHQLIVAEKKSK-------------------------- ------------------------------------------------------------- --------------LASDLLVQNLLEN---------------------------------- ------------------------------------------------------------- -------------YSAKKVETEIGLPE---------GTIKSVAADLWLA----RGRGLVYT -GSLT---VRDNSALALHLVTNLLNSALENEGNTVDGVQSVSQQ----------------- -----SQGSYSELMN---------------------------------------------- ------------------------------LISDMK--SGK--------------VEAVLI -YGNNPAYG-------------------------------LPQSAGFEE-ALQ-----KVK -TKIYLGDRADETGSL--CDFVLPS-LHFLE-SWGDAEPQQ------------SLYSL-MQ -PTISPLH-D---N--------RGW------EDSLLALM-REIKGVALGKE---------- ----------------YASWH--DFLK-------------------DTWYKEIYLKNDLVA -S-----------------------------------FEDFWI-SVL----RQG------- --------------LFDTVNR---------------------------------------- -------------------------------------------SAEKSSPRQFRTTALSNI -GK---IKNVDSKFTLALYTPAMQFDGRTNNNS-----------WLLETPD-PVSKI---- ------AW-----DNYVNIAPRTSVE-LGL-------------Q-------------ESDV -VSLT---VN----------------GV---T--QEIPVHIQPGIHPEVFTVAVG-WGRE- ------------------------KVGRVGNNVGVNAFRWSKIQNRHLVSSSLPVEIKKTG -KQIKLANVQG-------HNY----INGRPVIYEATLAEYQKNPTAGRAGEEKLTSIWPSH -PYE--------------------------------------------------------- -- ->ACTB1_Leptospira_interrogans_serovar_NP_713447 --------------------MDQKNFQKE---------------KKAHWLSYDLKDKDEEV -KEMQKSEFFTSPDPLIARIK---------SGEFDRKSFLK-L-------MGAGVA---MT ----SLNCI--RKP----------VEKIVPYVDLNKTDENSQYDFVKHGHSYYYTSVVAG- ----TGVLIKAR-DGR----PLKLEG--------NPDHPVSQ------------------- ----------------GALSAAGQASIFDLYDPD-RAQNPA-------------------- --------------------TIEGGIEVKSDWA-TVDAKV--------KSALAAN------ ---------------KGKTV----------------------------------------- --------------------------VVTKLLDSPS---------------TQSIIGDFL- -R-----TVGGGK-HYEISLTSAEEVVSKGQAASYG---KAIVP-NYHF-DLANVILSIDC ---DFMG----NW-LSGEEHQKDFSKRRNLRPNGSLKQNNLADVNLFIAAESVPTMTGSNA -D----LRLAIRPGDQTKLALAIAAALGELGANTK----------DALNG----------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------ATLSALVSELGVSE---------ENIRKTAKALWSN----KGRSLVVA -GSLA---ATTKDAVDLQILVNLLNSVLENDGKTVDHSNP--------------------- -----KKEGLADSSGNLKS------------------------------------------ ------------------------------LAAELK--QGK--------------VGVLFV -NDVNLVYQ---------------------------------AGEEWKN-LLH-----QAA -LVVSLSDRADETALS--SNVLATT-THFLE-SWGDAEVTK------------GIFSI-QQ -PAIRPLF-N---S--------RSF------EDSLIAFAGGSLGGEASFY----------- -------------EYVKNSWI--KKLG---------------------------------- -------------------------------------SKRNWE-DLL----RTG------- --------------TTVTASERKKVAG---------------------------------- -------------------------------------------PSRNFNRSSIK-KIESSS -TG----------LKLSLFETIAIGDGKAANNA-----------HLQELPD-PVTKL---- ------TW-----DNCILLSPALAKE-KGI-------------S-------------SNDV -LVLK---TA-K--------------QT---I--E-LPAQIQPGMHKDAIAIAVG-YGRT- ------------------------AAGAVGT-------GVGK------NAY---------- ------------------------------------------------------------- ------------------------------------------------------------- -- ->ACTB1_Bdellovibrio_bacteriovorus_NP_96849 ------------------MKKALRPKVER---------------DTKYWNSLEQWSNDPEF -NKIASTEF-QSS-PLRESDD---------EGGWARREFLK-L-------MGASLA---MA ----SAGCI--RRP----------VQKIVPY--NKQPEE------VTLGMANYYTSAYFDG -SDALGVLVKTR-EGR----PIKIEA--------NPGHPFSI------------------- ----------------SGLSIRSQASLLSMYDPE-RLKGPQRNLFNE-------------- -------------------KKSNSQ-VIDVKWE-DLDKKV--------AEQLK-------- ---------------KGDVV----------------------------------------- --------------------------ILSGNVASPA---------------TRAVIGDF-- -------AQGFKAKHVVWE-ALSNDDVREGQKASYG---DDVVP-AFRF-DKAKMIVSIDA ---DFLG----TW-ISPTAFTNQFVEGRK------DIKNMNR----LVSFDSNYSLTGANA -D----IRMKIKPSQQLDVVMGLLHEIIVKKGASS-------------------------- ------------------------------------------------------------- ---------------HAGNSAVKAAL----------------------------------- ------------------------------------------------------------- -------------APFADVAKKLNVEP---------ALFAKVAADLWAN----QGTSLVVA -GGIT---TLTEKSKELQVAVNFLNSILGNDGKTVDHNGGNKG------------------ -----DKASQADMAA---------------------------------------------- ------------------------------LIKDMK--DGK--------------VKTLII -HRVNPGFV-------------------------------LGADMGFAE-AIK-----KVD -LVVYTGDRIDETGVF--ADYITPD-NHALE-SWSDMELAS------------GVYSI-CQ -PSIRPMY-D---T--------RSFQLSLMTWAYLANMGPSRLRDYETFY----------- -------------DYLRVFWK--SDIF-------------------PKYGKGQS------- -------------------------------------FEDFWQTALQKGYVGEI------- --------------NSGSSSRSFKVD----------------------------------- -------------------------------------------AFTSIKPAAAK------- -----------EGFELALYSTSQHGDGSLANVS-----------WLHELPD-PVTKA---- ------VW-----DNYVMVSLATAEK-HGL-------------K-------------QATV -VELT---VG-G--------------KT---L--E-LPVLIQPGLHDDVLAVAVG-FGRT- ------------------------RAGKVGN------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- -- ->ACTB1_Cytophaga_hutchinsonii_YP_678817 -------------------------MKDN---------------NKVFWKGVEELGNSPEF -VKNAQNEFPEFL-PLKNSSE--------ESNGTDRRDFLK-L-------LGFSVA---AV ----SLAAC--EAP----------VKKAIPY--LNKPEE------IEPGIANYYASTFVDG -GEYCSVLVKTR-EGR----PIKIEG--------NKLSSVTK------------------- ----------------GGTNGRVQASVLSLYDTA-RIQGPLIKGA---------------- ----------------------------AATWA-DLDKQV--------GVQLGAI--AATG -G---------------NIR----------------------------------------- --------------------------IVSPTILSPT---------------TKKAIAAFK- -A-----KYPSTE-HVQYD-ANSSYGILKANQTSFG---QAVIP-SYDF-SKAEVIVGFGA ---DFLG----TW-ISPIEFVSQYADTRR---LSKTKKTMSQ----HFQFETALSLTGSNA -D----YRQPIKPSQEGLFIAELYNKIVSSK------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------VSTTPVKN---------DVLDKAAAALLKASN--RGKSLVVS -GSND---------VNVQILVNEINLALGNYGTTISLAT---------------------- -----PSFQKQGND----------------------------------------------- ------------------------EAMNTFINDAVA--GK---------------VNAVIF -YGSNPVFD-------------------------------HARGAELAK-ALS-----SVS -LTVSFADRVDETAAL--TKFVAPD-HHYLE-AWGDAEPRA------------GFYSL-GQ -PSISPIF-K---T--------RAA------QESLLLWS----GNSGDYY----------- -------------EFLKSNWI--SSIL---------------------------------- -------------------------------------GGASWD-QAL----QDG------- --------------VFEPKNK---------------------------------------- -------------------------------------------SGVEVTASSFD-RSAVEA -GIIKNYPANTSGIELKLYEKIGLGTGSQANNP-----------WLQELPD-PISKA---- ------TW-----DNYVAVSASYAKA-NAL-------------E-------------QGDR -VAVK---SA-N--------------YS---V--E-LPVLIQPGQAGNTVSIAIG-YGRT- ------------------------HVGKCGD-------GVGK---NVYPFARFVDGSVL-- ------DFVTG--------------------------VSVTKLGGDKYPIAQTQTHH---- ------------------------------------------------------------- -- ->ACTB1_Flavobacterium_psychrophilum_YP_001295304 --------------------------MSS---------------NKKYWKSVEELNENSSI -VETLRNN--EFV-EEISTNEFLGDAVTLATSSTTRRDFLK-Y-------VGFTTA---AA ----SLAAC--EGP----------VHKSIPY--VVQPEE------IVPGVADYYATTIADG -FDFANVLVKTR-EGR----PIKIEN--------NKIAGANF------------------- -----------------HANARVHASVLSLYDSM-RMKTSKIA------------------ --------------------------GKDTIWE-QANAKI--------KASIADA--KAKG -G---------------KVV----------------------------------------- --------------------------LLTNTSASPS---------------TDKLIAQFL- -------VSNPNAKHVTYD-AVSSSEALDAFQTVYG---ERALA-EYDF-SKANVIVSIGA ---DFLG----DWQGGGFDAGYAQGRIPQ-------NGKMSR----HFQFESNMTLSGAAA -D----KRVPMTVANQKQALVQIYNVITG----------------SSIGSSKD-------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------EAVMKAAQQLKAA----GSKGVLVC -GIDD---------KNAQLLVLAINKVLSSEAFNTANTRQI-------------------- -----RKGNNADVKQ---------------------------------------------- ------------------------------LLADMK--SGA--------------VHTLIM -NGVNPVYS-------------------------------LPNGKEFAN-SLK-----KVK -LSVAFAMKEDETAAV--ANIAVAT-PHYLE-SWGDVSIVK------------GSYAL-TQ -PTIRPLF-D---T--------VQF------QDALLSWT----GNAQTYY----------- -------------DYLRSSWS---------------------------------------- -------------------------------------GAKSWN-QLV----HDG------- --------------VVFTEGISSSAGAG--------------------------------- -------------------------------------------ADYNGAASTLA-KA--SS -KG----------LELVLYTKTGLGDGQQANNP-----------WLQEFPD-PITRA---- ------SW-----DNYLTISQADATT-SGI----ENWNVANGGL-------------NGSY -VTLT---VD-G--------------VK---L--EKVPVIIQPGQAKGTVGLALG-YGRK- ------------------------AAMKEEM-------QVGVNAYTLYNNFSNVQNVSI-- ------AKEDG-------EHE----FA---------CVQLQRTLMGRGDIIK--------- ------------------------------------------------------------- -- ->PsrA_PhsA_Archaeoglobus_fulgidus_NP_071207 ------------------------------------------------------------- --------------------------------MVTRRDFLKAT-------ALTATAISAGI -KF-QPKSY---------------AEATAAS-----------------GEVKFVPNICAMC -PAACSIQVEVR-DGK----VHRIHG--------TPDHPINN------------------- ----------------GKICARGNAGVQRVYNPD-RLKKPLIRTG---------------- -------------------EKGTWS-FREASWE-EALSLI--------ASKVKEY--REMG -H-------------PEYIG----------------------------------------- --------------------------MLGGWLPCTY---------------YKPFFKAFL- -A-----ALGTPNGGGVPE-ALCFLSKALGWKSAYG--FGAHPELLTDY-ENARYVIMLRR -----------NV-AGSISVVHGWRLGQN--------RRKFK----LVVLDPRYSETAAKA -D----VWLPIKPGTDLAFLLAMMNVIINEKLYDS----------NFLAKYSN-------- ---------------------------APMLLKDGKPFKVWDENGKKKYLVFDLAKGAAVE -HDSAMLPALEGEYEVEGEKVIPAFEALKRRVAE--------------------------- ------------------------------------------------------------- -------------YTPEWAEGITDIEA---------KKIREIAREFALR------RGVIDS -GWHG---PKYRNSLLTWRAAAIVNALVGSVNNDGGLLFTGLAQFVT-------------- -----SKESTTEAPSQSVLRMWAEKR----------------------------------- ------------------------GIATAFLGHTVQ--AFYDAIVNEDPYP----IKMLFV -VGHNLLMN-------------------------------MPERQKWEE-ALK-----KLD -FMVAVDILPQDHLYY--ADVVLPE-STYIE-KDDPLFPIAYAPA--------FGFHT-RV -KAIEPIY-D---T--------KHV------IEMMVEIA-SRLGTEDTFFK---------- -------------ALSKGLGV--DAEK----------------------LKSYYHGEGVAG -IRRAQAEAKGVN------------------------YNELLSKGYVLKAGRDK------- --------------IVYNMPYK-----------------------------QPLPTPTGKV -EIFSFMLANF--------------------------------ASKASEPYWDA-LIKWVP -PKVSERKLGSNEFYLAYSRSPFTTHSSTSDNP-----------LLAKLID-DAELYYKG- ------IW----------INSERAAE-LGI-------------R-------------NGDR -VVVE---SVFT--------------GD---K--TEAIAFVNELVRKDTIFTVSG-FGQS- ------------------------------SERLTNIPQRGM------TMMRLIP-LQF-- ------DTLSG------------------TIMSQETIVRITKA------------------ ------------------------------------------------------------- -- ->PhsA_Wolinella_succinogenes_NP_906934 ------------------------------------------------------------- -----------------------------MEIEISRRRFLQGS-------VALTIVGASSG -AL-AVGGS---------------SGNKTES--------------QEKGERSVA-TLCEMC -VNKCAAIARVK-DGK----VIKLDP--------NPLFPKSR------------------- ----------------NMLCARGNAGIKALYDED-RLKYPLIRAG---------------- -------------------ERGDGK-FKRVTWD-EAYTYI--------QEKLVKIMDEEQD -N-------------RSAIG----------------------------------------- --------------------------FCAGEGMGEH------------------HFKEFN- -K-----VFGSSN-WLNHS-SVCLQSTVSGYTLTIG---TYGNP---DL-ANAKYVIMAGA ---NRAE-------AIVTPDTMDLFKRTL--------GRGCQ----LVVIDPRYSHTAHKA -D----LWLPIKAGTDLAFVLALTHVVLSEEIYNK----------KFVEEKFN-------- ----------------------------------------------------------GFE -E------------YKAHILQQN-------------------------------------- ------------------------------------------------------------- -------------YTPEWAEPITGISA---------SDIRKVARDFMAC----APQAIYYP -GRRT---TWAKNDFQLRRAMAIFTALGGGVDVKGGICYGKTL------------------ -----PIDEHSIPAPMYANAKSRIEQNK--------------------------------- ------------------------AAIVGGTGSWVA--WRDMVAAKETPYP----IRGMFI -YKQNPMHC-------------------------------VPNTAKTAQ-MFK-----NMD -LVVTIDTMPSDTAIM--SDVILPE-CTYLE-RTDPVKSFGGIE---------PAIAQ-RN -KVIEPLY-E---T--------KPV------LQILRELT-AKLSRPLFENSLKHDEDLQ-- -------------EMIEEKAS--ELAS-------------------SNPNKGEEELKKLAI -EEVFEDEMEGWDISQGYAHSEEEMNEH---------AVAKYAGAHEMLLKHGV------- --------------FYPGINEQFKQVSANEYVYYPES-------------KKAYSMRNGQF -NTPSKKVECVIPSLAS--------------------------KGIDTMPTWRE------- ---EYLPKTPAGQFRFVTGRHAQFTQSSTANNA-----------LLLDTMSENF------- ------IW----------INKRVAKE-RGI-------------K-------------FGDL -LEIS---SK-A--------------GK---T--R-IKAYPTEKIAPDTVFFVHG-FG--- ------------------------VQSKAMSRAYQNGGHDSM-----------IIEEHI-- ------EPVFG------------------AAAAHETLVEIRKV------------------ ------------------------------------------------------------- -- ->PsrA_Wolinella_succinogenes_NP_906381 ------------------------------------------------------------- ---------------------------------MTRRDFLKS--------AGAAGAAGLVW -SQ-TIPGT---------------LGALEKQ--------------EIKGSAKFVPSICEMC -TSSCTIEARVE-GDK----GVFIRG--------NPKDKSRG------------------- ----------------GKVCARGGSGFNQLYDPQ-RLVKPIMRVG---------------- -------------------ERGEGK-WKEVSWD-EAYTFI--------AKKLDEI--KQKH -G-------------AHTVA----------------------------------------- ---------------------------FTARSGW-----------------NKTWFHHLA- -Q-----AYGSPN-IFGHE-STCPLAYNMAGRDVFG-----GSM-NRDF-AKAKYIINMGH ---NVFE-------GIVISYVRQYMEAIE---------NGAK----VVTLEPRLSVMAQKA -S----EWHAIKPGHDLPFVLGFMHTLIFENLYDK----------KFVQKYCT-------- ----------------------------------------------------------GFE -E------------LKASIEP---------------------------------------- ------------------------------------------------------------- -------------CTPEKMALECDIPA---------DTIKRLAREFAKA----APKAIFDF -GHRV---TFTPQELELRRAMMMVNALVGNIERDGGMYFGKNASFYNQFLGEEDPKA---- -----KGLKKPKTPAYPKVEVPRIDRIGEKDGEFFL------------------------- ------------------------ANKGEGIVSLVP--KATLNELPGVPCK----IHGWFI -VRNNPVMT-------------------------------QTNADTVIK-ALK-----SMD -LVVCVDIQVSDTAWF--ADVVLPD-TTYLE-RDEEFTAGGGKN---------PSFGIGRQ -KVVEPLG-D---A--------KPG------WKIAKELS-EKMGLGEYFP----------- -------------------WK--DIED-------------------YRLQQVDGDLDLLAK -LKKDGSASFGVPLML---------------------QEKKSVAEFVKKFPGAA------- --------------SKVNEEGLIDFPK---------------------------------- -------------------------------------------KIQLFSPKLEEVSGKGGL -GYEPFKYKEEDELYFVQGKTPVRSNSHTGNVP-----------WLNNLME-YDA------ --------------IW--IHPKTASK-LGI-------------K-------------NGDA -IELY---NK-F--------------SS---Q--K-SKALITEGVREDTLFGYFG-FGHV- ------------------------SKDLKRAY------GKGV------NSNALMP-SFT-- ------SPNSG-------MD-----LH--VF-----GVKVKKA------------------ ------------------------------------------------------------- -- ->PsrA_PhsA_Thermosinus_carboxydivorans_ZP_01667237 ------------------------------------------------------------- ------------------------------MKKFSRRTFLKL--------SGAATAA-LAA -AP-TLPRM---------------ASLAANI--------------QLEGSAEFKASYCEMC -TSRCPIQAKVV-DGK----TVLING--------NPEWAATG------------------- ----------------GTVCARGGSGFSQLYDPQ-RLKKPLIRTG---------------- -------------------ERGEGK-WKEVSYE-EAYAYI--------AEKMQDI--KARY -G-------------PEAMA----------------------------------------- ----------------------------FACRKGPH---------------MGYLYTLAK- -------AYGSPN-TFNHE-STCPMAKTVALEATFG---TAAL--GIDY-ANVKYLVTFGR ---NFFE-------GIHVAQTRGVMTAVS---------KGAK----LVSFDPRFSLTSAKA -H----EWFAIRPGTDLAVVLAINHVLIRDGLYDR----------DFIDKYTE-------- ----------------------------------------------------------GFE -A------------VKASLTA---------------------------------------- ------------------------------------------------------------- -------------CTPAWAEQESGVRA---------ADIERIARELAAA----RPRAVVEF -GWRT---TSTPEEFELRRAIIITNLLLGNLEVPGGTFFVKSANFINSLVGKPVI------ -----QPIAGPKLPPFPQPGRPRIDGAGSKGQPYSL------------------------- ------------------------VPPIDGVVQTIP--EAALT---GKPYP----IRGWFI -YRYNPVLT-------------------------------IPDTNRVIE-GLK-----KMD -LVVVCDINMSDTAWY--ADVVLPE-STYLE-RDEGFNDYSGAV---------PVYTL-RQ -KVVEPLY-D---T--------RPH------WQIFKELA-EKLGLGAYFP----------- -------------------WK--DVEE-------------------LRLIQMGGKADLVRM -GKEKGFVNFGLKPLFL--------------------RDRASVAEFVAKFPEAK------- --------------ELVNTQGIIDKP------------------------LLNLKTKSKKI -ELLSTEAEE---------------------------------LFGRGVPVYRP-VKLAEA -GE----------AYFVQGKVAVHTNGHTHNVP-----------WLYNLMS---ENR---- ------LW----------LNPATAAK-LGL-------------K-------------DGDK -AILK---TR-T--------------GQ---Q--Q-VKVLVTEGVRPDTVFGYFG-FGRL- ------------------------SPGLGRAY------KKGI------NSNLALP------ ------------------LVT----ADVCGSTIQTTGVTISKV------------------ ------------------------------------------------------------- -- ->PsrA_PhsA_Moorella_thermoacetica_ATCC_YP_429324 ------------------------------------------------------------- ----------------------------MLEQKITRRTFLK---------GSLAAGALATF -GG-KLIPI---------------EPAKAAA--------------AGQAETRVVPTLCEMC -GVKCGVLAHVR-DGR----VWRLTG--------NPRDPQSG------------------- ----------------GRLCARGNAGTKTLYDPD-RLKGPMKRV----------------- ---------------------GEGQ-FQPISWE-QAFQEI--------GSKLKEL--KEQY -G-------------PQSL------------------------------------------ --------------------------VWLAHPEL-----------------ISPLEKHFM- -A-----AFGSPN-YTGHG-PTCYSSRNVAFEQMYG-----GVP-GVDY-RNVRYYIAFGR ---NLTG-------GIKNPDVQKIVAAKA---------EGAH----LVAVDPRLSDFAYFA -D----EWLPIRPGTDLAMVLAMINVLINENLYDA----------AFVAAYTT-------- ----------------------------------------------------------GFE -E------------LKKGVSG---------------------------------------- ------------------------------------------------------------- -------------YTPAWAAGITGIEA---------GTISRIARELAAA----KPAAAVDP -GWHAVTGSQYGNSVQAGRAIAALNALLGNLGARGGLSLPPTIKLGS-------------- -----PAGIMGPKPPAATAPRWDGAGSE--------------------------------- ------------------------KWPLNKDHGMIQ--TFPERVKQDQPYP----VKAVII -QHLNPVRS-------------------------------STDSLAFIE-ALK-----KLD -LVVAIDIQMNDTAYY--AHYILPE-ATYLE-RYDPLMTVG------------NKVLL-RQ -PAIKPLF-D---N--------KGA------EEIIAGIG-RAAGLSEYFNF---------- -----------------------TLEQ---------------------------------- -------------------------------------YNDALLGPLGLTQAQLA------- --------------LTGVAEVEASKPD-----------------------YSKLKTPSGKI -ELACPAFVK---------------------------------AGSTLTPAWEP-PLVEPR -DD---------SFRLIQGHVPMHTHTTTDNNS-----------YLHAIMP---ENE---- ------LW----------IHTSRAGK-LGI-------------K-------------TGDL -VEVA---SK-V--------------GK---V--R-VKARVTEAIHPEAVFLAHG-FGCR- ------------------------VPLRHLAY------NRGA------NGGDLIP-IMT-- ------APVSG------------------AAAQCETLVTVRKAG----------------- ------------------------------------------------------------- -- ->PsrA_Carboxydothermus_hydrogenoformans_YP_361367 ------------------------------------------------------------- -------------------------------MKLTRRSFLK---------ASAATGALAAL -SG-GVMSF-----------------ERWAA------------KAAETGEVKLIPSICEMC -GTKCGIIVKVK-NGR----VVKIEG--------NKEHPNGK------------------- ----------------GKICARGNAGMKLLYDPD-RLKQPLKK------------------ ----------------------EGDRFVPISWE-QAFREI--------GEKLKEI--KAKY -G-------------PEAL------------------------------------------ --------------------------VWSTHPE------------------LAYDYEVIFN -Q-----AFGSPN-LSAHA-PTCYSPRNVAYKTMYG-----EVP-TVDY-GNVKYYISCGR ---NLVE-------GINVSQVTGIMKAKE---------KGAK----LIALDPRYSNFAALA -S----EWVPIRPGTDLAFLLAMIHLIIKNEWYDK----------EFVKNYTI-------- ----------------------------------------------------------GFE -E------------VAAEVEK---------------------------------------- ------------------------------------------------------------- -------------YTPKWAEEITGIPA---------ATIERITEEFAKA----KPAAVVDP -GWHT---SRYMNSTEMVRAGAVINALMGNLGMKGGLKFPKYKFTKVEEREGLW------- -----PKLEKPKAKRFDGAG-------------------------GEKWP----------- ------------------------LAKGLGMIQMLP--EHILS---GQPYP----IKAYIV -NHHNPVRS-------------------------------AGNSQKWIE-ALK-----KLE -LLVVIDVQMSETAMM--AHYVLPE-STYLE-RFDPPQIAG------------NAVAL-RQ -PAVKPLH-N---T--------MGV------DDIIKELA-HEAGIGQYFNF---------- -----------------------TLEQ-------------------FSDQMLKP------- -------------------------------------FNVTFK-QLV----EKG------- --------------VIALDDGKTEYK------------------------VPEIKTESGKI -ELASSAFEK---------------------------------AGAKKVPTWVP-PGVTEG -NG---------KLRFLHGHTAVHTHTSTFNNE-----------YLHALMP---ENV---- ------LW----------INTRTAEK-LGI-------------K-------------NGDL -VEVK---SD-Y--------------GK---V--T-IKAKVTEAIHPDAVFMVHG-FGGF- ------------------------SPYQKKAY------KKGA------STSFIIP-CHV-- ------EPVSG------------------ASADCEVLVEVRKVGGGANA------------ ------------------------------------------------------------- -- ->PsrA_PhsA_Thermus_thermophilus_YP_004130 ------------------------------------------------------------- ---------------------------------MQRREFLK-L-------SALGVGAMALR -GS-GPAKA---------------LKAPWYA-----------------QEVKSVYQICEGC -FWRCGIVAHAV-GNR----VYKVEG--------YEANPKSR------------------- ----------------GRLCPRGQGAPQTTYDPD-RLKRPLIRVEGS-------------- -------------------QRGEGK-YRVATWE-EALDHI--------AKKMLEI--REKY -G-------------PEAIA----------------------------------------- ---------------------------FFGHGTGDY------------------WFVDFLP -A-----AWGSPN-AAKPSVSLCTAPREVASQWVFG-RPIGGHE-PIDW-ENARYIVLIGH ---HIGE-------DTHNTQLQDFALALK---------NGAK----VVVVDPRFSTAAAKA -H----RWLPIKPGTDTALLLAWIHVLIYEDLYDK----------EYVAKYTV-------- ----------------------------------------------------------GFE -E------------LKAHVKD---------------------------------------- ------------------------------------------------------------- -------------FTPEWAEKHTEIPA---------QVIREVAREMAAH----KPRAVLPP -TRHN---VWYGDDTYRVMALLYVNVLLGNYGRPGGFYIAQSPYL---------------- -----EKYPLPPLPLEPAAGGCSGPSGGDHEPEGFKPRAD--------------------- ------------------------KGKFFARSTAIQ--ELIEPMITGEPYP----IKGLFA -YGINLFHS-------------------------------IPNVPRTKE-ALK-----NLD -LYVAIDVLPQEHVMW--ADVILPE-ATYLE-RYDDFVLVAHKT---------PFIQL-RT -PAHEPLF-D---T--------KPG------WWIARELG-LRLGLEQYFP----------- -------------------WK--TIEE-------------------YLETRLQSLGLDLET -MKGMGTLVQRGKP-----------------------WLEDWE--------KEG------- --------------------------------------------------RLPFGTASGKI -ELYCQRFKE---------------------------------AGHQPLPVFTP-PEEPPE -GF----------YRLLYGRSPVHTFARTQNNW-----------VLMEMDP---ENE---- ------VW----------IHKEEAKR-LGL-------------K-------------EGDY -VMLV---NQ-D--------------GV---KEGP-VRVKPTARIRKDCVYIVHG-FGHK- ------------------------APLMRLAH------GRGA------SDNYLQTRYKL-- ------DPISG------------------GAGLRVNFVRLEKAERPRLPSLTGLAKRPFDE -RRM--------------------------------------------------------- -- ->PsrA_PhsA_Geobacter_lovleyi_ZP_01593406 ------------------------------------------------------------- ------------------------------MPIMSRRSFLK-T-------SGICTAGAIAA ----TYLPD---------------QFLLWAG-------------EKGLAKTEKITTYCEMC -FWKCGAIATVV-GGR----VVKLEG--------NPLSATAK------------------- ----------------GKLCGRGNGGIGLLYDPD-RLKHPLIRTG---------------- -------------------KRGEGQ-FRKASWD-EALTHI--------ADKLKKI--KEEH -G-------------PESLA----------------------------------------- --------------------------LFTHGSPTEH---------------FMPLLQ---- -------GFGSNN-FAMPSFAQCRGPRVVGYELTYG--DDIGSPERLDM-ANSKVVVLIGS ---HLGE-------NMHNSQVQEFTDAIG---------NGAK----IIVVDPRFSVAAGKA -H----HWLPIKPASDMALILAWINIIIREGWYDR----------EYVAKYTH-------- ----------------------------------------------------------GFD -K------------LAAAVQQ---------------------------------------- ------------------------------------------------------------- -------------YTPEWAEKETDIPA---------AQIMATAREMGLH----RPAVCIHP -GRHV---TWDGKDVQRSRAIAILGAILGTWGREGGAYLATRGSF---------------- -----PAVPPPSFPASNRPTLKKG------------------------------------- ------------------------GFPLGGAEGVTN--AIREATSIGEPYP----VKAWMV -TGTNLLAA-------------------------------MPGQKETIE-AIS-----KLD -LLVVVDVIPSDTSLY--ADVVLPE-CTYLE-RHDGLIIGKGRA---------LSASI-RQ -PAVAPMY-D---S--------KPA------WWIAKELS-KKLGLEDYFP----------- -------------------WE--NFED-------------------RLNELCLT------- -------------------------------------YNIDYD-ELK----QKG------- --------------VISFPDTAKPFITADN--------------------QPVFKTKSGKI -ELYSKELEE---------------------------------LGFEPIPAYEK-NEEPPQ -GF----------YRLLYGRSAVHTFSRTVNNP-----------ALNELYK---ENE---- ------LW----------LSSVQARK-MGL-------------T-------------DGQY -VALQ---NQ-E--------------GI---TSNR-VRLKVTERIREDCVYMVHG-FGQQ- ------------------------SKGLTKAF------RRGA------DDQQLISSYPV-- ------DPICG------------------GTGMRCTFVKLVKGA----------------- ------------------------------------------------------------- -- ->PsrA_PhsA_Acidiphilium_cryptum_YP_001233491 ------------------------------------------------------------- ---------------------------------MQRRDFIR---------MSSAVASAALL -GP-TLAGC--------------SRPAEWQR-------------MMTEAPATETPTVCNIC -FWACAAKVHTR-GER----LWKITG--------NPEDAHCE------------------- ----------------GRLCTRGTGGVGAYYDPN-RLVRPLVRMG---------------- -------------------KGADQR-FEVASWD-NALGLV--------AERMEKI--AREH -G-------------PDRLA----------------------------------------- --------------------------ALVHGPGAAH---------------FSHLVR---- -------AFGSDS-IAEPAFAQCRGPRDTGFFLTFG--QGFGSPEQTDM-AKARCIVLIGT ---HIGE-------NLHNSQVRTFTDGIR---------NDAT----IIVVDPRFSVAAGKA -N----HWLPIRPGTDIALLLAWMNVILAERRYDA----------GYVARNTV-------- ----------------------------------------------------------GLE -A------------LCAHVAP---------------------------------------- ------------------------------------------------------------- -------------FTPEWAYGETGIEP---------ALIRETARLMAAA----APATVVHP -GRHS---TWWGDDTQRARAMAILAGLLGIWGREGGYYLPESVAL---------------- -----PAYPVPAYPVPKTSWREIA------------------------------------- ------------------------LPVFPLAGAPVT--NVILDNAHGADAH----YKGLIV -YDTNLPMT-------------------------------MPGIRRTLEAAAQ-----SLE -LIVAVDVQPAEVTGY--ADVVLPE-CSYLE-RHDPLRNSGERY---------PALAL-RA -PALPPRG-E---S--------KPG------WWIAREIG-TRLGLGRYFP----------- -------------------WT--DYTE---------------------------------- --------------------------------------VIDWQLRQVGSSLKEL------- -----------------ETTGIRAFPRRTPAYFAPGE-------------TPRFATPSGKI -ELFSATLQQ---------------------------------AGFDPLPRYTR-PEAPPA -DH----------FHLNYGRAPQHSFSRTQNNP-----------VLYQLMP---ENL---- ------VW----------IHPTAARR-FGI-------------R-------------NGTY -VRLV---NQ-D--------------GV---VSNK-VRVRVTERTRPDSVWLVHG-FGHT- ------------------------APGLSLAR------GRGA------DDSALMTRVLY-- ------DPIMG------------------GTGMRGNFVTFRKENA---------------- ------------------------------------------------------------- -- ->B_Caldithrix_abyssi_ZP_09550397 ------------------------------------------------------------- -----------------------------MKTKMKRREFIK---------IAGAGAGSLVV -GS-KLYAS---------------FNSKDEQ------------NLLADGKIERTPTYCEMC -FWKCAGWVYKK-DGK----PWKIIG--------NPDDPNSR------------------- ----------------GRFCPRGTGGIGAYTDPD-RLKKPLLRVE---------------- -------------------KNGKQV-FKEVSWD-EALDFI--------AGRMKDI--AQKH -G-------------PECIA----------------------------------------- --------------------------LFSHGSGGSY---------------FKTLLH---- -------AFGSNN-VAAPSYAQCRGPREEAYMLTFG--EAVGSPERTDI-INAKCLVLLGS ---HIGE-------NMHNGQVQEFSEAVA---------HGAT----VITVDPRFSTAASKS -K----YWLPIKPGTDLALLLAWIHVIIYEELYDK----------EYVKKYTF-------- ----------------------------------------------------------GFE -Q------------LKEALKD---------------------------------------- ------------------------------------------------------------- -------------KTPEWAYPITTIKP---------HVIRQTAREMAKN----APATIVHP -GRHV---TWYGDDTQRVRAGAILNALLGSWGRRGGFYFPSKAHL---------------- -----PKMPIPKFPNVKRDWRKAF------------------------------------- ------------------------PNKYPVAHLALS--SGICDATIPSPERECS-FKGWIV -YGTNLPMT-------------------------------LPQPEKTLE-AIQ-----HLE -LLVAIDILPAEITGW--ADVVLPE-CTYLE-RYDNLRLSPGRV---------PSIAL-RA -PAFEPKY-E---S--------KPA------YWMARELA-KRLGLEDYFP----------- -------------AKTIEEYL--DYQL---------------------------------- -----------------------------------KAIGSSLE-EMK----KIG------- --------------VKLLPEEAQKLYLEDGE-------------------DFEFPTPTGKI -ELYSTILDE---------------------------------YGFDPIPQYTA-HEEPPE -GY----------YRLLYGRAPMHTFGRTTNNP-----------NLHDLME---ENT---- ------VW----------INSKVAKQ-WGI-------------K-------------NGEY -ITLE---NQ-D--------------GV---RSTP-VKAKVTERIRHDAVFMVHG-FGHS- ------------------------------DKRLRRAYGKGA------DDQRLITRVKI-- ------DPLMG------------------GTGMRVNFVTFRKEEA---------------- ------------------------------------------------------------- -- ->QrcB_Desulfomicrobium_baculatum_YP_003159879 ------------------------------------------------------------- -------------------------------MGLDRRSFIS-L-----VAGGVAGS---LF ----TPVIW-KTLD----------DVSIWTQ---NWPWI----PRLQYGEELTVPALCKLG -ADAYGLKVKTI-AGR----PVAAEG--------NPDHPLSL------------------- ----------------GGICPLGAASVHLLYSPS-RVKNPKLR------------------ --------------------DGS-S-FKDITWE-EAEELL--------AGKIKEA------ ---------------GASMA----------------------------------------- --------------------------MISGDETGS----------------VTDVLSGLV- -G-----KAGSDKSFFMPG----ESAPAAAALAMLG---GDGQV-GYDI-ENANYVLMLGA ---DALG----SW-GNVARNGKAFSASRE---------KGVK----FVYVGPAQNGTSAVA -D----SWIPCAAGTEPVLALGIAAVIAGTNR-DR----------SFWPGFAS-------- ------------------------------------------------------------- --------------FAKFVQTS--------------------------------------- ------------------------------------------------------------- -------------YPLDKVAEITGVSA---------ATITGLAQELVRA-----GRPLVLT -AAEA----GQGLGAFELAAGMSLNMLLQRVNTVGGVRILPWA------------------ -----PKVVEAA------------------------------------------------- ------------------------ADKKAMLANDLV--AYLSTVADGGAEA----PALLMV -YGANPAYA-------------------------------LPNLVKAQA-AID-----KAG -FVVSFSSFMDETAAM--ADLIMPD-SYAFE-RLDDAYSPYGSGQ--------PNYTV-AA -PVIKPVF-D---T--------RPA------GDVLLSVA-AKAELDLGFE----------- -----------------------TFED-----------------------VVKAKAEA--- -------------------------------------LGADFD-EMV----EGA------- --------------VWVSEEFPAQD------------------------------------ ------------------------------------------------LALWTT-PLQELA -VA----AQDGKTLALAPVLRLKIGSSKIAIPP-----------FNTNAIR-FDEML---- ------GN-----DMYVLINAATAKN-LGL-------------K-------------KDDA -VKLA---SS-G--------------GE---C--K-ARVRIFEGVMNDTVVAPLG-LGHT- ------------------------AWDAFSS-------GKGD------NVYKLLA-ADT-- ------ETETG-------LSR----FA--TV-----RVTVSKA------------------ ------------------------------------------------------------- -- ->QrcB_Desulfovibrio_magneticus_YP_002953179 ------------------------------------------------------------- -------------------------------MGLDRRAFLG-L-----VAGGTVGA---MF ----TPIPW-KLID----------DASIWTQ---NWPWI----PRVPKGQVDYVATTSKLC -PAGEGLKIMRV-AGN----PILAGG--------NPSHPLSC------------------- ----------------GGVSALARSEVYMLYSPA-RIKSPMKR------------------ --------------------NGK-T-FAPITWE-QALVEM--------AEKLGAA------ ---------------KGAVA----------------------------------------- --------------------------SISGDNTGT----------------INEVLTALT- -A-----KLGSAGSFMMPS----EATTAAKAMKLMG---AQGQA-GYDF-ENADTVLVLGA ---DIFE----TW-GTSSRNRKAFGANRP---------AGAKPANTYVYVGPSRNNTAAVC -D----QWVPAAAADLGVVALGIAWHLLKAGATSN-------------------------- --------------------------------------------------------APGFD -T------------FKAVVNGG--------------------------------------- ------------------------------------------------------------- -------------FGPEDVKRATGVAP---------ETLAAIAKALASA-----KAPLVVT -GSPF----GQGLGAAPVIAGMSLNMLLGRINKPGGVYMLPEL------------------ -----PSVVPGALTRAAM------------------------------------------- ------------------------------LDGDLP--AFLKGVESGKTPA----PKALLI -YDANPAYG-------------------------------LPEAATMAK-ALE-----KIP -FKVSFSSFMDETAAL--CDLVLPN-SLPLE-RYDDVATPYGSGF--------CVYSL-VR -PIQKPIC-D---T--------KTT------GDVLLGLA-RKLSIDLKFD----------- -----------------------NFQQ-------------------VIKEKVASLAKVSGG -FVAKDVMPWQVAAGKPAPALV---------------GGDLWK-ALE----AGY------- --------------AWTMVGQAAQ------------------------------------- -------------------------------------------TAMGFAAEVVAKAVKAGK -PA--------TATVLAPYAQLRTGTPVTGMPC-----------QDLTTVP-DTELL---- ------GD-----TTFIRVNSETAKT-LGL-------------K-------------KGQM -VKLS---GA-G--------------VD---C--Q-AKVHIFESVMPGMVSAPLG-FGHT- ------------------------AFDYYSQ-------GKGA------NYLSLAA-VVE-- ------EPGSG-------LSM----WI--AP-----EVKIA-------------------- ------------------------------------------------------------- -- ->QrcB_Desulfovibrio_vulgaris_YP_967712 ------------------------------------------------------------- -------------------------------MALDRRGFLK-F-----IGGATAGI---LA ----TPVVW-KGLD----------DVSIWSQ---NWSWI----PRNIKGANSYVPTVSKLC -PTGVGVRVRLV-DGR----PVRVIG--------NPEHPLSK------------------- ----------------GGVSSIAAAEVQMLYSPA-RMKRPLKRSP---------------- ----------------------DGA-YVMISWE-EAEAML-----------LDGLKAAKGG -D---------------ALA----------------------------------------- --------------------------CISGDDNGT----------------INELLSAFV- -Q-----QSGSKS-FFLMP---GEAQPAAKAWDLMG---GEGQI-GYDI-EKSDFVLAIGA ---NVLE----AW-GTAIRNRHAFGASHP-----HGAEPTAQ----FVYAGPVLNNTATGA -D----DWLPIRPGTESAFALGLAHLLIKAGASSS-----APDFDAFRSLAAS-------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------FSPEKVAAQTGVDA---------KALTALAQALAKA-----KHPLVIV -GSEF----SQGAGAAPVMAGIALNMLLGSVNRDGGLRALPVA------------------ -----RKVVPAGMDRKAM------------------------------------------- ------------------------------LQQDLT--LWASAIASGKAKA----PKAMLV -YEANPVYA-------------------------------LPQGSAFKD-TLA-----KVP -FKVAFTSFLDETAMQ--CDLVIPV-SMGLE-RLDDVCTPYGCGE--------VVYSL-AT -PVTAPLF-D---T--------KPA------GDALIALG-GKLGLDLGVA----------- -----------------------SFED-------------------MLKAKAAA------- -------------------------------------HGADFD-KLA----EGT------- --------------AFTSRATVG-------------------------------------- -------------------------------------------ANLSFRPDVLSKALDVKA -PA--------LPLALAPVMKLNMGTSKTAIPP-----------FNTKTIR---------- ------RWEVQGKEGYVMLNGATARK-LGL-------------A-------------QHDR -VVLS---NP-T--------------GK---V--T-VRVNIFEGVMNDTVAMPLG-FGHT- ------------------------AFDEFSK-------GKGE------NVMHLLA-PST-- ------EPVTG-------LAV----WTGAGV-------NIAKA------------------ ------------------------------------------------------------- -- ->ArrA_Chrysiogenes_arsenatis_gb_AAU11839 ------------------------------------------------------------- -------------------------------MRIKRREFLK---------ASAAVGAVAVA -SP-TLNAF---------------AQTGTGA------------SAMGEAEGKWIPSTCQGC -TTWCPVEFLFR-MAV----RSKYAA--------TQLSKANN------------------- ----------------GYCCVRGHLMLQQLYDPD-RIKTPMKRTNPVKG------------ -------------------RKEDPK-ICPYHMGMKQWDTI--------ADKIMEL--RKNN -E-------------THKYL----------------------------------------- --------------------------LMRGRYSDH----------------NSIFYGDLT- -K-----MIGSPN-NISHS-AICAEVEKMGSMATEG---FWGYR-DYDL-DNMKYLIAWAC ---DPLS----SN-RQIPNAIRKIQGVMD----------RGK----VVAVDPRMNNTASKA -Q----EWLPIKPSEDGALALAMAHVIITKGLWSK----------EFVGDFKD-------- ----------------------------------------------------------GKN -K------------FVAGKTVKEEDF----------------------------------- -------EEKLTNGIVKWWNLEV--KD---------------------------------- -------------RTPKWAAKVTGIDE---------ATIIRVATEFAQA----APACAIWY -GPNM-----QPRGSYAVMCIHALNGLVGASDSEGGLCTGMGS------------------ -----PSSSYPKIDAYQDDVAKAGA----------KNKKIDQRGTLKFPAMGSA------- ------------------------KPGTGVVTNNVA--DALLA---ADPYD----IKVAIG -YFCNFNFS-------------------------------GTDGARWDK-ALA-----KVP -FFVHCVPMFSEMTYF--ADIVLPAALHHTE-DWAVIRSKANLH---------GHTSI-QQ -PVVERMF-D---V--------KGVE-----TEITWLLA-EKLKAKGFENMY--------- -------------NWLYNEYK--DPET----------------------GKNPTNSLEFAL -YATKIRSKKCWDPKENAEYKGD--------------KLNGWA-DFM----EKG------- --------------IVNSPKFKFRQKW-----------------------EKGFPTETKKF -EFYSETLKKGLLAHAEKNKVTVDQVMEATNYEAR--------GELAFIPHYES-PKRHGD -VK-------EFPFSLIDMKSRLNREGRSTNAT-----------WYHAFKKCDPGDV---- ------NQ-----EDVLQINPADAKK-LGI-------------N-------------EGDM -VKVT---SV-I--------------GS---L--T-VKARLWEGVRPGCVAKCYG-QGHF- ------------------------AMGRVSAKDFGKAVARGA------NFNDIMP-ADY-- ------DRITG-------ATA----RNGGFT-----GVKIEKA------------------ ------------------------------------------------------------- -- ->ArrA_Wolinella_succinogenes_NP_906980 ------------------------------------------------------------- -------------------------------MEINRRDFLKAT-------ALTAGAVGIAQ -IP-EIEANTQVSG----------EVGKWVA------------------------STCQGC -TSWCSIQGYVV-DGR----LVKVRG--------NPNAKGNH------------------- ----------------GKICPRPHLAIQQVYDPD-RVKTPLKRTNPKKG------------ -------------------KGIDPQ-FVPISWD-EAIDTI--------ADKIMAL--IKSG -E-------------SHKFA----------------------------------------- --------------------------LFRGRYTHMN---------------EI-LYNTFP- -K-----LIGSPN-NISHS-SICAEAEKFGRYYTEA---LWDYA-DFDL-DNTRYVLGWGA ---DPLA----SN-RQVPHFINIWGKVRD----------QAR----IAIIDPRLSATAAKA -D----HWLPIIPGEDSALAVAMAHVILAGGAWNK----------GYVGDFVD-------- ----------------------------------------------------------GHN -Y------------FKPGELVPESIEVEGKIIPVEF------------------------- -------KEKHTYGVVKWWNLEL--FD---------------------------------- -------------KTPEWAEPITGIPA---------KQIRQVALEFAAA----GSRAISWV -SPGA---CMQIRGSYASMAAHALNGLVGSCDSVGGILQGTSV------------------ -----PSGKTPDIKPYLSEEIASALKQKKIDQRGTPKFPALNK------------------ ------------------------KTGGGVVTANVA--NAILD---EKPYD----LKMAIG -YWNNFVFS-------------------------------INGTHLWEK-AME-----KLP -FYAHITTHMAEMTMY--ADIVLPAKMHMFE-RYGFSKNKQNLH---------GYLSI-HQ -PMVKPLG-E---A--------KTDE-----TEIVFMIA-QALAKKGHDAPL--------- -------------RYYQENFK--DPET----------------------GKIPSTPEEFDL -FSVKYFTQPIWDGSSNDKGD----------------SINSWK-ELL----EKG------- --------------VWSTKRYSIGKK------------------------IDNFKTETKKF -EFYSETLKKVLEEHVEKNKLSSIDEAIEASNNTAR-------GERVFVPHYEP-SVRYGD -PK-------IYPLIFAEHRSRLNREGRSQNAP-----------WYYEHKDVDPGDE---- ------IE-----KDVAKINPETAKQ-FGI-------------K-------------TGDR -IRIV---GT-Q--------------AS---I--E-TEVKLWEGIRPGIVVKCYG-QGHW- ------------------------AYGSVASEKFGSK-PRGT------NNNDIHI-HEY-- ------DRLSG-------STA----RHGGTA-----RVKIEKI------------------ ------------------------------------------------------------- -- ->ArrA_Sulfurospirillum_barnesii_gb_AAU11840 ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -TSWCPIQGLVV-DGK----VVKVRG--------NPNSPSM-------------------- ----------------GRICPRPHLAIQQVYDPD-RVKTPLKRTNPKKG------------ -------------------KGIDPK-FVPISWD-EAINTI--------AEQILGL--IKAG -E-------------SHKFV----------------------------------------- --------------------------LMRGRYTH-----------------MNEILYNTFP -K-----LIGSPN-NISHA-SICAKTEKFGRYYTEG---FWDYA---DF-DLTIPVIFWDG -ERDM---------VSSNRQIPWFMNQQG------YVKDRAK----ITIIDPRLSATAAKA -D----RWAPIIPGTDSALAVAIAHVILSEGRWNK----------SFVGDFQD-------- ----------------------------------------------------------GKN -Y------------FIPGSTVPTEVIVDEKSLPVVF------------------------- -------EENHTYGVVAWWNLELKE------------------------------------ -------------RTPEWAEKITGISA---------KDIRTIAREFSDA----GSKAISWV -TTGA---SMQIRGAYASLAAHALNGLVGSVDAVGGTLQGSXA------------------ -----PSGKTPDIKPYLPAEFEAALKQKKIDQRGTLKLGAFNK------------------ ------------------------KTGGGVVTQQVA--DSILT---DKPYD----VKVAIG -YWNNFVFS-------------------------------INGANVWEK-AME-----KLP -FYAHITTHLAEMSMX--ADIVLPAKMHMFE-RYGFSKNKQNLQ---------GYLTI-HQ -PLVKSFA-D---A--------KTDE-----TEIPFLIA-QALAKKGFDGPL--------- -------------RYFQDNFK--DPES----------------------GKAPTNPRRVDL -YAVKQFTXPIWSGESNEKGD----------------TINSWN-ELL----DKG------- --------------VWKTKKYKIGKK------------------------VDNFATETKKF -EFYSETLKKVLIEHAEKNKVTVDEALEALNYTCR--------GELGFVPHYEE-AVRHGD -EK-------TYPFIFAEHRSRLNREGRSQNAP-----------WYYEIKDVDPGDV---- ------AG-----KDVTKINPLDGKK-LGL-------------K-------------DGDK -IKIT---SV-Q--------------GS---I--E-SEVKLWEGTRPGT------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -- ->ArrA_Bacillus_selenitireducens_gb_AAQ19491 ------------------------------------------------------------- ------------------------------------------------------------- ------------------------EQGEWIA------------------------SVCQGC -TAWCAVQVYRI-DGR----ATKVRG--------NPNAKANH------------------- ----------------GHSCVRSHIGLQQVYDPD-RVKQPMKRTNPNKG------------ -------------------RDEDPE-FVPISWE-EAMDTI--------ADKIIEL--RENN -E-------------THKFS----------------------------------------- --------------------------VWRGRYTSN----------------NGILYGNMP- -K-----IIGSPN-NISHS-SICAESEKFGRYYTER---YWGYA-DYDH-ENALYEIFWGG ---DPIA----TN-RXVPHTASIWGELSD----------RAT----LACVDPRFSTTAANQ -M----NGCRLIPGEDGAIASAIAHVILTEGVWYK----------PFVGDFKD-------- ----------------------------------------------------------GQN -R------------FVEGRDVNEDDF----------------------------------- -------EEIQTHGLVKWWNLEL--KD---------------------------------- -------------KTPEWAAERSGIDA---------DQIYRVARGFANA----APKAISFS -SPGS---SMTIRGGYTAMTQAALNGLVGSADNLGGVISNGISV----------------- -----PNNGFPDPSDYIDEIAANGL----------EQDRIDWGGRLEFPALKDS------- ------------------------KSGGVKVTNTVA--DAVLA---EDPYE----FKSRIE -LLDELQFL-------------------------------QPRNGSLGQ-SFG-----QDS -IHGAYDCQSGEQTHF--ADIVLPVPHSQFE-RQSPVAGSNGNLH--------RHLHL-QN -KVIESPF-D---I--------RVDE-----TEIPWMIG-ESLEKKGYSNLI--------- -------------DYFRNEFR--DPET----------------------GEAPTNAAEFDE -IATKHYTHPVWDPTFEKDGD----------------QIDGWE-EYK----RLG------- --------------TWNTNKYEFRQKW-----------------------DGNWGTETGQF -EFYSETLKVALQDHADKHNASIDDVMEATFNTAK--------GELAFVPHYEP-AMRVGD -ES-------EYPLIFMEHRSKLNREARSANTS-----------WYQEFKDIDLGDE---- ------AW-----DDVAKLNPKDAAE-LGI-------------Q-------------NGDM -VRLV---TP-E--------------GQ---I--E-VKAKLWEGTRPGVVAKCYG-QGHW- ------------------------AYGHIASLDRRRQIARGG------NNNIILA-PVH-- ------EALSG-------SGA----RHGGQT-----RVRVEKV------------------ ------------------------------------------------------------- -- ->ArrA_Halarsenatibacter_silvermanii_gb_ACF74513 ------------------------------------------------------------- -------------------------MSRNKTSGISRREFLK-V-------MGSTGAALGLG ----LSATS-GNKV----------LAEEDPY---EVLPE------GEHKSGEWVPTGCAGC -TSWCSLEANVV-DGR----VIKIRG--------NSRSKVNG------------------- ----------------ESSCPRSHLSLQQVYDPD-RIKRPMKRTNPEKG------------ -------------------RDVDPE-FVPISWE-EAFEEI--------ADKIIEL--RENG -E-------------SHKFV----------------------------------------- --------------------------LWRGRYTR-----------------LRDILYGILP -E-----FVGSPN-KISHS-SICAEAEKFGPYYTEG---YWAYR-DYDL-QNSDYILIWGT ---DPIQ----SN-RQVSLYSREWGNILE----------GAR----IATVDPRFSRTAAKS -N----EWLPVKPGEDGALALAMAHVILTEGLWHK----------EFVGDFVD-------- ----------------------------------------------------------GEN -K------------FTAGEEVDEDEF----------------------------------- -------EENYTHGVVKWWNEELKD------------------------------------ -------------RTPEWAADKTGIPA---------EQIVRVAAEFGEA----APHACVFM -GGGG---VMQTRGGYNSMAIHGLNGLVGSIDNEGGAV-RGASV----------------- -----PNQSFPDHSEFLDDISREGL----------DHEMIDRRGRLEFPAFKDG------- ------------------------ESGGGVVTNLSA--DGIIE---EDPYE----IKMGIG -YWNNFNFA-------------------------------APETERWDE-AMS-----KLD -FYVHLVTHQSEMTQY--ADIVIPSTHHMFE-QWGMLYQKGNLH---------THFWL-SR -PMINRHWEL---I--------EPE------AEFSWLLA-EKLAEKGYSNM---------- ----------------LDYFK--TIVD-------------------PETGEEPEDYREFAK -YATKHYMQPVWDPEMESHGD----------------QFDGWE-DFK----EAG------- --------------VWNSDEFEFQQYW------------------------GEFTNSTGDF -EFYSETLKEALEEHAEKHDVSIEEVLEACKYEAE--------GELAFLPHYEE-PYTVGD -DE-------EYPLLLVDSKSALNREGRSANAN-----------WYYDLKDIDPGDS---- ------TE-----ADVIKIHPRDAEE-LGL-------------E-------------DGDE -VVVS---SP-A--------------GE---I--T-CQLNVWEAVKPGTASKTFG-MGHW- ------------------------AYGRVAAEDFADGEPRGG------NNNEIIP-AEY-- ------ERLSG-------STS----FY-SHI-----KVNIERA------------------ ------------------------------------------------------------- -- ->QrcB_Syntrophobacter_fumaroxidans_YP_844744 ------------------------------------------------------------- -------------------------------MKVGRRAVLQFM-------AGAVGGTLL-- ----SPLPWKLTD-----------DAAIWSQ---NWFWR----PSPARGEITRKPTVCALC -EGGCGVQARLV-DGK---RAILLEG--------NPNHPVNQ------------------- ----------------GGICALGAAGLQFLYAPY-RIAQPLKQTK---------------- -------------------RRGDPTGFQPIAWN-EAVGEL--------AKKLGQM--RADG -K-------------PNGLA----------------------------------------- --------------------------GITRRRCSS----------------MDALLNQFF- -A-----AYGSPN-LFKMP-AHADSLKLAGAVTT-----GREAPFGCNI-EDAPYILSFGA ---GLVE----GW-GSPGRMQAAFRRWRQ------GGKSAAK----IVQVDSRCSTTAAMA -D----RWIAVPPGTEAALALGIAHLMVKDKLYDA----------EFMADRVF-------- ----------------------------------------------------------GFE -D------------WTDSQGKNHKGFKFLVQTDA--------------------------- ------------------------------------------------------------- -------------YTPEAISKLTGVDP---------AKIRELAKEFGTQ-----KGAVAVW -GQPQ---GSVPKDMYNELSFLALNALKGNI-KAGGAIGLA-------------------- -----PEVPLGALPELPGDPSALKGLKQLRLDLASSQK----------------------- ------------------------GPPPVLPGNNLH--GFLDAVSNGGKYP----IEVMLV -HEANPAYG-------------------------------LCENKLFQQ-ALT-----KIG -TLVSLSSYMDETAQQ--ADLILPI-HTAFE-GFDDVIGIPGAPY--------AYYGV-CA -PVLKPHL-N---T--------KAA------GDIVMSVA-KQLGGSIAAAL---------- ------------------PWA--SHEE-------------------YLKKRAEGLAASARG -ALADKKGVELWKLQPEEAVKPNYKD-----------GADLWK-KLA----GGA------- --------------CWYDAPVDP---------------------------LKDLKTESGKF -ELAAQLLLAKGQTGD---------------------------DDQVYLPHFSQVPPRGSD -KD--------YPLLLVTYQMSALADRDLANPP-----------FMTKTVF-DFILR---- ------QN-----DQFVEINPATASE-LGM-------------A-------------EGDS -AVLK---TP-Q--------------GE---V--P-VRVHLYAGARPKVVYLAQG-LGHK- ------------------------AYDEYIK-------DKGV------NANGVVE-VQL-- ------DRVTG-------LGT----VW--AA-----RAHLRRA------------------ ------------------------------------------------------------- -- ->QrcB_delta_proteobacterium_NaphS2_ZP_07200609 ------------------------------------------------------------- -----------------------------MTMKITRRNFIA-A-----VVGGVVGI---QV ----TPLPW-KFTD----------DAAIWTQ---NWPWV----PVPAEGAVTEENTVCNLC -PGGCGISVRKV-AER----AVKIEG--------RTDYPVNP------------------- ----------------GGICPVGMGGLQLLYDDDMRFPGPMKRAG---------------- -------------------ARGQGQ-FVNITWG-EAYDIL--------AGRIAKL--RKDG -T-------------PEALA----------------------------------------- --------------------------AIDGNYAGTT---------------TGLLVERFM- -R-----SVGSPN-YVKPN-AITDTYH-MGNLLMMG---KSVPM-AYDL-ENSDFILSFGC ---GLLE----GW-GAPGRVMNAWGMWHD----ANPKNRKTR----VVQVESRASNTASKA -D----FWVAPRPGTDGALALGIAHVLIKKGRVDE----------RFINGFTY-------- ----------------------------------------------------------GFD -D------------LTSSEGQSQPG------------------------------------ -------------------FKTIVSNK---------------------------------- -------------YSPVQVERITGVDA---------GTIVALANAFSKA-----KAPVAVY -GKGK---NNLNGSLYEFMAVQSLNAVKGRINRPGGVLVPDPL------------------ -----PLAPLPEFDPDEVAAKGLETPRIDGAG----------------------------- ------------------------TKAYPFTDSLIN--HFADAINQGARSP----VDTLLV -FSANPFFT-------------------------------VPDGPGFMN-ALE-----KIP -FIVSFSPYRDETANM--ADLILPD-HTYLE-KIEDIVWPVGLQY--------PLYGL-TK -PVVEPVN-D---T--------QHA------GDVIISLS-KAVGEATGSAF---------- ------------------PWE--NFEE-------------------ALQARAKGLFDAGGG -LVHYDASKPPWKFKPFGNGQKPSYKS----------FDDMWG-EMK----SGG------- --------------MWFQPVKLAGMDG-------------------------LFATSSGKF -EFVSQKLRQTINETAAQTSQKAALDQMGIRVA----------GAEAFMGHYAA-PKLG-- ------VDRSKYPLFMVPYEMINLSSGWIATPP-----------FLYKTIF-ASQLL---- ------KE-----ESFAAVNPETAAK-YKL-------------Q-------------QGDR -AIVK---SP-V--------------GE---L--R-VRIDLFEGAMPEMVYMPLG-FGHT- ------------------------AYDEYQK-------DKGV------NPNNIVK-ALN-- ------DPVSG-------YPL----WW--NT-----PVTLTKA------------------ ------------------------------------------------------------- -- ->QrcB_Desulfatibacillum_alkenivorans_YP_002430439 ------------------------------------------------------------- -------------------------------MKLNRRNFLL-VSTAG-AAGGAVGS---MF ----SPLSW-KLMD----------DSSIWTQ---NWPWT----PVPADGEVSFEETTCTLC -PGGCRVKVRKV-DER----PIKLEG--------VEGGPVND------------------- ----------------GGICILGLTALQLLFGPA-RVHTPMKRAG---------------- -------------------KRGEGK-WVEITWE-EAISEV--------SGKLAEI--RETG -R-------------AQDLG----------------------------------------- --------------------------CIAGGGKGV----------------INALFSRFM- -E-----AYGSPNFYWQATAWDCYEENI---LRTLG---LNGTA-GFDL-ENADYILSFGA ---GLLD----GW-GSPVHVFQAHSKWRE------NHDGHAT----LVQIDAQLSNTAAKA -D----KWLPIVPGTEGAVAMAMAHVIISKNLYNR----------GYVNWNTT-------- ----------------------------------------------------------GFR -D-----------FYRTVESEYAPAKVVKIACPVDN------------------------- -------------------------KE---------------------------------- -------------YQKKWL-----------------EELESRAIAFAKA-----DKPLAVA -GKGN---GDRPVSQAELNAVQALNALVGAINRKEGGMVVLPDE----------------- -----PKYPWKPVVMDAEARSYKPSLVSVRGRS---------------------------- ------------------------KYGHSNLVSVLP--QALNSSHEG--------LKVLLL -AGSNPLYT-------------------------------LADTEKTAE-ALQ-----KVE -YIVSFSSQFNDTTAY--ADIILPD-HIFLE-STVDAPTPPGFAK--------PVYGL-AE -PVIKPVY-K---T--------KAM------GDSIIEIA-KAMGGTIAQSF---------- ------------------PWA--DSAE-------------------AIEQA---------- -------------------------------------LGGKWP-LLK----RGG------- --------------VYVNEDFTPETEG---------------------------------- -------------------------------------------VRFRFFARSGMESRISIQ -GK-----AEQYPLIATPVDCIRLATGALADTP-----------FMVKTVS-DKKLK---- ------HK-----ELVVQVNAMTAQQ-YGF-------------K-------------EGSE -AVLE---TP-V--------------AK---A--K-VRVHCSEEIAPGLVGVPRG-LGHI- ------------------------AHDEFVG-------GKGT------NYNTLIS-PVQ-- ------DPATG-------FDV----AW--GI-----RAKLT-------------------- ------------------------------------------------------------- -- ->QrcB_Desulfococcus_oleovorans_YP_001530428 ------------------------------------------------------------- -------------------------------MKIDRRSFLT---------LLAGGAVGTAL ----SPMTI-KLTD----------DISIWSQNFRGTPIE---VPVPERGPASYVDSVCTLC -PGGCGISVRKI-GDR----AVKIEG--------KAGHPVNN------------------- ----------------DGVCALGLSGLQLLYGPW-RVTGPK-------------------- -------------------KKENGR-WKKISWD-RALSEI--------AEKLNEL--REAG -K-------------ADAIA----------------------------------------- --------------------------GISRTGRGT----------------VARLMQRLL- -A-----AAGSP--HFLPV-PTNENAYSDAVARMFG---KPGTV-GFDF-ENSGYVLSFAA ---GLLD----GW-GSPVHMFSAHSQWKT---------NGVK----MVQVESRLSSTAAKA -D----QWVAVKPGTEADLALGLAHVILRDNLNAG----------AAANSRAF-------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------DSFAALVKKD---------------------------------- -------------YTPARVAAATGIKE---------SVIVALAKEFAAA-----SHPVAVC -GRGD---GQTPCDSREVMAVTALNALVGSVNRQGGMIIGPEPDY---------------- -----IQWARPVLDDTAQKGL---------------------------------------- ------------------------AKGPKTLADLLA--GKTPD------------VQALFV -LEANPAYT-------------------------------LHDTTKVKA-ALE-----AVP -LVVSLSSFMDETSAL--ADYILPL-PTCLE-RTEDVVVTAGLKT--------PMIGL-TQ -PVVEPRL-D---T--------RHP------GDVILDLA-KAMGGTVAESF---------- ------------------AWS--DYQD-------------------CLEKT---------- -------------------------------------FGLVYG-KLA----TEG------- --------------YLQKSVLETLIDT---------------------------------- -------------------------------------------AVAVGRADFAP-VVEADK -K----VRQNTPALVLAAYDAMRVAGGAIATPP-----------YAMKIVP-DTILK---- ------KN-----DLYVEINPETAQK-AGL-------------A-------------DGKA -AVVE---TP-A--------------GT---A--Q-VRVRVTHEVAPGMVAMPRG-FGHT- ------------------------AYDDYVS-------GKGV------NVNDLIG-PVP-- ------DPVSG-------LDT----AW--GA-----PAKLIKA------------------ ------------------------------------------------------------- -- ->Gemmatimonas_aurantiaca_YP_002761548 ------------------------------------------------------------- ----------MIAPSATTDHRPSTTMTTEAGTGVKRREFLK-I-------LGATGATTAVV -GC-SSEK----------------VGKLIPY--VTSPDN------TVPGVSQYYATSCREC -AAACGVLAEVR-DGR----PIKLEG--------NPEHPLNR------------------- ----------------GAICATGLAGIQGVYNPD-RYRSPMVR------------------ ----------------------EGNALKPTTWD-KAYELL--------AQKLGEV--KSKG -Q-------------AGNVV----------------------------------------- --------------------------FVNQHETGT----------------FPGFLDQWL- -S-----AQGMPA-HLSVD-STAPIATIAANQKAYG----AAWP-ALNF-SAAKLVISFGA ---DFLD----GW-GHSVPQQLDWADARS------KLDVAPR----LVYIGARRSLTGLNA -D----QWIAAKAGSEMAICAALTGT----------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------GSAAAAAEAANVPV---------ATIEALVKAVADA----GNGIMALC -GVTG------NDAVECGVMVAEINKKGGAVGTTINTAK---------------------- -----AHGSYTGLASYAD------------------------------------------- ---------------------------LAAAVKNMD--AGT--------------VPLAFV -RGANPAHT-------------------------------MPKSAGFAA-AFA-----KVA -FKVSFSSMPDETAQL--ADLVLPD-NHWLE-SWGDAVGEN------------GQISL-QQ -PTLDPVF-D---T--------RAT------ADVLIDLA-KKDQTLAARY----------- -----------------------NVAN---------------------------------- -------------------------------------FRSWYISQF-----PGG------- -----------------ASAFATALTK---------------------------------- -------------------------------------------ASVSGAPLVAT-STRTLA -TTALPVAEGAGEFFVQVYPSSTLGDGAGANKP-----------WLQELPD-PVTKI---- ------AW-----QSWIEVHPSTAKK-LGI-------------K-------------EGSH -LTIE---TA-A--------------GK---V--T-APAYIYMGVRTDTVAIALG-QGHT- ------------------------AYGRFAQ-------NIGV------NAYDLVS-HGW-- ------DSA-G-------SLA----IG--SV-----KGKVTVSADSSPLVTTE-------- --GSARQHGRGIAQAMTLAA----------------------------------------- -- ->ArxA_Ectothiorhodospira_sp_PHS_1_ZP_09695308 ------------------------------------------------------------- --------------------------MKLLETLINRRRFLKAT-------GAVAGAGVVAG -GA-GVVP----------------GLTTLSHARSPAPSA----------DTTITKNICHQC -PARCGIDVYTT-GGR----VHAIYG--------TSDHPISN------------------- ----------------GKLCPKGPLGAYILYDPD-RFKGPMKRTNPNKG------------ -------------------RDQDPG-FVPISWN-EALDMV--------ADRLNGL--RERE -E-------------SHRFA----------------------------------------- --------------------------LLYGRGWGAS---------------CAGLLGNFG- -K-----LYGSPNVAIGHS-SMCSDGSIISKKAVDG---IGGYN-SYDY-KNANMLLMFGA ---GFLE----AF-RPYNNNMQVWGYIRG------VKVPKTR----ITAVDVHMNTTLAGS -D----RALLIKPGTDGALALAIAHVILVDGLWEK----------AFVGDFSD-------- ----------------------------------------------------------GVN -R------------FIPGETVDPDSF----------------------------------- -------EEKWVKGLVEWWNAEL--KD---------------------------------- -------------RSPRWAAQVTTLYE---------RDILATAREFGTT----RP-AIALY -ERGA---HAHSNGIFNGMAIHTLNALVGSLYAKGGLAYQVGPSYGPL------------- -----PVNADDYLDDWARTGGWK------------AQPRIDLKGH---------------- ------------------------PDGYLLANNMMQ--EIGPNSLQGKPYK----LDTIMF -YLNNAIWT-------------------------------APDVKAWEE-ALK-----EL- -FVIETSPFPSETAMF--ADVILPD-HTYLE-RLQDAPTYPFQGW--------PMTQL-RV -PAVKPLY-D---T--------KYF------GDVLIELG-KRIQGSMGEYY---------- --------------QALDNTE--NVIR-------------------HLAKGFESDPGDNGV -N-----------------------------------SFESWK--------EKG------- --------------VWYKRVYPYRQIDGEFYEWDGQDHTRL--MSADEVRGALFKTASGKF -EIRSGWLEAHADWIAAKTGRD---------------------PSRLMFPIWEE-PSHPGG -GD----------LYMVTPKVALHAEGRGANLP-----------VAIANMQ-PTLGG---- ------RN-----TIYIEINPKTARA-RGI-------------P-------------DGSR -VRIS---SD-L--------------GA---I--E-GYCKYYEGVRPDTLVFPME-HGHW- ------------------------AHGRWAK-------GRKP------GHSGEITVNQS-- ------DRITG-------QCS----YY--TT-----KVRIERA------------------ ------------------------------------------------------------- -- ->Halorhodospira_halophila_YP_001001949 ------------------------------------------------------------- --------------------------MSVLDHLVSRRRFLQ-A-------TGVGGGAVAAG -GV-GHLLS---------------FSAGGSHARADGPVG--------GGETQITKNVCHQC -PARCGIDVYTT-DGR----VHAIYG--------DPGNPIAN------------------- ----------------GRLCPKGHLGSYILYDPD-RFKGPMKRTNPNKG------------ -------------------RDEDPQ-FEAISWD-EALGIV--------AERLNRL--REQE -E-------------SHRFA----------------------------------------- --------------------------LMYGRGWGAS---------------CAGLLGPFA- -K-----LYGTPN-VIGHS-SMCSDGSMVAKGLTDG---NESYN-AYDY-RNTNYILNFGA ---GFLE----AF-RPYNYLMQVWGHMRT-------KSPKTR----VTAVDVHMNPTLAAA -D----RAVTIKPATDGAMALAIAHEMLVNGYWDR----------DFVGDFTD-------- ----------------------------------------------------------GAN -R------------FEAGTEIDPDDF----------------------------------- -------EEVWTQGLIRWWNDEL--KD---------------------------------- -------------RTPEWAESITTVPA---------ETIRRVAYEFGTT----RP-AMAIM -ERGP---TSHSNGTYNGMAIHALNALAGTLFTEGGLFYQMDVPYGDG------------- -----PADPDDYLDDYAGRMQERFDEGEIPRIDKLG------------------------- ------------------------TDRWPLARNMMQ--EVGPNHAAGEPYK----LDTILF -YLNNPIWT-------------------------------APDATAWEE-ALK-----DV- -FIIDTSPFPGETARY--ADLILPD-HTYLE-RLQDAPTYPFEGY--------PMTAL-RT -PAVEPLY-D---T--------KVF------GDILIEIG-KRLDGPAGEY----------- -------------------WQ--------------------------AVGDTENLLRHLAE -GFRDHPGDNGVE------------------------DFESWK--------AKG------- --------------VWYKKPYHWKQERGVFYEWVEDDGDYTHEMSAEEVADKLMPTPSGRF -EFFSEKLQEHADFVASEFGID---------------------HERAGLIQWVD-PDHPGG -GD----------LYFSTPKTALHAEGRGANIP-----------HAIAHVQ-PVMGG---- ------RT-----TVYLEIHPRTARE-RGI-------------R-------------SGDR -VRIV---SD-V--------------GE---I--E-AYARLFEGTRPDTVCLPME-HGHW- ------------------------AQGRWAE-------GRKP------GHSGEVTVNQS-- ------DRISG-------LAS----YY--TT-----KVRVERA------------------ ------------------------------------------------------------- -- ->Alkalilimnicola_ehrlichii_ABI55571 ------------------------------------------------------------- -------------------------MKMILDTLLNRRRFLKAT-------GATGAAAATTA -GVGKLAGF---------------TAASTTSTHVNARPG---------GETRVTKNICHQC -PARCGINVYTT-NGR----VHAIYG--------DPGNPIAN------------------- ----------------GKLCPKGHLGTQLLYDPD-RFKGPMKRTNPNKG------------ -------------------RDEDPE-FVPISWD-EAFDIV--------AERLNRL--RERG -E-------------SHRFA----------------------------------------- --------------------------HFYGRGWGSS---------------DAGLYGDFG- -K-----LYGTPNSAIGHA-SMCAEGSKRAKRATDG---NDSYN-SYDY-RNTNYILNFGA ---GFLE----AF-RPYNYLMQVWGHMRT-------KSPKTR----VTTIDVRMNPTMAAS -D----RALMIKPGTDGALALAIAHVILTEGLWDK----------EFVGDFED-------- ----------------------------------------------------------GRN -H------------FRTGETIIPDAF----------------------------------- -------QANWTHGLAEWWNGEL--KD---------------------------------- -------------RTPEWAEEITTIPA---------KHIYTVAREFATT----RP-AMAIM -ERGP---TAHFNGTYNGMAVHALNALVGSMFAEGGLFYQMGPSYGPL------------- -----PVSADDYMDDYAREMQGKHPRIDMAG------------------------------ ------------------------TEKWPMAGTMMQ--ECAKHHLAGDPYK----LDTAMF -FVTNPIWT-------------------------------APDPRLWEE-ALK-----DV- -FIIDTSPYPGETAMY--ADIIMPE-HTYLE-RLQDSPTYPFEGW--------PMAAL-RT -PAVDPVY-D---T--------KHF------GDMIIEIG-KRINSPMADYY---------- -----------------RELG--DVEN-------------------MLRHRAAGFANDPGD -N---GVN-----------------------------DFESWK--------EKG------- --------------VWYKKPYHWRYWRGTFYEWDGEGYNI--EMSEDEVKDKLMPTASGKF -EFKSSFLENNANYIARE--MGIA-------------------EDRVGLIQWVE-PRHTGD -GD----------LHFVTPKTPLHAEGRSANIP-----------QAQAYMQ-PIVGG---- ------RG-----TCYLEIHPKTAQE-RGI-------------N-------------DGDT -VRLS---AQ-VR-------------GETKSI--L-AVARYMPGHRPDTLVLPME-YGHW- ------------------------AQGRWAT-------AQGRDM-KPGHSGDLTE-NLS-- ------DPISG-------LAC----YY--TA-----KVRLEKA------------------ ------------------------------------------------------------- -- ->RBG1_855 ------------------------------------------------------------- -------------------------------MQVTRRDFLT------------------FA -GF-TLAGI---------------TLGEWGRSKILAREEYKDTLYSGIGKEEFRLSICGQC -PAGCGIVVRLM-DGN----PKKIDG--------NPLCPLSR------------------- ----------------GKLCPKGQNGLQVLYDPD-RLTGPVKRKG---------------- -------------------KRGEND-WEKISWE-EAINTV--------SQKLKEL--KEKQ -N-------------SYRLL----------------------------------------- --------------------------ILTQENKGL----------------SGKLWKQFA- -R-----AYGTPN-LVEGN-LLRDPGILWASYLMQG---IKDYP-AYDI-ENTKYILCFSP ----FLE----GW-YSPTWAQRMYGNFRR-----KRPEIRGK----LVQIEPRLSPTAANA -D----EWIQINTGTEAALVLGLAYLIIKEGRYDE----------NFIREHTF-------- ----------------------------------------------------------GFE -D------------WTDAQKRTHLG------------------------------------ -------------------FKNFVLQE---------------------------------- -------------YDTEKVSSLTGVPI---------VTIIRLAREFSEL----NPALAIAE -QRPA------SGGFYLQMAILALNALVSSLDVKGGVIIQREV------------------ -----PFKEFPEVSGSKKESILNQE------------------------------------ ------------------------RFSSQEVFPHLT--KAILE---EKPYP----IEIVLI -DKINPFSH-------------------------------CFPIINFKE-ALE-----KIP -FIVSFSPFLDETSLY--ADLILPD-HTFLE-KWQDVVPSATLGS--------PVLGI-SR -PAVDPFL-D---T--------KNT------ADVILEIA-HDRDILAYSTL---------- ------------------PWK--NYGE----------LLKDSLQGIYLSRRGMTYGTSFQG -AWMSQMEKGGWWSPTYTN------------------FEEFWN-QLL----EKG------- --------------GWWDPFYEHQKWD------------------------RVFKTPSGKF -EFYSQIFKNQLASIKPSKEN----------------------SDFKILPHWES-VVWEGD -EN-------SFPLYLNVFELLMFSAVLNSNQP-----------YLYEHIT-PHLSV---- ------QW-----ESWVEIHPEKAKA-LGI-------------E-------------ENDE -VWVE---SV-L--------------GK---I--K-TKAKLYFGTHPEVVSLPLG-LSGL- ------------------------SQSSWIK-------KEIS------NPNQLVT-GNS-- ------GNL---------ENK----YL---------RVKIYKA------------------ ------------------------------------------------------------- -- ->II_OP1_uncultured_candidate_division_UNIPROT_TREMBL_H5SSA4 ------------------------------------------------------------- ----------------------------MHLRRLSRRTFLK---------AAVATSAATA- ------------------------VLSHWPRSGRGIQEG------ATPAQERWVKSVCLQC -PAACGIMVRVV-KDSLGERAVKIEG--------NPNHPSNQ------------------- ----------------GGICPKGHIGLQILYDPD-RLQGPLRRVG---------------- -------------------PRGEGK-WEPISWE-EALQIV--------TERLKKL--RERG -E-------------PHKLV----------------------------------------- --------------------------IMSGRNRGQ----------------MGALIDRFL- -A-----AFGSPN-HVGHS-SICSDGAKLAHYLTQG---FKHYA-AYDW-DNCNYLLSFGA ---GFIE----AW-RPTVRLLRAFGHMRR------GRPIRAK----IVQIETRFSVTAAKA -D----EWLPINPGTDGALALAIAHVIVREGLYNK----------KFVEEHTF-------- ----------------------------------------------------------GFE -D------------WEDEQGHFHQGFKTLIRQ----------------------------- ------------------------------------------------------------- -------------YTPAWAAPITGVPE---------ETIVRIAREFATT-----PPQIAAG -QRGA---MMQTNGIYNYMAIHALNALVGSIDAPGGVL-VQIDP----------------- -----PLTPWPPLAQDEIAQTGV------------KQPRIDHAGTEEFPLA---------- ------------------------AN----VYAALP--DFIIN---EDPYA----IDTLML -YYTNPVFS-------------------------------SPDAPKYSQ-AFE-----KIP -FIVSFSPFLDDSSLF--ADLILPD-HTYLE-RWHDDVIYPSLGY--------PVYAV-RQ -PVIAPLY-N---T--------RNT------GDLLIELA-HRLGGTVKESF---------- ------------------PWK--DFLE-------------------LIQFRARGIYESGRG -NIQANS------------------------------FEEFWQ-QLL----EVG------- --------------FWTDPPYPFGQWE------------------------RVFKTPSKKF -EFFSQKLAHTLEDLAKKKAEHEGIPEEEALDKILTRLKITARGDAAFMPHYEE-PRFVGD -PK-------EYPLYLNTYKLMAHAEGRGANSP-----------WLQEILG-THVGR---- ------RW-----ETWVEINPTTAQK-LGI-------------T-------------EGDW -VWVE---SP-L--------------GK---I--K-VRAKLHPGAKPDVVNIPFE-RGHR- ------------------------SYGRWAV-------GFGA------NPNEVLA-REY-- ------DYLGG-------DAA----FF--ST-----RVKVYKAQEGE-------------- ------------------------------------------------------------- -- ->ACTB1_Geobacter_sp_M18_YP_004200644 ------------------------------------------------------------- ---------------------------------MKRRTFLQ-I-------SGMTAA---SA ----LISGC-QSA-----------NEKLIPY---LIPPD----EGITPGKAVYYASSCRSC -PAGCGILVRVS-EGR----AKKIEG--------NPEHPVNR------------------- ----------------GKLCARGQALLQELYHPD-RVPQPLKRSG---------------- -------------------PRGSGQ-FTRISWE-EGLNLL--------TGQLKGL--ERAG -A-------------AERLA----------------------------------------- --------------------------LMTPQLRGT----------------LATLAATFM- -S-----SFGSPH-HLSYE-LLAPDALRAANRASFG---QPSLP-WYDI-AQTRYLLSFGA ---EFVD----HH-LSPVHYGNAFGRMRQ-----ERDTVRGH----FTYVGGRLSLTAASA -D----RWMPARPGSEGALALGIARLILSESLHDR----------GALSANGL-------- ------------------------------------------------------------- ----------SATDLLAGLAS---------------------------------------- ------------------------------------------------------------- -------------YDLARVAELTGLSR---------EAIAEVAREFATT-----RPSLAMA -GEGV---AFLSNGPETLRAIGLLNLVTGNLNSPGGVYPDGSF------------------ -----PDGPENSFADLVS------------------------------------------- ------------------------------LVGAMA--GG---------------RIALAL -IQGDPLHR-------------------------------VPAATGFPE-ALA-----KVP -YIVSFSQIMDDTALQ--ADLILPD-HAQLE-SWGDVIPVAGGRF--------PLTGL-MQ -PVVTPVF-D---T--------RQF------PDVLLAAA-AALGGKTARAL---------- ------------------PFP--SYQE-------------------LVKKSVLQRAARVKG -EE----------------------------------AEEIWTSLLQ----KGG------- --------------DFREGPEQPKGYRW--------------------------------- -------------------------------------------APGASLPAPQA-PLFAGD -ER-------SFPLHLQLYPSTAFLDGRGAPLP-----------WLQQLPD-PMSTV---- ------VW-----DSWVEMNPKTAAG-LGI-------------A-------------HGDL -VEVS---SP-Q--------------GS---L--R-LPAVVYPGIRPDLVAIPIG-QGMR- ------------------------GGGRYAR-------GRGV------NPLSLLA-AKL-- ------KGTGP-------TPC----WS--AT-----RVKLVRISGDGGLVTNGNPQGSYRS -DLVGI------------------------------------------------------- -- ->ACTB1_Geobacter_metallireducens_GS_15_YP_384764 ------------------------------------------------------------- ---------------------------------MKRRTFLQ---------LGTVIAAGAVL -D--GCRSK---------------NEQLIPY--LIPPDE-----GITPGKGTYYASSCNAC -PAGCGILVRVS-EGR----AKKIEG--------NPEHPINR------------------- ----------------GKLCARGQAVVQELYHPD-RVPHPLKRNG---------------- -------------------PRGSGA-FTRISWQ-EGIGLL--------TDRLKAL--QREQ -S-------------TNGLA----------------------------------------- --------------------------LLTPHLRGT----------------LAELTGRFM- -R-----TFGSTN-HVSYE-LLTPDLLRIAARRSFG---QPTLP-YYDI-AETRYLLSFGA ---DFVD----SH-LSPVKYGSAFGEMRQ-----GRDTVRGH----FTYVGGRMSLTAASA -D----RWMPAKPGSEGTLALGIARLILAESLYDS----------GALAMNGL-------- ------------------------------------------------------------- ----------EAKKLLAALDR---------------------------------------- ------------------------------------------------------------- -------------YDLPRVAQLSGLPQ---------GAIAEVAREFAST-----RPALALA -GEMV---AFQSNGPESVRAVHLLNLLVGSLNRPGGIYPDAGS------------------ -----PSGPENSFAELIA------------------------------------------- ------------------------------LIETMR--GGH--------------VKVAMI -HG-DPLYS-------------------------------VPPATGFHD-ALA-----KVP -FIVSFSSLLDDTALH--ADLVLPD-HAALE-SWGDVIPVAGTRE--------PLVGL-MQ -PVVEPLF-D---T--------RQF------PEVLLATA-HELGGRMAA------------ -------------ALPDESYL--ELLK-------------------GAVRKQAGFGAGVD- -------------------------------------FEAAWVDLLQ----HGG------- --------------LFKTKSVQPTGYR---------------------------------- -------------------------------------------WSSDAPPPLPEDPDFAGD -QK-------TYPFHLIAYPATAFYDGRGAPYP-----------WLQQLPD-PMTTV---- ------VW-----GSWVEINPETAAE-HGI-------------G-------------FGDL -VEVS---SP-Q--------------GT---L--R-LPAVVYPGIRPDMVAIPLG-QGHR- ------------------------GMGRYAQ-------GQGV------NPLALVARQGT-- ------KQ----------QPA----WN--AT-----RVRITRISGNGELVTAGHPQGSLRS -ELVEI------------------------------------------------------- -- ->ACTB1_Geobacter_uraniireducens_Rf4_YP_001231524 ------------------------------------------------------------- ---------------------------------MKRRTFLQ-L-------SGMTAA---GT ----VLSGC-QSG-----------NEKLIPY---LVPPD----EGVTPGKADYYASSCRFC -PAGCGILVRVS-EGR----AKKIEG--------NPAHPVNR------------------- ----------------GKLCAMGQAVLQELYHPD-RVPQPLKRSG---------------- -------------------PRGSGA-FTRISWE-ESLELL--------AGQLRAL--QREK -A-------------TDRLA----------------------------------------- --------------------------LVTPQLNGT----------------LVELTTRFM- -R-----VFGSPH-HLSFD-LLGPDWLRTATRRSFG---QPGLP-WYDV-AETRYLLSFGA ---DFVE----HH-LSPVQYGYAFGRMRQ-----GRDTVRGH----FTYVGGRMSLTGASA -D----RWMPARPGSEGALALGMARLILAESLSDA----------GSLAVNGL-------- ------------------------------------------------------------- ----------QTEKLLRRLEA---------------------------------------- ------------------------------------------------------------- -------------YDLPRVAEQTGLPQ---------RIIAEVAREFATT-----RPALAMA -GETV---AFQSNGPDAVRAVQMLNLLVGNLNRPGGVYPDGGSRVG--------------- -----PENSFTELLS---------------------------------------------- ------------------------------LVAAMR--DGR--------------FRVAMI -HG-DPVHA-------------------------------IPPATGFQE-ALA-----RVP -FIVSFSSLMDDTALQ--ADLILPD-HAALE-SWGDVIPLAGTRD--------RVIGL-MQ -PVVTPLF-D---T--------RQF------PDVLMAMA-DKLGGKTAAF----------- ------------------PYQ--SYQE-------------------MLKGTMEKRVGRAAR -RD----------------------------------FETVWVELLR----QGG------- --------------LFETRQGQEKGYRR--------------------------------- -------------------------------------------APGSSLPNPAE-PRFAGD -EK-------RFPLHLLVYPSIAFYDGRGAPLP-----------WLQQLPD-PMTTV---- ------VW-----DSWVEINPRTAAE-MGI-------------G-------------FGDL -VEVT---SP-Q--------------GA---M--R-LPAVIYPGIRPDMVAIPLG-QGHR- ------------------------GMGRYAR-------GRGS------NPLVLLA-LIT-- ------DGTET-------RPA----WH--AT-----RVRLTRISEKGELVTAGHPQGSYRS -ELIEI------------------------------------------------------- -- ->ACTB1_Mariprofundus_ferrooxydans_ZP_01451016 ------------------------------------------------------------- ------------------------MSENKSSSNWTRRSFIK-A-------MGLGGAAGSAL ----VLSGC-GDTDIINEVDIEVRKEKVEPN--VDPQDY------VRPGIEMYYASTCRQC -PAGCGVHARIR-EGR----VLKLEG--------NPVSDVNH------------------- ----------------GRLCPMGQAGLQSHYNPD-RLTKPMLRKG---------------- -----------------------GK-LVEISWD-EAEDVL--------RKNLGRK------ ---------------NAKLA----------------------------------------- --------------------------WLSGATSGH----------------HRALVDAYL- -A-----AAGAKN-HFVFD-TLPPAVGHAANQEMFG----SYMP-RLDF-DKARLIVSFGA ---DFLG----TW-MSPVQFSTQYAEFRN--------APRGT----LVQIEPKMTLTGANA -D----RWIPARPGTEGHLALALASLLVQKSEYAD------RVPADVVASLKD-------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------VNVDEVAKLCDIPV---------ERIHHLHHLMTD-----RSPSLVLS -GASA---EGVQHGFETARAILMLNVLLGNVGETIL------------------------- -----PRSEDPFPALAPRMGGWS-------------------------------------- ------------------------------EVKAMV--DGLNKGS----------FDTVVV -FGSNPLYQ-------------------------------APGFMQADK-AFD-----KAK -FRISFSMFPDETTMA--CDLVLPV-HSYLE-EWNTTMPAYAATD--------GYLGL-QQ -PVMNPVF-GSHAT--------RSF------GDLMLDVL-KHMDPNFKQ------------ -------------------WD--SYQA-------------------YVMGALWTMRPALVK -QYKPSVPGQT--------------------------EEEAFKQGIL----SDG------- --------------FVQMKVAKAAKIE---------------------------------- -------------------------------------------AKVSAVTLPAE------- ------KANANYPFRLIPSARLGLWDGRHANVP-----------WLQELPD-QLTEV---- ------VW-----DSWIEIHPKTAEK-LGV-------------I-------------TGDV -VQVE---SS-A--------------GK---A--K-VKVVVFPGIHPDAVAIPLG-QGHT- ------------------------EYGRYAK-------GVGV------NPFSILA-ALF-- ------DGKTG-------ELA----TY--AT-----DVKVAKIESRGKLVTLANGDLVLES -NTSTQAG-RELVKTTTAENFDLTEKGA--------------------------------- -- ->ACTB1_Sideroxydans_lithotrophicus_ES_1_YP_003523268 ------------------------------------------------------------- ---------------------------MMTENDFNRRDFLK-V-------LGWGGT---AV ----ALSGC-GNTSIQDG------QETVTSY--VELPSY------VIPSISNYFNSTCAQC -DAGCNIMGRVR-EGR----VLKAEG--------NPNSPINR------------------- ----------------GKMCGLGQSGVQAHYNPD-RVRQPLL------------------- --------------------KGEA-----ITWD-KALGVI--------AQNLSAVK----- ---------------GAEVA----------------------------------------- --------------------------FLTGGMSGH----------------VQALLGNYM- -D-----ALGSKN-HFSYE-AISPAVLRAANKKAYG----VSMP-RYRI-DKAKVVVSFGA ---DFLG----AW-VSPVHFTQQYAQFRK----GNRPEGRGV----LVQIEPKMTLTGANA -D----RWIAVRPGTEGVLALGIINALGKAGLSIP----------ADIAAVSN-------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------AYTAERVSGETDVSA---------EQIGKLAALLKE-----RTPSLVLA -GGAV---EGYAHGSQNATAIALLNRVLGNVGKTVEAT----------------------- -----ASVPFPQIAPTVGN------------------------------------------ ------------------------RSSLIGLNDGLA--AGK--------------YKVVFS -YGVNPVFS-------------------------------APASLKFRD-NFA-----KAE -FKVAFAQYMDETALA--ADLVLPL-DSAME-DWGTVVPEYMAAPAEDHSAAYAQMSF-RQ -PLMQKVFPD---T--------RGV------GDILLALL-KQREADKYKEF---------- ----------------EDFYS--YLRS-------------------AVLKNKVALGGKATD -D-----------------------------------DETFWD-NTL----SQG------- ------------IVPFKGIANPVSAK----------------------------------- -------------------------------------------ASAAGLKLPSA-V----- ------TADSSYPLRLIPAVSASMRDGRNANEP-----------WLQESPD-PLTTI---- ------VW-----DSWVEINPKTAAK-LGI-------------V-------------EGDI -VEVA---SK-S--------------GS---I--R-TQAYLFPGIHPDAVSVPVG-YGHE- ------------------------AMGRYAK-------GVGA------NVFGMLD-TVF-- ------DKETG-------ELA----LNETSVKISKVGQRVIIVKEEGPVGGSQDGKKKIAV -QVSADKVDLSKEV----------------------------------------------- -- ->ACTB1_Gallionella_capsiferriformans_ES_2_YP_003846257 ------------------------------------------------------------- -------------------MIDSGSVKQMAGHPFDRRDFLK-V-------LGWSGA---AV ----ALSGC-GNTSVEDG------RETVVSY--VEANDY------MVPGIGVYFNSTCAQC -DAGCSVNGRVR-EGR----VLKLEG--------NPDSAINK------------------- ----------------GKLCGLGQAGVQHHYNPD-RVREPLLRNG---------------- -------------------NKGEA-----ISWD-KAYALI--------AEKLAGVQ----- ---------------GEEIA----------------------------------------- --------------------------FLSGGVSGH----------------LKVLLGNYL- -D-----SLGTKN-HFVYE-AIAPSVVRAANVKAFG----VEMP-RYRF-DKAQVVLSFGA ---DFLG----SW-VSPVHFSQQYAQFRK-----GVNGQRGV----LIQVESKMTLTGANA -D----RWLAVKPGTEGVLALGIINALGMATGDVA----------ELVKG----------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------YDKARVSRETGVST---------GQIDKIAALLKL-----RSPSLVLA -GSAA---EGYAHGSQNAAAINLLNQVLGNVGKTIEAP----------------------- -----VSVPFPQMAP---------------------------------------------- ------------------------SKGNTVALKNLN--DGLAAGK----------YKVVFN -FAANPVFT-------------------------------APGAFKFKD-NFA-----KAG -FKVAFAHYLDETALQ--ADLVLPL-DSALE-DWGTQVPEYLTEG--------AQINI-QQ -PLMERLHAD---T--------RGM------GDILLSLI-KQKKADEYKGF---------- ----------------EDYYA--YLRG-------------------AVLQNKGALGGGGVE -------------------------------------DDTFWNDTLTNGIVKLA------- --------------GTTTSLAAHAS------------------------------------ -------------------------------------------AAGLLLPAEAE------- -------ADEHFPLHLIPGVTASLRDGRHTNQP-----------WLQESPD-PLTTI---- ------VW-----DSWVEIHPKKAAE-LGI-------------V-------------EGDI -VEVT---SK-T--------------GS---V--K-AQVYLFPGIHPEAISIPVG-RGHD- ------------------------AMGRYAK-------GYGV------NPFQIMD-AVF-- ------EAATG-------ELA----MH--ET-----RVKISKTGQRVLVVKDEGAAGALQM -GRKIAARVSTDQVDLSKEV----------------------------------------- -- diff --git a/assets/trees/dmso/dmso.refpkg/dmso_phylo_model.json b/assets/trees/dmso/dmso.refpkg/dmso_phylo_model.json deleted file mode 100644 index 7d4156c1..00000000 --- a/assets/trees/dmso/dmso.refpkg/dmso_phylo_model.json +++ /dev/null @@ -1,11 +0,0 @@ -{ - "empirical_frequencies": true, - "datatype": "AA", - "subs_model": "LG", - "program": "RAxML version 8.2.9", - "ras_model": "gamma", - "gamma": { - "alpha": 2.776473, - "n_cats": 4 - } -} diff --git a/assets/trees/dmso/dmso.refpkg/dmso_refs.fasta b/assets/trees/dmso/dmso.refpkg/dmso_refs.fasta deleted file mode 100644 index f147286f..00000000 --- a/assets/trees/dmso/dmso.refpkg/dmso_refs.fasta +++ /dev/null @@ -1,917 +0,0 @@ - ->Acidovorax delafieldii_NARG -MSHFLDRLSYFSQPRENFAQGHGQTNGEDRTWEDAYRDRWAHDKIVRSTHGVNCTGSCSWKIYVKGGIVT -WETQQTDYPRTRPDLPNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLKHWRAAMALAKSPVDAWASIV -ENDASRSEWQKQRGLGGFVRSTWDEVNQMIAAANVYTIKKHGPDRIIGFSPIPAMSMISYAAGSRYLSLI -GGVCMSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSSYIIAWGSNVPQTRTPDAHFLTEVRYKGTKVVS -ITPDYSEVAKLGDLWMHPKQGTDAAVAMAMGHVILKEFYFKDGGKGRSAYFDDYARRYTDLPLLVVLKEK -TLPDGRTVMVPDRYVRASDFPGQLDQSNNPDWKTVGYDELGQVTLPNGSIGFRWGADGRADQGLWNLENK -EARTGNTVKLKLSVIEDGVQAHDVADVAFPYFGGVQTPNFTANEQGGDVIVRRVPVSHLELAGHEAQGRV -MVATVFDLLAGNYGIDRGLPGEEPGGSYDADRPYTPAWQEKITGVPRDQIITVARQFADNADKTHGKSMV -IIGAAMNHWYHCDMNYRGIINMLMLCGCIGQSGGGWAHYVGQEKLRPQTGWTALAFALDWIRPPRQMNST -SFFYAHTDQWRYEKLGMEEILSPLADKKSYSGSMIDYNVRAERMGWLPSAPQLKTSPLQVAKDAAAKGMD -AKDYVVQSLKNGSLTMSCEDPDHPDNWPRNMFVWRSNILGSSGKGHEYFLKHLLGTTHGVQGKDLGQDEA -KPEEVQWHAKAPEGKLDLLVTLDFRMSTTCLYSDIVLPTATWYEKNDLNTSDMHPFIHPLSTAVDPAWQA -KSDWEIYKGFAKAVSEVSVGHLGVEKDVVLTPIMHDTAGEMAQPYGVRDWKRGECELIPGKTAPQVTVVE -RDYPNLYKRFTALGPLMDKAGNGGKGIGWNTQTEVGQLGDLNGRVKEEGVTQGMPRIVTDIDATEVVMML -APETNGHVACKAWEALGKQTGRDHVHLALHREDEKIRFRDIQAQPRKIISSPTWSGLESEKVSYNAGYTN -VHEYIPWRTLTGRQQFYQDHPWMRDFGEGFVSYRPPVHLKALHEVEGKKPNGNREIALNFITPHQKWGIH -STYSDNLIMLTLNRGGSVVWLSEDDAARAGIVDNDWVELFNANGAIAARAVVSQRVNPGMVMMYHSQEKI -INTPGSEITGTRGGIHNSVTRVVLKPTHMIGGYAQYSYGFNYYGTIGTNRDEFVLVRKMDRVDWLDDDVS -DAPAHA - ->NxrA1_Nitrospira_defluvii_YP_003798853 -MMQLSRRQFLKVSAGTVAVAAVADKALALTALQPVVEVNNPLGEYPDRSWERVYHDQYRYDSSFTWVCSP -NDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGTFAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKG -WKQWMDDGSPELTSDVKRKYKFDSRFLDDMVRVSWDTAFTYVAKGLIVIGTRYSGEAGARRLREQGYAPE -MIEMMKGAGVRTFKHRAGMPILGMMGKHANTRFNNCVLPLLDSWIRKVNPDQAQGGRYWNNYTWHGDQDP -SQPWWNGTQNCDVDLSDMRFTKLNTSWGKNFVENKMPEAHWKLESMERGARLVIITPEYNPTASRADYWI -PVRPETDGALFLGASKIILDENYQDIDFIKGFTDMPLLVRTDTLQYLDPHEVLKDYQVPDFTKSYSGRVQ -GLSQDQVQRLGGMMVWDLAKGKAVPLHREQVGVHLAQSGIDPALTGTYRIKLLNGREVDVMPIYQLYTIH -LQDYDLDTVHQVNRAPKDLIVRWARDCGTVKPAAIHNGEGVCHYFHMTSMGRAAALVMMLTGNIGKFGTG -CHTWSGNYKVGIWQAAPWSGAGASVYLGEDPWNLNLRDDVHGKEIKYRKYYYGEEPGYWNHGDNALIVNT -PKYGRKVFTGKTHMPSPSKVRWVVNVNILNNAKHHYDMVKNVDPNIEMLVTQDIEMTSDVNHADVAFAVN -SWMEFTYPEMTATVSNPWVQIWKGGIRPLYDTRNDLDSFAGVAAKLKEMTGEQRMADTYKFVYHNRVDIY -VQRILDASTTFFGYSADVMLKSEKGWMVMCRTYPRHPLWEETNESKPHWTRSGRLETYRIEPEAIEYGEN -FISHREGPECTPYMPNAIMTTNPYVRPEDYGIPVTAQHHDDKTVRNIKLPWSEIKQHPNPLWEKGYQFYC -VTPKTRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYCYVDGNPVD -RPYRGWKPSDPFYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTAKSVKGHETRPDGRAIAVDTGYQSNFR -YGAQQSFTRSWLMPMHQTDSLPGKQANALKFKWGFEIDHHAVNTVPKECLIRITKAEDGGIGARGPWEPV -RTGFTPGQENEFMVKWLKGEHIKIKV - ->NxrA2_Nitrospira_defluvii_YP_003798871 -MQVSVSRRQFLKISAGTVAAVAVADKVLALTALQPVIEVGNPLGEYPDRSWERVYHDQYRYDSSFTWCCSPNDTHGCRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGTFAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQWMDDGSPELTPDVKRKYKFDSRFLDDLNRVSWDTAFTYVAKAAVLIATRYSGEAGARRLREQGYAPEMIEMMKGAGVRTFKHRAGMPVLGIVGKMMNTRFNGGCLPLLDSWIRKVDAEKAQGGKYYSNYTWHGDQDPSHPFWNGTQNCDVDLSDMRFSKLNTSWGKNFVENKMPEAHWKLESIERGARIVVITPEYNPTAYRADYWIPVRPETDGANFLGAAKIIFDENLQDIDYIKEFTDLPLLVRTDTLQYLDPRDVIADYKFPDFSKSYSGRIQSLKPEQVERLGGMMVWDLAKGKAVPLHREQVGFHFKESGIDPALTGTFRVKLLNSREIDVMPIYQMYQVHLQDYDLDTTHQITRAPKDLIVRWARDSGTIKPAAMHNGEGVCHYFHMTEMGRAAAFIMTITGNIGKFGTGCHTWSGNYKAGIWNAVPWSGAGLAVHTGEDPFNLTLDPNAHGKEIKTRSYYYGEEVGYWNHGDTALIVNTPKYGRKVFTGKTHMPSPSKVRWVTNVNILNNAKHHYDMVKNVDPNIEMIVTQDIEMTSDVNHADVAFACNSWMEFTYPEMTGTVSNPWIQIWKGGIRPLYDTRNDADTFAGVAAKLAEMTGDARFRGVFHFVYMNRVDVYPQRMLDASATCYGYSADVMLKSEKGWMVMGRTYPRHPLWEETNESKPQWTRSGRIETYRIEPEAIEYGENFISHREGPECTPYLPNAIFSNNPFIRPDDYGIPITAQHHDDKHVRNIKLPWAEIKRHPNPLWEKGYQFYCVTPKTRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVFVDGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRPDGRAIAVDTGYQSNFRYGAQQSFTRNWLMPMHQTDSLPGKHTIAWKFKWGYAIDHHGINTVPKECLIRITKAEDGGIGARGPWEPVRTGFTPGQENEFMIKWLKGEHIKIKV - ->NxrA_Candidatus_K_stuttgartiensis_CAJ72445 -MKLTRRAFLQVAGATGATLTLAKNAMAFRLLKPAVVVDNPLDTYPDRRWESVYRDQYQYDRTFTYCCSPNDTHACRIRAFVRNNVMMRVEQNYDHQNYSDLYGNKATRNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKRWADDGFPELTPENKTKYMFDNRGNDELLRASWDEAFTYASKGIIHITKKYSGPEGAQKLIDQGYPKEMVDRMQGAGTRTFKGRGGMGLLGVIGKYGMYRFNNCLAIVDAHNRGVGPDQALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLLIQTGKNLIENKMPEAHWVTEVMERGGKIVVITPEYSPSAQKADYWIPIRNNTDTALFLGITKILIDNKWYDADYVKKFTDFPLLIRTDTLKRVSPKDIIPNYKLQDISDGPSYHIQGLKDEQREIIGDFVVWDAKSKGPKAITRDDVGETLVKKGIDPVLEGSFKLKTIDGKEIEVMTLLEMYKIHLRDYDIDSVVSMTNSPKDLIERLAKDIATIKPVAIHYGEGVNHYFHATLMNRSYYLPVMLTGNVGYFGSGSHTWAGNYKAGNFQASKWSGPGFYGWVAEDVFKPNLDPYASAKDLNIKGRALDEEVAYWNHSERPLIVNTPKYGRKVFTGKTHMPSPTKVLWFTNVNLINNAKHVYQMLKNVNPNIEQIMSTDIEITGSIEYADFAFPANSWVEFQEFEITNSCSNPFIQIWGKTGITPVYESKDDVKILAGMASKLGELLRDKRFEDNWKFAIEGRASVYINRLLDGSTTMKGYTCEDILNGKYGEPGVAMLLFRTYPRHPFWEQVHESLPFYTPTGRLQAYNDEPEIIEYGENFIVHREGPEATPYLPNAIVSTNPYIRPDDYGIPENAEYWEDRTVRNIKKSWEETKKTKNFLWEKGYHFYCVTPKSRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHIHPQAARDLGIEDGDYVYVDANPADRPYEGWKPNDSFYKVSRLMLRAKYNPAYPYNCTMMKHSAWISSDKTVQAHETRPDGRALSPSGYQSSFRYGSQQSITRDWSMPMHQLDSLFHKAKIGMKFIFGFEADNHCINTVPKETLVKITKAENGGMGGKGVWDPVKTGYTAGNENDFMKKFLNGELIKVDA - ->I_OP1_uncultured_candidate_division_bacterium_BAL57377 -MAVSRRRFVKATAALTGAALVTDTLGLQGFKFVPEIKNPLEFYPNRDWEKIYRDQFRYDSSFTFLCAPNDTHNCLLRAYVRNGVIVRIGPTYGYNEARDLYGNKVSARWEPRCCQKGLALGRRFYGDRRVNGVWVRKGFFDWVRAGFPRDPHTGAPPKEYFNRGQDSWLKLSFDEAYGIVAQALFNIVQTYSGPEGAARLKAQNYDPTMLEAMHEAGTQTVKVRGGMPFLGATRIYGLARFANMLALLDAHIRNVSPDQALGGRVWDSYSWHTDLPPGHPMVTGQQTVEFDLFTAENAKLITLWGMNWICTKMPDAHWLTEARQRGAKVITIATEYQATANKADEVIIIRPGTDAAFALGVASVIINEKLYDEEYVKTFTDLPLLVRMDTLKLLRASDIIRDYQPAELTNYAKVLKPDEKPGPPLAQRVQYIPERARQAWGDFVVWDSTKNAPEVITRDHVGQFFAARGIDPALEGSFTVQTTDHQEITVRPVFDLIKEYLKEFTPPKVAEMSWAPSEAIVNLARQIAANKASTLLSHGMGPNHFFNADLKDRALFLIAALTKNIGHFGGSPGSYAGNYRVALFNGLPQYIAEDPFNIELDPTKPATVKSYAKSESAHYYNYGDRPLRVGKKLFTGKTHTPTPTKFMWFANSNSLLGNSKWGYDVIHNTLPKIEAIVVNEWWWTMSCEYADVVFGVDSWGELKYPDMCGSVTNPFVQVFPRTPLPRIFDTRSDIETYMGVAEKFAELTGDARFRDYWHFVRENRVDVYLQRICDASSSLRGYKFTDLEEQARQGTPMLKLLRTYPKIVGWEQTQESKPWYTKTGRLEFYREEDEFIEYGENLPVYREPVDATPHEPNVIVAPKTLSALKPAPPEQYGLKRDDLSTETRQVRNVIKTPEEVVRSQHPRTKDGLKFIFITPKYRHGAHTTPVDLDVLAVYFGPFGDIYRRDKRSPWVGEVYADINPQDAKELGIEDGDYIWIDADPEDRPYRGAKPSDPDYKIARLMGRARYYNGTPRGVVRMWFNMYQATHGTVNAHETRPDKLAKDPQTNYQAMFRYGGHQSCTRAWLRPTLMTDSLVRKDVFGQTIGQGFAPDIHCPVGAPKESFVKITRAEPGGADLKSLWRPAQLGYRPTYESDEMKQYLAGGFIEVT - ->RBG1_10 -MTLSRRRFLKISSLSAAGALVDLPELKFLQFLETVENPLEYYPNRDWEKIYRDQYRYDSSFTFVCTPNDTHACRLRAYVRNGIVIRVEQAYDVQNYTDLYGNKASVMWSPRGCNKGYNLPRRVYGPYRVKHPMVRKGWKEWAEAGFPDPTLPENQQKYFRRGEDSWVKVSWDEGFELVAKGLLHTMEKYSGEKGAEILRKQGYPEEMIEAMHGSGAQTIKIRGAMPLLGATRIFGFYRFANMLGLYDGKLGARGWSNFSWHGDLPPGHPMVTGVKCSDPELNDFRHSKLLVFLGKNMVESKMADAHWWIETIERGGKVVNISPEYSATSSKSDYWIPIRPGTDTALLLGVTQIIIQEKLYDQDFIKKHTDLPLLIRMDNLKLLRPTDIIKGYKNQILTGYSVKVQKIKPELREKWGDFVVWDLKTKKPQTVTREDLGEKIERKGLNPALEGNYKIKLVNGKEIEVKTVFQLYKELLSEYDLETVSQITGSPKNLIYQLAQDLATIKPASIHTGEGVNHFFHCDLVTRAVWLPLALTGNIGKPGANVGHWAGNYKGEVFDGLGVYLNEDPFNPNLDPSAKLEDIKLKKYYKGEEVCYWNYEDRPLIVKGKCFTGKTHMPTPTKAEWVGNGNLLNNAKWAHNMIANVEGKVEMIVYNEIEWTASCEYADVVFPVHSWMELTLPDMTASCSNPFLQVWKGGIKPIFDTKQDNEVLAGVAAKLSELTHDNRYKDYWKFVLEGNNEVYLQRILDACSTTKGYKIDELLKSDRGWLMNFRTYPRIPFWEQIQESKPFYTKTGRMEFYREEDEFIDYGENLIVHREPVEATPYLPNVILGTHKAIRPNSYGISPESINADERQVRNLKMSWKQVKLSKNPLWEKGFRFYCLTPKSRHTVHSSWSVLDWNMIWQSNFGDPYRMDNRTPGVGEHQMHMNPLDAKELGINDGDYAYVDANPEDRPYTGWKEEDPFYKVSRLMVRVKYNPAYPRGITMIKHASFIATHKSVKAHESRPDKRAVSEDTGYQSSFRYGSQQSITRGWLQPTMMTDSLVRKNYMGQEIGEGYEIDVNAPNTCPKETLVKIIKAEDGGMGGKGKWEPARTGYTPAGENKDMKKFLEGGFILKV - ->A_Nitrobacter_hamburgensis_YP_578638 -MSWILDLVNPRERKWEEFYRNRWSHDNVFRSTHGVNCTGGCSWAIYVKDGIITWEMQQTDYPLLERSLPP -YEPRGCQRGISASWYVYSPIRVKYPYIRGPLLDMWREAKASSADPVQAWGALIGDEQKRSRIQKARGKGG -FRRAKWEELVELIAAASLHTARKHGPDRIMGFSPIPAMSMLSFAAGTRFLSLMGGSLMSFYDWYADLPTS -FPEIWGDQTDVCESADWYNSKFIVSMASNMNMTRTPDVHFISEARTEGTKFVVLSPDFSQIAKYCDEWIP -IQAGQDTALWMAANHVILKEYYVDRQVPYFVDYIKRYTDLPFLVELESNGNTYKTGRLLRSNRVPRYKDV -ENGDWKMLLLDANSGELRAPKGQVGDRWGSVHGKWNLSGEDTLDNSPLDPVLSFIDRSDDVVQVGFDDFA -NGRIVSRGVPVKRVATDKGEILCATGFDIMMSQFGISRGLEGAFATSYDDEDAPYTPAWQERHTGIGRET -AIRFAREFATNAELTNGKSMVIVGASANHWYYNNLCYRSATVALILCGCCGVNGGGINHYVGQEKLAPVA -PWATVALALDWAKPPRLVQSSTWHYAHSCQWRYEQEFTEYGLTAPNPKWAKGHAIDLEAKAVHNGWMPFT -PHFNRNPIEVAAEAERSGAKNVQDIETYVVDQVVSKKLQMAIDDPDAAENWPRMWFIWRGNAIQSSAKGH -EFFLRHYLGAHDNAIAEDRAKGKAQVVKYHETAPRGKYDLVIDLNFRMNTTSLYSDIVLPTAFWYEKNDL -NTTDLHSFLHVLGQAVPPVWESKTDWEIFKLIGKKVSELAPLAFSKPVRDVVLQPLMHDTPDELAQPEIL -DWSLGECKAVPGKSFPHVRVVERDYANLYNKFISFGPKAREDGISAVGVQIPIKKQYDQMLDNPIMPMPD -PRHMRCVEWGGKRYPSLEDVLDACNTVLLCAPEANGEVCYQAFHNEEHHVGLPLVDLAEPNRNVAATFYD -LTRQPRRIITSPCWTGMVNDGRAYSAWCMNVERLVPWRTLTGRQSLYLDHQWYLDFGEHIPTYKPRLNPR -KTGDIVKSRVDDRSLVLNYITPHGKWNIHSTYKDNHRMLMLSRGMDPVWINDRDAEKVGIEDNDWVEVYN -DNGVVVTRANVSRRIQPGTCMYYHAVERTVYIPKSQERKWRGGGHNSLTRTRINPLFLAGGYAQFTYGWN -YWGPTGILTRDTHVVVRKMEKLEW - ->B_Nitrobacter_hamburgensis_YP_578186 -MTTGLAAGQRTEETQMSWILDLVNPRERKWEEFYRNRWSHDNVFRSTHGVNCTGGCSWAIYVKDGIITWE -MQQTDYPLLERSLPPYEPRGCQRGISASWYVYSPIRIKYPYVRGPLLDMWREAKASSADPVQAWGALVGD -EQKRARMQKARGKGGYRRAKWEELVELIAAASLHTARKHGPDRIMGFSPIPAMSMLSFAAGTRFLSLMGG -SLLSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMASNLNMTRTPDVHFIAEARTEGTKFVVLS -PDFSQIAKYCDEWIPIQAGQDTALWMAANHVILKEYYVDRQVPYFIDYVKRYTDLPFLVELEPNGTTYKT -GRLLRARHVPRYKDVENGDWKMLLLDANSGELRAPKGQVGDRWGSVHGKWNLSGEDTLDNSPLDPVLSFI -DRSDDVVQVGFDDFANGRIVSRGVPVRRIATDKGEILCATGFDIMMSQFGISRGLEGAFATSYDDEDAPY -TPAWQERHTGIGRETAIRFAREFATTAEYTNGKSMVIVGASANHWYYNNLCYRSATVALILCGCCGVNGG -GINHYVGQEKLAPVAPWASIALALDWSKPPRVVQSSTWHYAHSCQWRYEQEFTEYGLTAPNPRWAKGHAI -DLEAKAVRSGWMPFTPHFNRNPIEVAAEAERAGAKSTEDIATHVIDQVASKKLNLAIEDPDAAENWPRLW -FIWRGNAIQSSAKGHEFFLRHYLGTHDNAIAEDRAKGKTHTVKYHDTAPRGKYDLVVDLNFRMDTSSLYS -DIVLPTAFWYEKNDLNTTDLHSFLHVLGQAVPPVWESKTDWDIFKLIAKKVSELAPLAFSKPVRDVVLQP -LMHDTPDELAQPEILDWAEGECKPVPGKSFPHVRVVERDYANLYNKFISFGPKAREDGVSAVGVNVPIKK -QYDQMLDNPIMPMPDPRHMRCVEWGGKRYPSLEDVLDGCNTVLLCAPEANGEVCYQAFHNEEHHVGLPLV -DLAEPTRNVATTFYDLTRQPRRLLTSPCWTGMMNDGRAYSAWCMNVERLVPWRTLTGRQTLYIDHQWYLD -FGEHIPTYKPRLNPRKTGDIVKSRVDDRSLVLNYITPHGKWNIHSTYKDNHRMLMLSRGMDPVWINDRDA -EKVGIEDNDWVEVYNDNGVVVTRANVSRRIQPGTCMYYHAVERTVYIPKSQERKWRGGGHNSLTRTRINP -LFLAGGYAQFTYGWNYWGPTGILTRDTHVVVRKMEKLEW - ->Nitrobacter_winogradskyi_gb_ABA05326 -MSWILDLVNPRERKWEEFYRNRWSHDNVFRSTHGVNCTGGCSWAIYVKDGIITWEMQQTDYPLLERSLPP -YEPRGCQRGISASWYVYSPIRVKYPYIRGPLADLWHEAKASYPDPVQAWASLVEDEEKRNRIQKARGKGG -FRRAKWEELIELIAASCLYTARKHGPDRVMGFSPIPAMSMLSFAAGTRFLSLFGGGLMSFYDWYADLPTS -FPEIWGDQTDVCESADWYNSKFIVSMASNMNMTRTPDVHFISEARTEGTKFVVLSPDFSQIAKYCDEWIP -IQAGQDTALWMAANHVILKEYYIDRQVPYFIDYVKRYTDLPFLVELEPNGNTYKTGRLLRSNRVARYKDV -ENGEWKMLVLDTATGEPRAFKGQVGDRWGSTHGKWNLSAEDTLDNSPIDPVLSFIDQSDGVVQVGFDDFV -NGSVVSRGVPVKRIATDKGEVLVTTGFDIMMSQFGHSRGLEGSFATSYDDEDAPYTPAWQERHTGIGRET -AIRFAREFATNAELTNGKSMVIVGASANHWYYNNLCYRSATVALILCGCCGVNGGGINHYVGQEKLAPVA -PWSTVAMALDWNKPPRVVQSSTWHYAHSCQWRYEQEFTEYGLTAPNPRWAKGHAIDLEAKSVRCGWMPFT -PNFHRNPIEVVAEAERAGAKSTADIATYVADQVASKKLDLAINDPDAEENWPRVWFIWRANAIQSSAKGH -EFFLRHYLGAHDNVIAEERAKGKTTTVKYRDTAPQGKYDLVVDINFRMNTTGLYSDIILPTAFWYEKNDL -NTTDLHSFLHVLGQAVPPVWESKTDWEIFKLIAKKVSELSPLAFSKPVRDIVLQPLMHDTPDELAQPEIL -DWAEGECKLVPGKSFPHVRVVERDYANLYNKFISFGPKAREDGISAVGVNIPIKKQYDQMLENPIMPMPD -SRHMRCVEWGGKRYPSLEDVLDACNVVLLCAPVANGEVSYQGFVNEEQHVGLPLADIAEPTRGVSSTFYD -LTRQPRRILTSPCWTGLVNDGRAYSAWCMNIERLVPWRTLTGRQSLYLDHQWYLDFGEHIPTYKPRLNPR -KTGDIVKSRVDDRSLVLNYITPHGKWNIHSTYKDNHRLLMLSRGMDPVWINDRDAEKVGIEDNDWVEVYN -DNGVVVTRANVSRRIQPGTCMYYHAVERTVYIPKSQERKWRGGGHNSLTRIRINPLFLAGGYAQFTYGWN -YWGPTGIFTRDTHVVVRKMEKVEW - ->Nitrobacter_sp_Nb_311A_ZP_01048070 -MSWILDLVNPRERKWEEFYRNRWSHDNVFRSTHGVNCTGGCSWAIYVKDGIITWEMQQTDYPLLERSLPP -YEPRGCQRGISASWYVYSPIRVKYPYIRGPLYDLWREAKASHPDPVQAWASLVGDEQKRLRMQKARGKGG -FRRAKWEELVELIAAAALYTARKWGPDRVMGFSPIPAMSMLSYAAGSRFLQLFGGVNMSFYDWYADLPTS -FPEIWGDQTDVCESADWYNSKFIVSMAANMNMTRTPDVHFIAEARTEGTKFVVLSPDFSQIAKYCDEWIP -IQAGQDTALWMAANHVILKEYYIDRQVPYFIDYVKRYTDLPFLVELEPNGNTYKTGRLLRAKRVARYQDV -ENGDWKMLVLDSKTGEPRAFKGQVGDRWGSTHGKWNLSAEDTLDNSPIDPVLSFIDQSDGVVQVGFDDFV -NGSVVSRGVPVKRIATDKGEVLVTTGFDIMMSQFGHSRGLEGSFATSYDDENAPYTPAWQERHTGIGRET -AIRFAREFATNAELTNGKSMVIVGASANHWYYNNLCYRSATVALILCGCCGVNGGGINHYVGQEKLAPVA -PWNTIAMALDWTKPPRVVQSSTWHYAHSCQWRYEQEFTEYGLTAPNPRWAKGHAIDLQAKAVRSGWMPFT -PHFNRNPIELAAEAERAGAKSTDDIVTHVVDQVASKKVNFAIDDPDAEESWPRMWFIWRGNAIQSSAKGH -EFFLRHYLGAHDNSIAEDRAKGKTQRVKYRDTAPRGKYDLVVDLNFRMNTTSLYSDIVLPTAFWYEKNDL -NTTDLHSFLHVLGQAVPPVWESKTDWEIFKLIAKKVSELSPLAFSKPVRDVVVQPLMHDTPDELAQPEIL -DWAEGECKPVPGKSFPHVRVVERDYANLYNKFISFGPKAREDGVSAVGVQIPIKKQYDQMLDNPIMPMPD -PRHMRCVEWGGKRYPSLEDVLDACNTLLMCAPEANGEVCYQGFHNEEHHVGLPLVDIAEPTRGVSSTFYD -LTRQPRRILTSPCWTGMTNDGRAYSAWCMNVERLVPWRTLTGRQTLYIDSQWYLDFGEHIPTYKPRLNPR -KTGDIVKSRVDDRSLVLNYITPHGKWNIHSTYKDNHRMLMLSRGMDPVWINDRDAEKVGIEDNDWVEVYN -DNGVVVTRANVSRRIQPGTCMYYHAVERTVYIPKSQERKWRGGGHNSLTRTRINPLFLAGGYAQFTYGFN -YWGPTGIFTRDTHVVVRKMEKLEW - ->Nitrococcus_mobi_EAR23355 -MGWIQDLINPKTRRWEEFYRNRWQHDNIFRSTHGVNCTGGCSWAIYVKDGIITWEMQQTDYPLLGRGEGGRGIPPYEPRGCQRGISASWYVYSPIRVKYPYGKGVLLDFWREARSSHNNPVEAWSSIVTDENKRKRWQKARGKGGYRRTTWDELLELIASACLYTAQKYGPDRVMGFSPIPAMSMLSYAAGSRFLQLFGGVNMSFYDWYADLPNSFPEIWGDQTDVCESADWYNSKFIVSMASNLNMTRTPDVHFISEARHEGAKFVVLAPDFSQVSKYADWWIPVKKGEDLGLWMAAGHVIYTEFYVKRQVPYFIDYVTRYTDMPFLVKLEKDGDGYRPGRYLTSEEVKKYKKQENAAWKQLVFDRKSNEARCPKGQIGHRHGKHGQWNLKMEDGLDNSPIEPVLSFLGESDDVAMVQFYEFASQTVYKRGVPAKKIDTGSGSVLVATVYDLNMGQYAVNRGLPGDYPESYDDLKPYTPAWQEQFSGIGRQTVIRFAREFAGTAEKTKGRSMVIVGASANHWYHNNHIYRAAINCLIACGCCGRNGGGMNHYVGQEKLAIVAPWNALALAGDWGIKPRLQQSPVWHYVNSDSWRYEGSFEEYAPSPPNAKWAKGHSVDLVAKSVRMGWMPHYPQFNRSPLEVAREAEKAGAKDDKGMADYVVQALKKKNLSFSVDDPDAPENWPRVWFIWRGNAMQSSAKGAEFFLRHYLGTHDNAVAEERAKPHVKHVKFREPAPRGKFDLVVDINFRMDSTALYSDIVLPTAFWYEKNDLNSTDLHSFIHPLGQAVPPVWESKSDWDIFKAFAKKISEMAPSVFSEPFKDVVAAPLTHDTPDEIAQRDVKDWLEGECEPIPGKTMPHFRVVERDYSLLYNKYISLGSAIRENGISGNGCSFPITKQYDELTNQPVGGSPDPRHRRAVEWGGKRYPCVEDALDAANVLLYLAPETNGEVAYQAFKSEQEHCGVPLTDLAEPYRGHQVTFYDLTRQPRRLLCSPVWTGNCGDGRAYSAWTLQIDRLVPFRTLTGRQHIYIDHPWYMDFGEHLCTYRPKLDYKKIHDLDNSPIDDKTLILNYITPHGKWNIHSTYKDNHRMLTLSRGMDPVWINDKDAARVGLKDNDWVEVYNDNGVIVTRANVSRRVQSGMCLYYHAVERTIYIPKSQIRGGRRAGGHNSVTRTRINPVYLAGGNAQFTYLFNYWGPTGIMTRDTHVAVRKLEKLEW - ->Beggiatoa_sp_PS_ZP_02000390 -MAVTGAGAAVISQQAISATQLLTPVAIDNPLSNYPNRDWEKTYRDLYHYDSSFTFLCAPNDTHNCLLRGY -VKNGVVTRIAPTYGYQKAKDLDGNQSTQRWDPRCCQKGLALVRRFYGDRRCKRPMIRKGFKDWVEAGFPR -LPETGAVDQKYLQRGRDSWVGASWDEAFELAGKALTNIAQTYTGEEGQKKLLAQGYDPLMVEATEGAGTQ -VLKFRGGMPPLGMTRVFAQYREANAMALLDDKIRGKGTDSLGGRGFDNYSWHTDLPPGHPMVTGQQTVDF -DLCNVERTNLLIVWGMNWITTKMPDSHWMTEARMKGTKVVVIAAEYSATSSKADEVFVVRPGTTPALALG -IAQVLISENLYDAPYVKANTDLPLLVRMDTAEMLRAGDVFKDYQLAKLENNTLVVPTGEKGPPMHQQKGP -ILDEKQRADWGDFVYWDASESKPVAMNHDQVGKHFSGNPQLTGEFAVPLASGETVQCRTVFDVTKEMLDG -SYTPEDVAKLTWTSADGIRGLARQIAANQSNTLFTVGMGPNQFFNSDLKDRNIFLVAALTQNIGKIGGNV -GSYAGNYRASFFNGLAQFIGEDPFNPELDPTKPAKLRKRWKAESVHYFNHGDTILRMGKAVLTGKTHIPT -PTKAFHVSNSNSLIGNVKGHYDFVINTLSRVEFIAQNEWWWTASCEYADIVFAVDSWAELKYPDMTISVT -NPFLYTFPATPLPRIHDTRSDLEVAAGICGAIGKVTNDSRHKDYWHFINKGEVRPHIQRVLDHSNATRGY -KIEDLEKLANEGIPAILQTRTYPKVGAWEQGNENKPWYTKTGRLEFYREEPEFRDSGENIVVHREPIDST -RFEPNVIVAKSHPLLRPKTPEDYGVPSSDMSGDTRQARHVVKTVDEVLNSEHPLHKEGYDFVFHTPKYRH -GAHTTAVDTDIVAAWFGPFGDMLRRDRRMPFVAEAYVDINPDDAKGLGIEDGDYVYIDADPHDRPFKGWQ -KYPEGYKVARLLVRARYYPGTPRGVTRMWHNMFGATFSSVRGQETNPTGLAKSPETGYQSLYRGGSHQSC -TRGWLKPTWMTDSLYVKGLMGQKITQGFVPDVHCPTGAPREALVRIIKAENGGIDGKGLWSPAARGLRPT -YENDILKQFMAGKFVELA - ->Hydrogenobaculum_sp_Y04AAS1_YP_002121006 -MISRRDFLKNGSVFLAALSTPGFGKKLFEPLVIVGNPLASYPNRGWEKIYRDIYKPDETTVILCNPNDTHGCYLNAYVKNGIITRLEPTYKYGDATDIYGIKASHRWEPRCCNKGLALVRRFYGDRRIRGPFVRKGYYEWYKADFPRDENGKPPSKYFINRGKDEWLKVSWEEVSDIIAKSLINIAKTYSGEKGKAYLKAQGYPEEMIDTMAGAGTRTLKFRGSMPWLAVLRYVGQYRMSNMMALLDSNIRKVEPDKALGGVGWDNYSEHTDLPPAHTLVTGQQTVDFDLVTWEHAKLIVLWGMNPYGTKMPDSHWLTEAQIKGIKVIVISNDFMATARTADKVVITRTATDGALALSMAYVIMKEKLYDENFVKSFTDLPLLVRMDNAKLLRASDIIPNYIPKALNQAVVYNPSKQMPPPPMKQEKQYIPIQLRDQDINDFVVWDVKTNSPKVVTRDEVGKYFDMSSLDPALTGEYEVELVNGEKVKVKPNFQAYIELLEENYTPETVEEITGVPANVIRELALEIANHKGTTKITTGMGVNQYFHGDLIVRAIFLVAALTGNVGRESGNIGSYAGNYRLAVFNGVGQWNAEDPFNIELDPSKLAKVKFYWKGESQHYFADGDRPLKVGDKMLTGKTHMPVPTKFMWMADNNSGLGNQKWAYNVMFNVLPNVECVVTNDWWWSLSCEYSDIILGVDAWDENRFWDISGSCTNPFFLVWPRTKQKRLFDTKNDIETYALVAKRLSELTGDKRFKEYWHFVFEEKPEVYIQRIINASSNLKGYKIEEVAAKAEQGIPSLVMTRFYPKFIGYDQTVDGKPWYTKTGRLEFYREEDTFINVGENLIVHREAIDSTPYEPNTIVIAKKHPLLRPLDPKSYGLSSEEMLKDTELRQARAVFISPAKLKDTKHPLRVSFGATHIVHTPKFRHTTHSATGDVDIVALLFGPYGDMYRHDKRTPYVVDAFIEINTHDLQKLGINDGDYVWVDADPQDRPFIGWQNKPEEYEVARLLLRVRGSFSTPPGLAKIWFNMYGSSHGSVKGTKVNKNGLAENPVTGYQSFYRRGSQQSVTRGWLNPTLMGDTLVRKDLFGQTLNKGFMLDVYCPTGAPREGFAKITKAENGGIGNVGLWRPLSIGFRPQNPNKYFKKYLEAGYVIFV - ->Hydrogenobacter_thermophilus_YP_003433365 -MSDLTRRDLLKMGGLSLTAMLSPSFAFRVMEPVVRVENPLAYYPNRDWERFYRDIFKSEATFTFLCAPNDTHNCLLTAHVKNGVITRIEPTYKFGEATDIYGLKASHRWDPRCCNKGLALMRRFYGDRRVKGPMVRRGFYEWYKAGFPRDPITGKPLEKYFQRGKDKFIKVTWDEVADIIAKTLINIATTYSGEEGRKRLEAQGHYPKPMLDAMEGAGTRVLKFRGSMPFLAVVRYTSPYRFANMMALLDSHIRGVGPDKALGGRGWDNYAFHTDLAPGHPMVSGQQNVEFDLCMWEHSKLIILWGMNPFTTKMPDCHWLTEARIKGSKVIVISNDYSPTARASDELIVVRTGTDTALALSIAYVIMKEKLYQERFVKSFTDMPLLVRMDNGKVLRARDIIPNYQPQPLQKAVVFKPGETLPPFYKQDKQYIPEPIRKGDMDDFVVWDTKSNSPKVITRDHVGEDFWKLGIDPALYGTYRVKTVEGKEVEVKPLFQVYLEFFEKSYTPKQAEVITGVPAKKIEKLAREIASHPRNMKLAQGMGVNQYQHADLKDRAMYMICALTDNIGHATGNIGSYAGNFRLALFNGAPQYLAEDPFNIELDPEKPAKVKFYWKPESAHYYSHDDHPQYMGEHLITGKTHMPTPTKFVWFVDANSALGNAKWQYNIIMNTLPKIECIVTNEWWWSMTCEYSDIVLGVDAWNENKYWDIAGSVTNPFVYVWPKTGHRRFFDTKNDAEAFAIVANRLSELTGDERFRNYWKFVLEGKQDVVYVQRVINASSNLRGYRLEEIAKKAHEGIPSLIMTRSYPKYVGEDQTKEGMPWYTKSGRLEFYREEPEFMDAGENLPVYREPIDSTHHEPNVIVARPHPLLRPKKPEDYGLSAKDALLSTEWRQARNVLVSPEKLPNTKHPLMVTVGATHIVHTPKYRHSAHTTTGDTDIIVLLFGPFGDIYRHDKRMPFVSEAYIDINPKDLKKMGIQDGDYVWVDADPQDRPFAGWQKRPEDYEVGRLLLRARASNNTPPGCAKIWFNMYGSSHGSVRGTKENPNGLAKNPNTGYQSLYRRGSHQSITRGWFKPTYQTDTLVRKNLMGQIIGKGFELDVHGLIGAPREGFCKIAKAEDGGIGGKGVWRPVRLGYRPMTANEMLKKYLKGEYVK - ->Natrinema_pellirubrum_YP_007282293 -MANRDRSVDSANERSAEGTSVSRRTLLGGAGAAGVAGFAGCLRLFTDDGEGNGNGTSTASKLNPLTEYPNREWESHYRDVWDVDDTYYLACRPNDTHNCYLEANVKNGVVTRLGPSMNYGEAEDLYGNQASDRWDPRVCQKGLSMVERFYGERRVTSPMIRQGFKDWVDEGFPREEDGSMPEEYAKRGEDSWYEASWDEAYEYAAKTFLELADHYSGADAQELLLEQGYDDRVVEEMQGVGTRTMKFRGGMPMLSTIGLFGEYRFANSMALVDHHVRDVGEDEALGGVGGDNYTFHTDLPPGHPMVTGQQTVDFDLANVEYADNIVLAGINWMCTKMADSHWLTEARMNGANVTGIFTDYNATSSKCDELVIIRPATDSALFLGVAQQIIATDGYDAEFVRSNTDLPLLVRMDTGDHLRASDVFEDYDPADLERTQVAPADEHPAPTTVDTADQWITPDQREDWDDFVVYDDAAGGVRAVDREAVGEEFDVDAALEGSWELELADGDIVEVRPVFDLVKEYLDTTWDPESTAEVTGTEPEAVTNLAEQFADNKESTLLLTGMGPNQYFNGDLKDRAAFLVASLTSNVGTHSGNVGSYAGNYRAAMLNGIPHYHLEDPFDPELDPDADSRVDSRITMESMHFYSNLDKPLKIEGEYHMGDSHMNTPTKSLWVAGSNSILGNAKGSYKIIEGLLRTGKLEAFFCNEWWWTMTCEYSDIVFPADSWAEQNVHDLTASVTNPFLMVFPETGIDRVYDTRHDCQIYQGVAEKLAEKLDEPRLEQMWEFIDEDEYRGKPYVQRILDNSNMTKGYDAETLIEKAERGEPALMMSTTYPKKIGTRQANDDEPWYTKTGRLEFLREEETWTEVGETLPVHREAVDGTIYKPNVIVDDGDHPLIDPETPDDLGWDDDNIEDASARQVRNEVVSTDALVNSSHPLQDVDPGFKYSFMTPKYRHGAHTFCNALPNIAVWWGPFGDRDRKDDRKPYFGEGYVEMNPEDAKEEGFEDGDYVWVDADPNDRPYPSANGDPDEYSRALMRVRYQPAMPRGVTRSWHNLNQASHGTTEATPDRTGMAKNEETDYVSLYRRGGHQSMTRSWLRPTILTDEMNRKGLMGQSIGKGFAPDVHCANGAPRESFVKFEKEGDAGEDGEGLWRPAEMGLRPGYETETMQRYLDGDFTSTEGD - ->NxrA_planctomycete_KSU_1_ZP_10101005 -MKLTRRTFLQVTGATGATFTLANKAMAFRLLKPAVEVGNPLDAYPDRAWESVYREQYRYDRTFTYCCSPNDTHACRVRAF -VRNEVLMRVEQNYDHQNYADLYGNKATRNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQWADDGFPELTPENKSKYM -FDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGARKLLDQGYPKEMVDAMKGAGTRTFKGRGGMGLLGVIGKYGMY -RFNNSLALVDSHNRGVGPDKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLVIQTGKNLIENKMPEAHWL -TQVFERGGKLVVITPEYSPSAQKADYWIPIKCNTDTALFLGITRILMDEKLYDADYVKKFTDFPLLVRTDTLKRLQAKDI -FPDYKLEDISHGASYKIHGLHDDQREIIGDFVVWDAKTKSPKAITRDDVGDKLVAKGIDPALDGTFKVKTVDGKEIEVMP -LFEMYKIHLKDYDIDSVVEMTNSPKELIVRLAHDIATIKPVAIHYGEGINHWFHATLFNRSTYLPLMLTGNIGYPGSGSH -TWSGNYKAGNFQASKWSGPGFYGWVAEDVFNPNLDPDAPAMDLKVKGRAYDEEVAYWNHNDRPLIVDTPKYGRKCFTGKT -HMPTPTKIMWFTNVNLVNNAKHVYQMLKNVNPNIEQIMSNDIEMTGSIEYADFAFPANSWAEFETHEITTSCSNPFIQIW -KGGIKPVNDSKDDVMILAGMAAKLGELLRDMRFHDVWKFALEGRPEVYIQRLLDGSTTTKGYSFVDIINGKYGEPGVALL -LYRTYPRHPFWEQVHESIPFYTPTGRLQGYNDESEIIEYGENFIVHREGPEATQYLPNVIVSTNPYIRPDDYGIPEDAEH -WDERTVRNIKKSWAETKKTKNFLWEKGYKFYCVTPKSRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHMNP -EAAKDLGINDGDYVYVDANPADRPYEGWKPSDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHETRPDGRA -LSAGTGYQSSFRYGSQQSITRNWSMPMHQLDNLFHKSKTSMKFVFGYEADNHGINTTPKETLVKITKAEDGGIGGKGLWD -PAKTGYTAGNENDFMKKYLNGELIKVEKA - ->ACTB1_Sideroxydans_lithotrophicus_ES_1_YP_003523268 -MMTENDFNRRDFLKVLGWGGTAVALSGCGNTSIQDGQETVTSYVELPSYVIPSISNYFNSTCAQCDAGCN -IMGRVREGRVLKAEGNPNSPINRGKMCGLGQSGVQAHYNPDRVRQPLLKGEAITWDKALGVIAQNLSAVK -GAEVAFLTGGMSGHVQALLGNYMDALGSKNHFSYEAISPAVLRAANKKAYGVSMPRYRIDKAKVVVSFGA -DFLGAWVSPVHFTQQYAQFRKGNRPEGRGVLVQIEPKMTLTGANADRWIAVRPGTEGVLALGIINALGKA -GLSIPADIAAVSNAYTAERVSGETDVSAEQIGKLAALLKERTPSLVLAGGAVEGYAHGSQNATAIALLNR -VLGNVGKTVEATASVPFPQIAPTVGNRSSLIGLNDGLAAGKYKVVFSYGVNPVFSAPASLKFRDNFAKAE -FKVAFAQYMDETALAADLVLPLDSAMEDWGTVVPEYMAAPAEDHSAAYAQMSFRQPLMQKVFPDTRGVGD -ILLALLKQREADKYKEFEDFYSYLRSAVLKNKVALGGKATDDDETFWDNTLSQGIVPFKGIANPVSAKAS -AAGLKLPSAVTADSSYPLRLIPAVSASMRDGRNANEPWLQESPDPLTTIVWDSWVEINPKTAAKLGIVEG -DIVEVASKSGSIRTQAYLFPGIHPDAVSVPVGYGHEAMGRYAKGVGANVFGMLDTVFDKETGELALNETS -VKISKVGQRVIIVKEEGPVGGSQDGKKKIAVQVSADKVDLSKEV - ->ACTB1_Gallionella_capsiferriformans_ES_2_YP_003846257 -MIDSGSVKQMAGHPFDRRDFLKVLGWSGAAVALSGCGNTSVEDGRETVVSYVEANDYMVPGIGVYFNSTC -AQCDAGCSVNGRVREGRVLKLEGNPDSAINKGKLCGLGQAGVQHHYNPDRVREPLLRNGNKGEAISWDKA -YALIAEKLAGVQGEEIAFLSGGVSGHLKVLLGNYLDSLGTKNHFVYEAIAPSVVRAANVKAFGVEMPRYR -FDKAQVVLSFGADFLGSWVSPVHFSQQYAQFRKGVNGQRGVLIQVESKMTLTGANADRWLAVKPGTEGVL -ALGIINALGMATGDVAELVKGYDKARVSRETGVSTGQIDKIAALLKLRSPSLVLAGSAAEGYAHGSQNAA -AINLLNQVLGNVGKTIEAPVSVPFPQMAPSKGNTVALKNLNDGLAAGKYKVVFNFAANPVFTAPGAFKFK -DNFAKAGFKVAFAHYLDETALQADLVLPLDSALEDWGTQVPEYLTEGAQINIQQPLMERLHADTRGMGDI -LLSLIKQKKADEYKGFEDYYAYLRGAVLQNKGALGGGGVEDDTFWNDTLTNGIVKLAGTTTSLAAHASAA -GLLLPAEAEADEHFPLHLIPGVTASLRDGRHTNQPWLQESPDPLTTIVWDSWVEIHPKKAAELGIVEGDI -VEVTSKTGSVKAQVYLFPGIHPEAISIPVGRGHDAMGRYAKGYGVNPFQIMDAVFEAATGELAMHETRVK -ISKTGQRVLVVKDEGAAGALQMGRKIAARVSTDQVDLSKEV - ->QrcB_Desulfatibacillum_alkenivorans_YP_002430439 -MKLNRRNFLLVSTAGAAGGAVGSMFSPLSWKLMDDSSIWTQNWPWTPVPADGEVSFEETTCTLCPGGCRV -KVRKVDERPIKLEGVEGGPVNDGGICILGLTALQLLFGPARVHTPMKRAGKRGEGKWVEITWEEAISEVS -GKLAEIRETGRAQDLGCIAGGGKGVINALFSRFMEAYGSPNFYWQATAWDCYEENILRTLGLNGTAGFDL -ENADYILSFGAGLLDGWGSPVHVFQAHSKWRENHDGHATLVQIDAQLSNTAAKADKWLPIVPGTEGAVAM -AMAHVIISKNLYNRGYVNWNTTGFRDFYRTVESEYAPAKVVKIACPVDNKEYQKKWLEELESRAIAFAKA -DKPLAVAGKGNGDRPVSQAELNAVQALNALVGAINRKEGGMVVLPDEPKYPWKPVVMDAEARSYKPSLVS -VRGRSKYGHSNLVSVLPQALNSSHEGLKVLLLAGSNPLYTLADTEKTAEALQKVEYIVSFSSQFNDTTAY -ADIILPDHIFLESTVDAPTPPGFAKPVYGLAEPVIKPVYKTKAMGDSIIEIAKAMGGTIAQSFPWADSAE -AIEQALGGKWPLLKRGGVYVNEDFTPETEGVRFRFFARSGMESRISIQGKAEQYPLIATPVDCIRLATGA -LADTPFMVKTVSDKKLKHKELVVQVNAMTAQQYGFKEGSEAVLETPVAKAKVRVHCSEEIAPGLVGVPRG -LGHIAHDEFVGGKGTNYNTLISPVQDPATGFDVAWGIRAKLT - ->Gemmatimonas_aurantiaca_YP_002761548 -MIAPSATTDHRPSTTMTTEAGTGVKRREFLKILGATGATTAVVGCSSEKVGKLIPYVTSPDNTVPGVSQY -YATSCRECAAACGVLAEVRDGRPIKLEGNPEHPLNRGAICATGLAGIQGVYNPDRYRSPMVREGNALKPT -TWDKAYELLAQKLGEVKSKGQAGNVVFVNQHETGTFPGFLDQWLSAQGMPAHLSVDSTAPIATIAANQKA -YGAAWPALNFSAAKLVISFGADFLDGWGHSVPQQLDWADARSKLDVAPRLVYIGARRSLTGLNADQWIAA -KAGSEMAICAALTGTGSAAAAAEAANVPVATIEALVKAVADAGNGIMALCGVTGNDAVECGVMVAEINKK -GGAVGTTINTAKAHGSYTGLASYADLAAAVKNMDAGTVPLAFVRGANPAHTMPKSAGFAAAFAKVAFKVS -FSSMPDETAQLADLVLPDNHWLESWGDAVGENGQISLQQPTLDPVFDTRATADVLIDLAKKDQTLAARYN -VANFRSWYISQFPGGASAFATALTKASVSGAPLVATSTRTLATTALPVAEGAGEFFVQVYPSSTLGDGAG -ANKPWLQELPDPVTKIAWQSWIEVHPSTAKKLGIKEGSHLTIETAAGKVTAPAYIYMGVRTDTVAIALGQ -GHTAYGRFAQNIGVNAYDLVSHGWDSAGSLAIGSVKGKVTVSADSSPLVTTEGSARQHGRGIAQAMTLAA - ->ACTB1_Cytophaga_hutchinsonii_YP_678817 -MKDNNKVFWKGVEELGNSPEFVKNAQNEFPEFLPLKNSSEESNGTDRRDFLKLLGFSVAAVSLAACEAPV -KKAIPYLNKPEEIEPGIANYYASTFVDGGEYCSVLVKTREGRPIKIEGNKLSSVTKGGTNGRVQASVLSL -YDTARIQGPLIKGAAATWADLDKQVGVQLGAIAATGGNIRIVSPTILSPTTKKAIAAFKAKYPSTEHVQY -DANSSYGILKANQTSFGQAVIPSYDFSKAEVIVGFGADFLGTWISPIEFVSQYADTRRLSKTKKTMSQHF -QFETALSLTGSNADYRQPIKPSQEGLFIAELYNKIVSSKVSTTPVKNDVLDKAAAALLKASNRGKSLVVS -GSNDVNVQILVNEINLALGNYGTTISLATPSFQKQGNDEAMNTFINDAVAGKVNAVIFYGSNPVFDHARG -AELAKALSSVSLTVSFADRVDETAALTKFVAPDHHYLEAWGDAEPRAGFYSLGQPSISPIFKTRAAQESL -LLWSGNSGDYYEFLKSNWISSILGGASWDQALQDGVFEPKNKSGVEVTASSFDRSAVEAGIIKNYPANTS -GIELKLYEKIGLGTGSQANNPWLQELPDPISKATWDNYVAVSASYAKANALEQGDRVAVKSANYSVELPV -LIQPGQAGNTVSIAIGYGRTHVGKCGDGVGKNVYPFARFVDGSVLDFVTGVSVTKLGGDKYPIAQTQTHH - ->ACTB1_Leptospira_interrogans_serovar_NP_713447 -MDQKNFQKEKKAHWLSYDLKDKDEEVKEMQKSEFFTSPDPLIARIKSGEFDRKSFLKLMGAGVAMTSLNC -IRKPVEKIVPYVDLNKTDENSQYDFVKHGHSYYYTSVVAGTGVLIKARDGRPLKLEGNPDHPVSQGALSA -AGQASIFDLYDPDRAQNPATIEGGIEVKSDWATVDAKVKSALAANKGKTVVVTKLLDSPSTQSIIGDFLR -TVGGGKHYEISLTSAEEVVSKGQAASYGKAIVPNYHFDLANVILSIDCDFMGNWLSGEEHQKDFSKRRNL -RPNGSLKQNNLADVNLFIAAESVPTMTGSNADLRLAIRPGDQTKLALAIAAALGELGANTKDALNGATLS -ALVSELGVSEENIRKTAKALWSNKGRSLVVAGSLAATTKDAVDLQILVNLLNSVLENDGKTVDHSNPKKE -GLADSSGNLKSLAAELKQGKVGVLFVNDVNLVYQAGEEWKNLLHQAALVVSLSDRADETALSSNVLATTT -HFLESWGDAEVTKGIFSIQQPAIRPLFNSRSFEDSLIAFAGGSLGGEASFYEYVKNSWIKKLGSKRNWED -LLRTGTTVTASERKKVAGPSRNFNRSSIKKIESSSTGLKLSLFETIAIGDGKAANNAHLQELPDPVTKLT -WDNCILLSPALAKEKGISSNDVLVLKTAKQTIELPAQIQPGMHKDAIAIAVGYGRTAAGAVGTGVGKNAY - ->ACTB1_Bdellovibrio_bacteriovorus_NP_96849 -MKKALRPKVERDTKYWNSLEQWSNDPEFNKIASTEFQSSPLRESDDEGGWARREFLKLMGASLAMASAGC -IRRPVQKIVPYNKQPEEVTLGMANYYTSAYFDGSDALGVLVKTREGRPIKIEANPGHPFSISGLSIRSQA -SLLSMYDPERLKGPQRNLFNEKKSNSQVIDVKWEDLDKKVAEQLKKGDVVILSGNVASPATRAVIGDFAQ -GFKAKHVVWEALSNDDVREGQKASYGDDVVPAFRFDKAKMIVSIDADFLGTWISPTAFTNQFVEGRKDIK -NMNRLVSFDSNYSLTGANADIRMKIKPSQQLDVVMGLLHEIIVKKGASSHAGNSAVKAALAPFADVAKKL -NVEPALFAKVAADLWANQGTSLVVAGGITTLTEKSKELQVAVNFLNSILGNDGKTVDHNGGNKGDKASQA -DMAALIKDMKDGKVKTLIIHRVNPGFVLGADMGFAEAIKKVDLVVYTGDRIDETGVFADYITPDNHALES -WSDMELASGVYSICQPSIRPMYDTRSFQLSLMTWAYLANMGPSRLRDYETFYDYLRVFWKSDIFPKYGKG -QSFEDFWQTALQKGYVGEINSGSSSRSFKVDAFTSIKPAAAKEGFELALYSTSQHGDGSLANVSWLHELP -DPVTKAVWDNYVMVSLATAEKHGLKQATVVELTVGGKTLELPVLIQPGLHDDVLAVAVGFGRTRAGKVGN - ->ACTB1_Gluconacetobacter_diazotrophicus_YP_001602862 -MPSLDGLPGDEREWIGRFPHLEQALAHPLDRRRTLKLMALALAGGGLAGCDPGTPDRGFVSAVRAAPGVI -PGVPNVYASAHVRDGYANGILVTHQMGRPTKVEGNPGHPSSLGATDVFAQAAIQDFYDPDRASGPLHDGM -PAAWQEVTTALQVLRAAPNGGVPQGASGLRILTGTVTSPTLGAAIDALLAAYPGAIWHRWDAIGRDTVRQ -GAELAYGRPAMVIPDLRQVDVALAVDSDLLDSAPGHLRHARAFAGRRNPVQGPMNRLYAVEPTPSLTGVA -ADHRFITAPAACDEIIGRLAAAVLRNEAPSGGPDWLGAVVADLRAHPGRALIHLGPDHGAQAQAAVHAMN -EALGGRGRAFDVFDAPDHRPARPTSTLPALMDDMENGRVRALLILDVNPVYQVPRFAAALPRVPLSVALA -DRPHETAQAARWHVPLAHGFEEWGDARADDGTATILQPQAMPLYGGVSAATILHLCAGDVARPARDLVRQ -TWRQHLPSERDWRAALAAGVVPGTASARLDTPLAPVMPPAPPPAPPVDLTLLLRPDPHLWDGREANNPWL -QELPRPLSKIVWGNPLLIPPDLARSMGLRNGDEVALSVGARRAVLPIWVQPGQASGCVVGLLGSGRRRAG - ->ACTB1_Methylobacterium_sp_4_YP_001772545 -MPPLSGPRTVSRREALRAFAAGITLAAGACAKPDEEIVPYVVQPERVTGGVPLVFASTLPLAGYGRGCRV -RSVDGRPIKVEGNPRHPGSLGATDVFAEAAVLSLYDPDRSKTLRQGGDIGTWSALQRALVAKVAAWRETR -GEGMRLLTGRVTSPTLQRQIARLLDAYPRAAWHAHEPTEDASARAGAALAFGRPLWPVPHLDRAAVIVSL -DADPLGPGPDQIRNGRGFGSRRVPAAGEGFSRLYAVEAAPTLTGAKADHRLALPPHRIGEVAVALARALG -ADLRAPTLPEEAARLAARAAQDLRARRGAALVLAGPTLPPEIHALAHWINGVLGAPLDWIEPPDLIGGRA -PGTLSDLARDLAAGGVQDLVMLGVNPVYDAPADLALAERLGRAPFRLHLGPAVDETAVLATWHVPETHPL -EAWGDLRAVDGTASLVQPLIRPLYATRTAEEVVCALLGEGDAASYDLVRETWRPGREAGFEEWWRRALHE -GVVQDSAAAPVATGSPRLPDPGPPAAAQDLTLVLRPDPGTWDGRMANNAWLQECPAPLTKQVWGNALALA -PDEAARRGLAQGDLVRVAAGGRSIEVPVATVPGHAAGVASLTLGHGRSRAGAIGNGIGASAYALRREDAL - ->ACTB1_Ralstonia_eutropha_YP_298623 -MTRARVIPLVPVDEPSDAPRSPARRHFLRTTMAASAALAGAACSGPPAEMIVPYVQMPEGIVPGRPLFYA -TALTRHGYGMGVLVETNMGRPTKIEGNPRHPASLGATHPFDQAAVLQLWDPDRSQAPYRGGALSGWAAFD -AALATQRVQWRDRDGEGLRLLTGNVGSPTLSAQIAQWLDRYPKAVWHVHDPLYDEDPSPRMAFGDDVDLL -IDPKPATTIVTLDADLVGHGPAAVRHAHDFMADRRGVAPMLACRLYAIESSPTLTGEISDNRLALPPHEI -ERLAWSLARKLGVPDVPVDTPEPASDTARHWIAVLARRLREAPPGSSLLIAGGALSGPTRALVWRLNARL -GNLGKSVRPVAGTPRRPLGEAHSIGALTEAMRAGAVSALLMIDVNPAYDAPCGLGFDAALRHVPWSSHMG -VYRDETARLTTWHAPMAHDLERWSDARAWDGTASIVQPVIAPLNGGRSAHELLSAAVDEHQSGYDLVRAH -WRARQRDDFDAFWEQALRTGVIADTAAPPATTDMRQPITPPSFAAPPLVARFMPDPATDAGELANNAWLQ -ELPRALTRHTWDNAALIGPLTARARRLSTGDIVVIRRTDRQGNPIEAPVWVLPRHAEGVVSLPLGYGRRH - ->ACTB1_Chloroflexus_aggregans_YP_002464666 -MTQHQSDLEAIRAQLRDARGPQFWRSLDQLADSPAFRELVEREFPRGASEMSDGMSRRTFLKLMGASLAL -AGVTACTYQPRQYIAPFDRQPEGRIPGVPQYFASTLTLGGYGTGVLVRANEGRPTKVEGNPRHPASLGST -DLFAQAEILTMYDPDRSTTVLRQGVPSTWAEFTTTLANALTAAQATQGAGVRLLTTTVTSPSLAAQIEQF -LQAYPQARWYQYEPVNRDNVVEGARLAFGRDVTTRYDLAAAQVIVSLDADFLAPGPGFIAYARAFADGRK -VRKDSTGMNRLYVIEASPSTTGTAADHRLALRADAIAAFAGALAHELGIGGAPATLAAKAEEFLKAIAKD -LEEHRGRSVVIAGDQQPPIVHALAHLINAELGNVGKTVFYHEPVEARPTNQTNELVTLVSEMAAGRVELL -VMIGGNPVYNAPGDLRFAERMATVPLTVHLSQFVDETSVQATWHIPQAHPLESWGDARAFDGTASIVQPL -IEPLYGGKTANELLAAMLGQPDAESYDLVRGYWEERIGNTNWNVALATGVIADTSAPVINPTLNEAAIRA -TAIPQPGDGVEIVFRPDPSVFDGFYANNGWLQELPRPLTKLVWDNAALMSPRTAIKLLGLPFSADRLVGN -EADDRERQRYLEQLSKVNGTIARIEYRGGVVELPIWLLPGHAEDSITLNLGYGRTNAGRVGNGVGINVYP - ->ACTB1_Nitrosococcus_oceani_YP_343269 -MAGSSIKPLDLAPIRARLAEAQGRAFWKSLEELAGSEEFERFLYQEFPFFRELSQASLSRRDFMRLMGAS -LALAGLSACSTPPPEEILPYIRAPEGLVPGESLFFATAMPLDGFATGVLVESRMGRPTKVEGNPLHPASL -GGTDIFAQASVLQLWDPDRAQVISHRGEISTWQTFLAAMGEKMRTFEGNQGKGLYLLTPTVSSPTLISQL -RTLGKRFPHAHWHQYQPINQDNSYEGARLAFGESLETRYHLERAEVILSLDGDFLGSLPGHLRYARDFAK -KRRVDSAQSTMNRLYVAESSPTITGTMADHGVSLRASQIEVLALQLARALGIGVPRREETASDLPEQWVR -AVAEDLRQHRGTSLVITGEKQPPFVHGLVHAVNQALGNVGTTLTYSAPRAFNPRNQNESLNHLVAQMDAG -KVDTLIMLGGNPAYNAPADLAFSKQLAKVKSSIYLGLYEDETAAHSHWHIPETHYLERWGDARAYEGTVS -LLQPLIAPLYQGKSDYELLAVLLGQTDRSDYDWVRGYWQKQWPKSDFKSIWNQALQAGFIEGTALRSKSV -KLRDDWVAHLSRGQSKSKETSGMEIIFMPDPTIWDGQFTNNGWLQELPKPLTKLTWDNAALISPRTAENL -GLANEEVVALRYQERQVQAPIWIMPGHPEGAVTVTLGYGRAKTGQVGAGTGFNAYALRSSRAPWFGWGLE - ->ACTB1_Candidatus_Solibacter_usitatus_YP_821785 -MSDPRNQLDLAAVQKRLEGARGRDYWRSLDDLAATPEFQDLLEREFPRQAVGWADDEDANEGRRNFLKVM -GASLALAGMTACTRQPTEHIMPYVRQPEELIPGRPLFFATAMTVNGVANGLLAESHMGRPTKMEGNPEHP -ATLGACDPYSQASVLQLYDPDRSQALTFNGEIRSWGRFTGELREALALQKTKNGSGIRILTETVTSPTMA -AQLRAIQQVYPSSKWHQWDPAGPHMARAGSVQAFGQPTNTYYDFTHANVVVSLDSDFLASGPGYLRYARQ -FSARRRIHEPSDSMNRLYVAEPMPTPTGTKADHRLQLRAGDIEEFAWGLAISLGIAEGPKNGENHDIYKW -LGPMARDLQSNKGASLVIAGAHQPPIVHALAAIMNEKLGNVGKTVFYTDPIEANPGDQLASLMDLVKDLD -AGAVDVLLILGGNPAFNSPVELGMRDRLKKAKLRIRLGLYADETTEVCQWQVPEAHFLETWGDARAFDGT -ITIQQPLIQPLYNGRSALQLLQNFTDQPESSPYDVVKGYWRTQHQGADFENWWRRAVHDGFVANSALPTK -TPTVRGEALSARAGARHLGGKLEVIFRPDPTIFDGRFANNGWLQEMPKPVTKLTWDNAAILSPYDANRFG -VQNGDMLKLTYDGRSLNAPVFIQPGHVNGATTLHLGYGRWAGGRAAKGMGFDPYGLRTSKALWQDVGMDA - ->ACTB1_Candidatus_Koribacter_versatilis_Ellin345_YP_592078 -MDNGSKKNGADVCPSKKGKLELADVKQQLAAAKDGPQYWRSLDELSNTDEFQEMLHREFPRQASEWVDDG -GSSRRDFLKLMSASLALAGLTACTKQPIEPIVPYVRQPEELTLGKPLFFATANTVGGYAVPVLAESHEGR -PTKLEGNPQHPATLGGTDVFTQASVLTMYDPDRSQVVMLDNEIRTWGSFVGAVANPLAAQKAVQGAGLRL -LTRSTTSPTLGAQIKQLLQTYPQAKLVQYDPAGRDNARAGSQLAFGQYVETQYNLDKADIILSLDGDFLS -SGFPGFHKYARNFSQRRQPDLKEKMVRFYMAESTPTNTGGKADHRIPMRASDVEQFGRAIAAGIGVAGAG -GSAKQEWQNQVAAIVSDLNKHKGAAVVVVGEHQPPAVHALAHSMNAALGAVGTTVTYTEPIEQIPADQTA -GLKELVADMNSGKVDLLVVMGANPVYEAPADLAFLDAFKKVAVRIHHGLYVDETAVLSHWHINGTHFLEQ -WGDVRAFDGTVTIQQPLIAPLYNGKSQYEFVAALNGQGSTSGYELVKGTWQKQHTGADFEAWWRKAVHDG -LIAGTAAPAKTVSAKGAPAATNAASDSAMELIFRRDPMIYDGEYSNNGWLQEAPKPITQLTWDNPIEMNV -TQAEQMGIKTEDELEITVDGRKIVGGAWLTPGHPKNSVTVFLGYGRTRAGRVGTGTGYNAYQARTSDKQW - ->ACTB1_Anaeromyxobacter_dehalogenans_YP_002491266 -MPSLGLPIYGQKQGAGLDARRWRSVEEAAEAREVPPGEFPDDAAAVPEGFTRRGFLQVLGASVALAGLEA -CKPPRENVVSYVRPPAGVTPSLPSAYATVASRGGYAVGVVVTSHEGRPTKIEGNREHPSSRGGSDAMLQA -SILDLYDPRRLKGFTRAGRPLGFATLLREVSALARSHAQDGGARLRFLVEPTSSPAVADLRRRILERFPR -ARFDAWAPVGADAGRAGAAIAFGKPLDAAASLADADVILSLESDFLALEGDSLRLAREFGARRTAERMNR -LYVAESAYTVTGGAADHRFRMRSADVLGFGRAVAAELAAKHGLAQLAPLGAPAGGERAKAAAAVAADLAR -ARGRSAVLAGDRQPAAVHALAAALNGALGNAGKTVAYRPTALLDPAAGPDRLRALAGELEAGKVDALVVT -AWNPAHTAPADVPLRKLLPKAKDTIALALREDDTVRLATWKIAATHPLEAWGDLRAADGTASIQQPLIAP -LHESLSELELLAAFLDEGDHGTWRIVREGWRRRAGEAGFDGRWDGWLAAGVVAGSAVPPEPAQADLARVA -EAVRAVAAPGASLELGFAADYKVLDGRFLENAWLQEYPHPITKLTWDNAAQLSAATAKQLGVESGDLVEL -SWRGRTLTAPALVVPGHADGSVLLTLGYGQALSGPVGKGVGHDAYALRTSDAPWFGAGVEVRKTGKRHPL - ->QrcB_Desulfococcus_oleovorans_YP_001530428 -MKIDRRSFLTLLAGGAVGTALSPMTIKLTDDISIWSQNFRGTPIEVPVPERGPASYVDSVCTLCPGGCGI -SVRKIGDRAVKIEGKAGHPVNNDGVCALGLSGLQLLYGPWRVTGPKKKENGRWKKISWDRALSEIAEKLN -ELREAGKADAIAGISRTGRGTVARLMQRLLAAAGSPHFLPVPTNENAYSDAVARMFGKPGTVGFDFENSG -YVLSFAAGLLDGWGSPVHMFSAHSQWKTNGVKMVQVESRLSSTAAKADQWVAVKPGTEADLALGLAHVIL -RDNLNAGAAANSRAFDSFAALVKKDYTPARVAAATGIKESVIVALAKEFAAASHPVAVCGRGDGQTPCDS -REVMAVTALNALVGSVNRQGGMIIGPEPDYIQWARPVLDDTAQKGLAKGPKTLADLLAGKTPDVQALFVL -EANPAYTLHDTTKVKAALEAVPLVVSLSSFMDETSALADYILPLPTCLERTEDVVVTAGLKTPMIGLTQP -VVEPRLDTRHPGDVILDLAKAMGGTVAESFAWSDYQDCLEKTFGLVYGKLATEGYLQKSVLETLIDTAVA -VGRADFAPVVEADKKVRQNTPALVLAAYDAMRVAGGAIATPPYAMKIVPDTILKKNDLYVEINPETAQKA -GLADGKAAVVETPAGTAQVRVRVTHEVAPGMVAMPRGFGHTAYDDYVSGKGVNVNDLIGPVPDPVSGLDT -AWGAPAKLIKA - ->QrcB_Desulfomicrobium_baculatum_YP_003159879 -MGLDRRSFISLVAGGVAGSLFTPVIWKTLDDVSIWTQNWPWIPRLQYGEELTVPALCKLGADAYGLKVKT -IAGRPVAAEGNPDHPLSLGGICPLGAASVHLLYSPSRVKNPKLRDGSSFKDITWEEAEELLAGKIKEAGA -SMAMISGDETGSVTDVLSGLVGKAGSDKSFFMPGESAPAAAALAMLGGDGQVGYDIENANYVLMLGADAL -GSWGNVARNGKAFSASREKGVKFVYVGPAQNGTSAVADSWIPCAAGTEPVLALGIAAVIAGTNRDRSFWP -GFASFAKFVQTSYPLDKVAEITGVSAATITGLAQELVRAGRPLVLTAAEAGQGLGAFELAAGMSLNMLLQ -RVNTVGGVRILPWAPKVVEAAADKKAMLANDLVAYLSTVADGGAEAPALLMVYGANPAYALPNLVKAQAA -IDKAGFVVSFSSFMDETAAMADLIMPDSYAFERLDDAYSPYGSGQPNYTVAAPVIKPVFDTRPAGDVLLS -VAAKAELDLGFETFEDVVKAKAEALGADFDEMVEGAVWVSEEFPAQDLALWTTPLQELAVAAQDGKTLAL -APVLRLKIGSSKIAIPPFNTNAIRFDEMLGNDMYVLINAATAKNLGLKKDDAVKLASSGGECKARVRIFE -GVMNDTVVAPLGLGHTAWDAFSSGKGDNVYKLLAADTETETGLSRFATVRVTVSKA - ->QrcB_Desulfovibrio_magneticus_YP_002953179 -MGLDRRAFLGLVAGGTVGAMFTPIPWKLIDDASIWTQNWPWIPRVPKGQVDYVATTSKLCPAGEGLKIMR -VAGNPILAGGNPSHPLSCGGVSALARSEVYMLYSPARIKSPMKRNGKTFAPITWEQALVEMAEKLGAAKG -AVASISGDNTGTINEVLTALTAKLGSAGSFMMPSEATTAAKAMKLMGAQGQAGYDFENADTVLVLGADIF -ETWGTSSRNRKAFGANRPAGAKPANTYVYVGPSRNNTAAVCDQWVPAAAADLGVVALGIAWHLLKAGATS -NAPGFDTFKAVVNGGFGPEDVKRATGVAPETLAAIAKALASAKAPLVVTGSPFGQGLGAAPVIAGMSLNM -LLGRINKPGGVYMLPELPSVVPGALTRAAMLDGDLPAFLKGVESGKTPAPKALLIYDANPAYGLPEAATM -AKALEKIPFKVSFSSFMDETAALCDLVLPNSLPLERYDDVATPYGSGFCVYSLVRPIQKPICDTKTTGDV -LLGLARKLSIDLKFDNFQQVIKEKVASLAKVSGGFVAKDVMPWQVAAGKPAPALVGGDLWKALEAGYAWT -MVGQAAQTAMGFAAEVVAKAVKAGKPATATVLAPYAQLRTGTPVTGMPCQDLTTVPDTELLGDTTFIRVN -SETAKTLGLKKGQMVKLSGAGVDCQAKVHIFESVMPGMVSAPLGFGHTAFDYYSQGKGANYLSLAAVVEE -PGSGLSMWIAPEVKIA - ->QrcB_Desulfovibrio_vulgaris_YP_967712 -MALDRRGFLKFIGGATAGILATPVVWKGLDDVSIWSQNWSWIPRNIKGANSYVPTVSKLCPTGVGVRVRL -VDGRPVRVIGNPEHPLSKGGVSSIAAAEVQMLYSPARMKRPLKRSPDGAYVMISWEEAEAMLLDGLKAAK -GGDALACISGDDNGTINELLSAFVQQSGSKSFFLMPGEAQPAAKAWDLMGGEGQIGYDIEKSDFVLAIGA -NVLEAWGTAIRNRHAFGASHPHGAEPTAQFVYAGPVLNNTATGADDWLPIRPGTESAFALGLAHLLIKAG -ASSSAPDFDAFRSLAASFSPEKVAAQTGVDAKALTALAQALAKAKHPLVIVGSEFSQGAGAAPVMAGIAL -NMLLGSVNRDGGLRALPVARKVVPAGMDRKAMLQQDLTLWASAIASGKAKAPKAMLVYEANPVYALPQGS -AFKDTLAKVPFKVAFTSFLDETAMQCDLVIPVSMGLERLDDVCTPYGCGEVVYSLATPVTAPLFDTKPAG -DALIALGGKLGLDLGVASFEDMLKAKAAAHGADFDKLAEGTAFTSRATVGANLSFRPDVLSKALDVKAPA -LPLALAPVMKLNMGTSKTAIPPFNTKTIRRWEVQGKEGYVMLNGATARKLGLAQHDRVVLSNPTGKVTVR -VNIFEGVMNDTVAMPLGFGHTAFDEFSKGKGENVMHLLAPSTEPVTGLAVWTGAGVNIAKA - ->ACTB1_Mariprofundus_ferrooxydans_ZP_01451016 -MSENKSSSNWTRRSFIKAMGLGGAAGSALVLSGCGDTDIINEVDIEVRKEKVEPNVDPQDYVRPGIEMYY -ASTCRQCPAGCGVHARIREGRVLKLEGNPVSDVNHGRLCPMGQAGLQSHYNPDRLTKPMLRKGGKLVEIS -WDEAEDVLRKNLGRKNAKLAWLSGATSGHHRALVDAYLAAAGAKNHFVFDTLPPAVGHAANQEMFGSYMP -RLDFDKARLIVSFGADFLGTWMSPVQFSTQYAEFRNAPRGTLVQIEPKMTLTGANADRWIPARPGTEGHL -ALALASLLVQKSEYADRVPADVVASLKDVNVDEVAKLCDIPVERIHHLHHLMTDRSPSLVLSGASAEGVQ -HGFETARAILMLNVLLGNVGETILPRSEDPFPALAPRMGGWSEVKAMVDGLNKGSFDTVVVFGSNPLYQA -PGFMQADKAFDKAKFRISFSMFPDETTMACDLVLPVHSYLEEWNTTMPAYAATDGYLGLQQPVMNPVFGS -HATRSFGDLMLDVLKHMDPNFKQWDSYQAYVMGALWTMRPALVKQYKPSVPGQTEEEAFKQGILSDGFVQ -MKVAKAAKIEAKVSAVTLPAEKANANYPFRLIPSARLGLWDGRHANVPWLQELPDQLTEVVWDSWIEIHP -KTAEKLGVITGDVVQVESSAGKAKVKVVVFPGIHPDAVAIPLGQGHTEYGRYAKGVGVNPFSILAALFDG -KTGELATYATDVKVAKIESRGKLVTLANGDLVLESNTSTQAGRELVKTTTAENFDLTEKGA - ->RBG1_1305 -MNNKENPHKKYWSTLSEFHQDAEFKKLKKEEFLSKPQSFFESNGNNDTTFSRRDILKLAGAAAVFTAAACARRPVEKIVPYLDPSEEVIPGKAVWYSSTSGTSDGCGMLVKTREGRPIKLEGNPDHPLNKGTLSAREQAAILDLYDPDRLKHPAKISAGQVLKSDWKSADTEIARSLKSAKGKMVLLTGTIHGPARKRLIREFLFSFSNAEHITFDALSEEEILEAQELCYGNRVLPRYRFDKAEALVFLGADPLASGHSKTEFAYGFGHQRKINSNQMSKVISFEPALSLTGQNADLHYLVKPQDLIKVGLALAHQLIVAEKKSKLASDLLVQNLLENYSAKKVETEIGLPEGTIKSVAADLWLARGRGLVYTGSLTVRDNSALALHLVTNLLNSALENEGNTVDGVQSVSQQSQGSYSELMNLISDMKSGKVEAVLIYGNNPAYGLPQSAGFEEALQKVKTKIYLGDRADETGSLCDFVLPSLHFLESWGDAEPQQSLYSLMQPTISPLHDNRGWEDSLLALMREIKGVALGKEYASWHDFLKDTWYKEIYLKNDLVASFEDFWISVLRQGLFDTVNRSAEKSSPRQFRTTALSNIGKIKNVDSKFTLALYTPAMQFDGRTNNNSWLLETPDPVSKIAWDNYVNIAPRTSVELGLQESDVVSLTVNGVTQEIPVHIQPGIHPEVFTVAVGWGREKVGRVGNNVGVNAFRWSKIQNRHLVSSSLPVEIKKTGKQIKLANVQGHNYINGRPVIYEATLAEYQKNPTAGRAGEEKLTSIWPSHPYE - ->B_Caldithrix_abyssi_ZP_09550397 -MKTKMKRREFIKIAGAGAGSLVVGSKLYASFNSKDEQNLLADGKIERTPTYCEMCFWKCAGWVYKKDGKP -WKIIGNPDDPNSRGRFCPRGTGGIGAYTDPDRLKKPLLRVEKNGKQVFKEVSWDEALDFIAGRMKDIAQK -HGPECIALFSHGSGGSYFKTLLHAFGSNNVAAPSYAQCRGPREEAYMLTFGEAVGSPERTDIINAKCLVL -LGSHIGENMHNGQVQEFSEAVAHGATVITVDPRFSTAASKSKYWLPIKPGTDLALLLAWIHVIIYEELYD -KEYVKKYTFGFEQLKEALKDKTPEWAYPITTIKPHVIRQTAREMAKNAPATIVHPGRHVTWYGDDTQRVR -AGAILNALLGSWGRRGGFYFPSKAHLPKMPIPKFPNVKRDWRKAFPNKYPVAHLALSSGICDATIPSPER -ECSFKGWIVYGTNLPMTLPQPEKTLEAIQHLELLVAIDILPAEITGWADVVLPECTYLERYDNLRLSPGR -VPSIALRAPAFEPKYESKPAYWMARELAKRLGLEDYFPAKTIEEYLDYQLKAIGSSLEEMKKIGVKLLPE -EAQKLYLEDGEDFEFPTPTGKIELYSTILDEYGFDPIPQYTAHEEPPEGYYRLLYGRAPMHTFGRTTNNP -NLHDLMEENTVWINSKVAKQWGIKNGEYITLENQDGVRSTPVKAKVTERIRHDAVFMVHGFGHSDKRLRR -AYGKGADDQRLITRVKIDPLMGGTGMRVNFVTFRKEEA - ->ACTB1_Opitutus_terrae_gb_ACB77208 -MKRKSDHSAPANSEPTGPKYWRSLDELAATPGFQEQLHREFPEGASELNGVDRRHFLKIMAASFALGGVG -LAGCRRPEKYVLPYGKSVEGMIPGLPLYFATAMPLRRTAIPVLAETHQGRPTKIEGNPTYQQHGGSASLL -AQASVLDLYDPERATQHTREGRKLNVADLNEQLAQIGTSHAANGGAGLAFLAEESSSPTRARLLAQLRAR -LPRAIWAEYEPVADEAPVSAATAAFGQPVRPLYRFARARRIVSLDADFLRPDGAGLYYAREFAKGRRVVN -REDAQQMNRLYVAESAFTITGSMADHRLRLASSHMLALAAALAVKITGSAAFAPLSAGLDIDPKWIDECA -ADLLAHRGTSVFVAGAHLPEQVHAIAYAINAALGNIGATVDFVAPPTNDAASIQTLATAIRDGAIDTLVI -LGGNPVYNAPADLDWAALQKSVKNVVRLGYHTDETTVASPAGAHLAAAHYLESWGDARTADGTIVPIQPM -ILPLFGGLTELEVLARIVGANNPDPYALVLETITALAGGDAEKAFQQFLHDGLLANSAYPTVAVSYNAAG -VARLLGAGAGNPAALSKDNLEVRFVTDYKMDDGRFANNGWLQELPDPITKISWDNAILVSPRLARELGVY -PDGSTLQVARVEMAGFHQGKEQAFIGELTVNGRTVRAPIHIQPGLSNYTVVLPLGYGRTQSGHVGRGMGH -DFYPLRTSAGLHFTVGGKLVPTQDVKAMPNTQEHWSMEGRDIIREANVDEFLENPRFVAAFGMESHSPSI - - ->ACTB1_Flavobacterium_psychrophilum_YP_001295304 -MSSNKKYWKSVEELNENSSIVETLRNNEFVEEISTNEFLGDAVTLATSSTTRRDFLKYVGFTTAAASLAA -CEGPVHKSIPYVVQPEEIVPGVADYYATTIADGFDFANVLVKTREGRPIKIENNKIAGANFHANARVHAS -VLSLYDSMRMKTSKIAGKDTIWEQANAKIKASIADAKAKGGKVVLLTNTSASPSTDKLIAQFLVSNPNAK -HVTYDAVSSSEALDAFQTVYGERALAEYDFSKANVIVSIGADFLGDWQGGGFDAGYAQGRIPQNGKMSRH -FQFESNMTLSGAAADKRVPMTVANQKQALVQIYNVITGSSIGSSKDEAVMKAAQQLKAAGSKGVLVCGID -DKNAQLLVLAINKVLSSEAFNTANTRQIRKGNNADVKQLLADMKSGAVHTLIMNGVNPVYSLPNGKEFAN -SLKKVKLSVAFAMKEDETAAVANIAVATPHYLESWGDVSIVKGSYALTQPTIRPLFDTVQFQDALLSWTG -NAQTYYDYLRSSWSGAKSWNQLVHDGVVFTEGISSSAGAGADYNGAASTLAKASSKGLELVLYTKTGLGD -GQQANNPWLQEFPDPITRASWDNYLTISQADATTSGIENWNVANGGLNGSYVTLTVDGVKLEKVPVIIQP -GQAKGTVGLALGYGRKAAMKEEMQVGVNAYTLYNNFSNVQNVSIAKEDGEHEFACVQLQRTLMGRGDIIK - ->ACTB1_Salinibacter_ruber_emb_CBH25246 -MIELDVIDSETAARDEESGARDGSSEPTFWRHWSESDADEDGDDLTEFVPGDSEPPSGASRRQFLQLMGA -AMAMAGLAGCRRPEEKILPYAREPETVTPGIEDHYATSMPFRGVLRPVVAQSNEGRPTKIKGNSDHPSGQ -SGTSPYEQASVLNLYDPDRSRSVRQEGRAASWSDFVSFCRQLGNEADQHQVAVLAEKTSSPTVQAMRQRM -ADRFPNLQWVPYAPTGTDPRRLGMQQAFGRPLRPRFELGEAEVIVSLDANFLDGRTHDFGYHTQGFAEGR -RLDDAEDTMSRLYTVESRYSTTGGSSDHRLAMRAGRIPALAAALAAELGVGEAPDVSWSERERLHVREMA -RDLQAAGEHGVVMAGEAQPPEVHALAMAVNQRLGGLGTTVTLFDPGDDEIQPQDEALADLTASMRAGEVD -TLFMLGVNPVYDAPSELGFEEALSNVRDTVHLGRLRNETAQAARWHLPRTHYLEQWGDGRAYDGTKSIVQ -PLIRPLYDDAHSLIEVLNLAATGVDASGHDLVREQWRAQLPAPFQERWRKALHDGYLEGSGYETASVGTA -TVPSIDAPASDPDEIEVVFRTDSKLLAGRFSNNPWMQELPDPISKIVWDNVAVMSRATADELGVEVQRRE -GSFYADRVELTLDGQSVKLPVWVQPGYPDGSIGVSMGYGRTIASTRESESTPFWDTSDQTNIYNGSPIAG -GVDSSGEPVDVVGGNVAPMRPNGGRVATGANVTQVGSGYLLATTQEEGSMQGRPIVRWATLDEFKENPEF -VNESQPPVPDLGHESGGHGDGGHGDGGGHGGGDGHSGDGAAGNVSGQGLEAGPGADAHGADEMPEQAAHG - - ->ACTB1_Rhodothermus_marinus_gb_ABV55245 -MIELPVVNPDGAETPGSGKRLWRSTADLRRDPEWVKLAHDEFMPGVAEPPSGTSRRQFLQIMGASMALAG -LTACRRPVEKILPYVRQPEEIIPGIPLYYATAMPFRGSVRPLLVESHEGRPTKIEGNPDHPLSRGATGVF -EQASLLNLYDPDRSQQVLRKGEPASWGDFVQFARSLAAEAGTKRLAVLCEPSSSPTLAALRRELERRYAQ -VRWVTYRPEGDDHEALGLQQAFGRPVRARYRFSEARVIVSLDADFLGPTDRNFVENTREFAASRRMERPE -DEISRLYVIESTYTVTGGMADHRLRLRAGDIPAFAAALAAELGVGELREAGARFAGHPYVVEIARDLRAA -GARGVVLAGETQPPAVHALCAVINDLLGSLGRTVILHALDEPATAQHAALAELVQAMQAGAVDALLLLNV -NPVYDAPAALGFAEALAQVPEVIHLGLHMDETARRSTWHLPSTHYLEAWGDGRAYDGTLSVIQPLIAPLY -EAAHSPLEVLALLATGEEQSAYDLVRNTWRRLLAGRGAFEQAWQRVLHDGFLPDSGYPTVSLRPNRQALA -DWPQAAEGGLEVVFRLDPTVLDGSFANNAWAQELPDPITKIVWDNVAILSPKTAAALGVKAEYHKGVYIA -DVIELSLDGRAVELPVWVLPGHPDDSITVYLGYGREITSTRPERKTPFFDLDEYTDMYGHGAIATGVGPR -TWPRCGGPDNTWVAYGAQVRKTGRTYKIVTTQDHGSMVGRPLVRLSTVEEFRKNPDFAKEAEPPLEGLEP - ->TMAO_Photobacterium_profundum_YP_129680 -MNMSVSRRSFLKGLATTSAVSVIGPSLLASSKAMAAETTGTWKTSGSHWGAFRAHVYAGKVQEIKPLEMD -KYPTDMLNGIKGIIYSPSRVRYPMVRLDWLKKHKYSGETRGNNRFIRMTWDDALDLFYRELERVQKDYGP -WALHAGQTGWRQTGQFHSCTSHMQRAVGMHGNFITKVGDYSTGAGQTILPYVLGSTEVYAQGTSWSEILD -HSKNIVLWATDPVKNLQVGWNCETHESFAYLEQLKEKVAKGEINVLSVDPVKNKTQRFLGNDHMYINPQT -DVAFMLAVAHTLYTEDLYDKEFIKMYCLGFDEFVPYFMGKSKDNIEKTPEWAAEICGLPADEIRDFARML -VAERTQILFGWCIQRQEHGEQPYWMGAVIAAMVGQIGLPGGGVSYGHHYSSIGVPSTGFAAPGGFPRNVD -EGQKPKWDNNDFNGYSRTIPVARWVDCLLEPGKEIKYNGSKVILPDYKMMIISGNNPWHHHQDRNRMKQA -FQKLQTVVTIDFAWTATCRFSDIVLPACTQFERNDIDVYGSYSGRGLVAMHKLVDPLYQSKTDFDIFTEL -SRRFGRHKEYTRGMDEMEWVRSLYSDCRDANKAKFDMPEFDEFWAKGVLDFGEGTPWVRHADFREDPEIN -ALGTPSGFIEISSRKIDRFGYEHCQGHPMWFEKSERSHGGPGSKKHPFWMQSCHPDKRLHSQMCESEEMR -ATYAVKGREPVYINPKDAAEKGIKDGDIVRVFNDRGQLLAGAVLSDSYARGVIRIEEGAWYGPLNEKVGA -IDTYGDPNTLTQDIPSSELAQATSANTCLVDFEKFKGEVPPVTSFGGPIEVS - ->TMAO_Vibrio_vulnificus_YP_004189064 -MAITRRSFLKGVATTSAASVIGPSLLASASANAVETTGTWKVSGSHWGAFRAHIYAGKVQEIKPIELDQN -PTEMLNGIKGIIYSPSRVRYPMVRLDWLKKHKYSADTRGNNRFVRVTWDEALDLFYRELERVQKEYGPWA -LHAGQTGWNQTGSFNNCTAHMQRAVGMHGNYITKVGDYSTGAGQTILPYVLGSTEVYAQGTSWSEILENA -DNIILWANDPVKNLQVGWNCETHESYAYLAQLKEKVAKGEINVISVDPVKNKTQRYLENDHLYVNPMTDV -PFMLAIAHVLYTENLYDKKFIETYCLGFEEFINYVQGKTKDKVEKTPEWAAPICGVKADKIREFARMLVK -GRTQILMGWCIQRQEHGEQPYWAAAVVAAMIGQIGLPGGGISYGHHYSSIGVPSTGFAGPGGFPRNLDAG -MKPKWDNNDFNGYSRTIPVARWIDCLLEPGKEINYNGGKVKLPDFKMMVISGCNPWHHHQDRNRMKQAFQ -KLQTVVTIDFAWTATCRFSDIVLPACTQWERNDIDVYGSYSSRGLIAMHRLVDPLFQSKPDFQIMKELTE -RFGRSEEYSRGMSEMDWIRSLYNDCKKSNEGKFEMPEFDEFWEKSVLDFGQGQPWVRHADFRQDPEINPL -GTPSGFIEITSRKIGRYGYEHCQEHPMWFEKSERSHGGPGSDKHPFWLQSCHPDKRLHSQMCESEEFRAT -YAVKGREPVYINPLDAKAKGIKEGDLVRVFNDRGQLLAGAVLTDSYPRGVIRIEEGAWYGPLSEKVGAIC -TYGDPNTLTQDIGSSELAQATSANTCIVDFEKFTGKVPPVTSFGGPIEVA - ->TMAO_Citrobacter_youngae_ZP_06352135 -MLAVGAASALAPNPLISKVWAAGENPEQWIQSGSHFGAFEAKVVNGEWLETRPFKHDKYPCDMLNAVREV -VYNPSRVRYPMVRLDWLRKREKSDRSQRGDNRFVRVSWDQALDLFYEELERVQKTYGSSGVFTGLADWQM -VGKYHKAGGAMDRGLGLHGSYVTTVGDYSAAAAQVILPHVIGSLEVYEQQTSLPLVIQNSNTIVLWGCDP -IKNLQIEFLVPDHDAFGYWQQIKEAVAQGKMRVISVDPVRSKSQNYLGCEQLALRPQTDVALMLALAHTL -YEEKLYDTAFINDYTVGFEQFLPYLLGESDKQPKNAEWAAEICGLTAEQIRDFARLLVKGRTQFMGGWCA -QRMHHGEQYPWMLVVLASMVGQIGLPGGGVGFGWHYNGGGTVTSAGPVLSGLGGIANPPPAKYKADFRGA -SEHIPTSRIVDCLLEPGKKVAFNGETLTWPDIKMAIYSAANPFHAQQDRNRMIEAWKKLETVVVLDHQWT -ASCRFADIVLPVTTRFERNDIEQFGTHSNKGLMALHQVVKPQYEARHDFDVFAGLCKRFDKEAVYRENRD -EMQWIQALYDEGVKMGASLGVSLPDFTTFWQGEGYIEYPAGQPWVRHGEFRDQPDLNPLGTPSGLIEIYS -KTIAGFAYEDCPGHPVWMEPFERNHSAKKNKYPLHLQSCHPDKRLHSQLCSSDAFRNTYAVAGREPLYIS -AQDAAARGLKAGDIARVFNDRGQVLAGVVISPDFTPGVIRIHEGAWYSPQEGGKAGTLCTYGDPNVLSAD -IGTSQLAQGPSAHTVLVEVERYQQKAPQVTAFGGPETVKEEGGSAA - ->TMAO_Salmonella_enterica_gb_AEZ47489 -MKNKDSLHVSRRRFLAQLGGLTVAGMLGPSLLTPRSARAADAVAPGAATKEGILTGSHWGAIRATVVDGR -FVAAKPFEQDKYPSKMIAGLPDHVHNAARIRYPMVRVDWMRKGHQSDTSQRGDNRFVRVSWDEALDLFYQ -ELERVQKTYGPSALLTASGWQSTGMFHNASGMLARAIALHGNSVSTGGDYSTGAAQVILPRVVGSMEVYE -QQTSWPLVLQNSKTIVLWGSDMVKNQQANWWCPDHDVYQYYEQLKEKVASGAISVISIDPVVTSTHDYLG -RDKVKHIAINPQTDVPLQLALAHTLYSEKLYDKNFLDNYCVGFDQFLPYLLGEKDGQPKDAAWAEKLCGI -DADTIRALARQMAGDRTQIIAGWCVQRMQHGEQWSWMVVVLAAMLGQIGLPGGGFGFGWHYNGAGTPGRK -GIILSGFSGSTTVPPVHDSTDYKGYSSTIPIARFMDAILEPGKIINWNGKSVKLPPLKMCVFAGTNPFHR -HQQINRIIEGWRKLETVIAIDNQWTSTCRFADIVLPATTQFERNDLDQFGNHSNRGIIAMKQVVSPQFEA -RNDFDIFRDLCRRFNREAAFTEGLDEMGWLKRIWQEGSQQGKGRGIHLPTFEVFWNQQEYIEFDHPQMFV -RHQAFREDPDLEPLGTPSGLIEIYSKTIADMQYDDCQGHPMWFEKIERSHGGPGSQRWPLHLQSVHPDFR -LHSQLCESETLRQQYAVGGKEPVFINPQDASARGIRNGDIVRVFNARGQVLAGAVVSDRYAPGVARIHEG -AWYDPDKGGDLNALCKYGNPNVLTLDTGTSQLAQATSAHTTLVEIEKYTGPMDNVTAFNGPAEMVAQCEY -VPASQGNPHD - ->TMAO_E_coli_CAA52095 -MNNNDLFQASRRRFLAQLGGLTVAGMLGPSLLTPRRATAAQAATDAVISKEGILTGSHWGAIRATVKDGR -FVAAKPFELDKYPSKMIAGLPDHVHNAARIRYPMVRVDWLRKRHLSDTSQRGDNRFVRVSWDEALDMFYE -ELERVQKTHGPSALLTASGWQSTGMFHNASGMRAKRIALHGNSVGTGGDYSTGAAQVILPRVVGSMEVYE -QQTSWPLVLQNSKTIVLWGSDLLKNQQANWWCPDHDVYEYYAQLKRKSAAGEIEVISIDPVVTSTHEYLG -GEHVKHIAVNPQTDVPLQLALAHTLYSENLYDKNFLANYCVGFEEFLPYLLGEKDGQPKDAAWAEKLSGI -DAETIRGLARQMAANRTQIIAGWCVQRMQHGEQWAWMIVVLAAMLGQIGLPGGGFGFGWHYNGAGTPGRK -GVILSGFSGSTSIPPVHDNSDYKGYSSTIPIARFIDAILEPGKVINWNGKSVKLPPLKMCIFAGTNPFHR -HQQINRIIEGLRNVETVIAIDNQWTSTCRFADIVLPATTQFERNDLDQYGNHSNRGIIAMKQVVPPQFEA -RNDFDIFRELCRRFNREEAFTEGLDEMGWLKRIWQEGVQQGKGRGVHLPAFDDFWNNKEYVEFDHPQMFV -RHQAFREDPDLEPLGTPSGLIEIYSKTIADMNYDDCQGHPMWFEKIERSHGGPGSQKYPLHLQSVHPDFR -LHSQLCESETLRHEYTVAGKEPVFINPQDASARGIRNGDVVRVFNARGQVMAGAVVSDRYAPGVARIHEG -AWYDPDKGGELGALCKYGNPNVLTIDIGTSQLAQATSAHTTLVEIEKYNGTVEQVTAFNGPVEMVAQCEY -VPASQVKS - ->TMAO_Shewanella_massilia_CAA06851 -MNRRDFLKGIASSSFVVLGGSSVLTPLNALAKAGINEDEWLTTGSHFGAFKMKRKNGVIAEVKPFDLDKY -PTDMINGIRGMVYNPSRVRYPMVRLDFLLKGHKSNTHQRGDFRFVRVTWDKALTLFKHSLDEVQTQYGPS -GLHAGQTGWRATGQLHSSTSHMQRAVGMHGNYVKKIGDYSTGAGQTILPYVLGSTEVYAQGTSWPLILEH -SDTIVLWSNDPYKNLQVGWNAETHESFAYLAQLKEKVKQGKIRVISIDPVVTKTQAYLGCEQLYVNPQTD -VTLMLAIAHEMISKKLYDDKFIQGYSLGFEEFVPYVMGTKDGVAKTPEWAAPICGVEAHVIRDLAKTLVK -GRTQFMMGWCIQRQQHGEQPYWMAAVLATMIGQIGLPGGGISYGHHYSSIGVPSSGAAAPGAFPRNLDEN -QKPLFDSSDFKGASSTIPVARWIDAILEPGKTIDANGSKVVYPDIKMMIFSGNNPWNHHQDRNRMKQAFH -KLECVVTVDVNWTATCRFSDIVLPACTTYERNDIDVYGAYANRGILAMQKMVEPLFDSLSDFEIFTRFAA -VLGKEKEYTRNMGEMEWLETLYNECKAANAGKFEMPDFATFWKQGYVHFGDGEVWTRHADFRNDPEINPL -GTPSGLIEIFSRKIDQFGYDDCKGHPTWMEKTERSHGGPGSDKHPIWLQSCHPDKRLHSQMCESREYRET -YAVNGREPVYISPVDAKARGIKDGDIVRVFNDRGQLLAGAVVSDNFPKGIVRIHEGAWYGPVGKDGSTEG -GAEVGALCSYGDPNTLTLDIGTSKLAQACSAYTCLVEFEKYQGKVPKVSSFDGPIEVEI - ->DmsA_Actinobacillus_succinogenes_130Z gi|75429943|ref|ZP_00732527.1| -MNHLDLNSNTTRRRFIKTTGLTAFAASAGISIPFATKAGNQSITSTAGADEKVVWSACTVNCGSRCPLRM -HVKDDQIIYVETDNTGSETYNLDHQVRACLRGRSMRRRVYNPDRLKYPMKRIGKRGEGKFKRISWDEALT -EIAQSLQKNIAQYGNESIYLNYGTGTLGGTVTKSWPPGSTLIARLMNCIGGYLNHYGDYSTAQISVGLDY -TYGGGWVLGNGMADIENTKLVVLFGNNPAETRMSGGGLTYCIQQAKAKSNAKLIVIDPRYTDTGVGKEDE -WIPIRPGTDAALVSALAYVMITEELVDQPFLDKYCVGYDENTLPADAPQNGHYKAYILGQGEDGIAKTPE -WAAKITGIPAERIIRLAREIGSTKPAYISQGWGPQRRSNGEIISRAIAMLPILTGNVGISGGNTGARESS -YGVPFVMMPTLTNPVKASIPMFLWTDAITRATEMTAKTDGIRGVERLTAPIKFIWNYAGNCLTNQHADIN -RTHEILQDESLCEMIVTIDNHMTSTAKYSDIVLPDCMTSEQMDFCLDGYVANMSYVIFADQAVKPSFECR -NIYDMLSDLSEKLGVKQQFTEDRTQEEWLRYIYRQSREQLPELPVFDEFRTQGIFKKVDPKGFYIPYKEF -RDDPQANPLKTPSGKIEIYSSRLAEIARSWKLDEDEVIHPLPIHVDSFEHYGDPLMEKYPLQLTGFHYKA -RTHSTYGNVDILKSANPQEIWINPFDAEKRGIKNGDMLRMFNDRGEVRIHAKVTPRIIPGVVALGEGAWH -APDNQGIDHSGCINVLTTQRPSPLAKGNPQHSNLVQVEKL - ->DmsA_Haemophilus_influenza_sp_P45004 -MSNFNQISRRDFVKASSAGAALAVSNLTLPFNVMAKETQRLNENNQERIVWSACTVNCGSRCPLRMHVKD -NRITYVETDNTGTETYNLDHQVRACLRGRSMRRRVYNPDRLKYPMKRIGKRGEGKFKRISWDEALTEIAD -ALKRNIKKYGNESIYLNYGTGTLGGTMAKSWPPASTMIARFMNCIGGYLNHYGDYSTAQIAVGLDYTYGG -GWALGNGMADIENTKLIVLFGNNPAETRMSGGGLTYCIEQAKARSNAKMIIIDPRYNDTGAGREDEWIPI -RPGTDAALVAALAYVMIQENLVDQPFLDKYCVGYDEKTLPTDAPKNGHYKAYILGYGNDGIAKTPEWAAK -ITGIPAERIIKLAREIGSTKPAFISQGWGPQRRSNGELISRAIAMLPILTGNVGIHGGNTGARESAYSIP -FVRMPTLKNPVKASIPMFLWTDAIIRGTEMTALTDGIRGVDKLSSPIKVIWNYASNCLINQHAQINRTHD -ILQDDTQCEMIITIDNHMTSTAKYSDILLPDCTTSEQMDFALDAFVSNMAYVIFADQVIKPSFECRPIYD -MLSDLAEKMGVKEKFTEGRTQEEWLRHIYEQSREKLPELPTFEEFRQQGIFKKVDPNGFKVAYKDFRDNP -EAHPLKTPSGKIEIYSSRLAEIAKTWKLAEDDVIHPLPIHAQSFEHYGDPLMEKYPLQLSGFHYKARTHS -TYGNVDVLKAANPQEVWMNPIDAEPRNIKNGDMIRIFNDRGEVHINVKITPRIIPGVVALSEGAWYAPDK -DRIDHSGCINVLTTQRPSPLAKGNPQHSNLVQVERL - ->DmsA_E_coli_sp_P18775 - -MKTKIPDAVLAAEVSRRGLVKTTAIGGLAMASSALTLPFSRIAHAVDSAIPTKSDEKVIWSACTVNCGSR -CPLRMHVVDGEIKYVETDNTGDDNYDGLHQVRACLRGRSMRRRVYNPDRLKYPMKRVGARGEGKFERISW -EEAYDIIATNMQRLIKEYGNESIYLNYGTGTLGGTMTRSWPPGNTLVARLMNCCGGYLNHYGDYSSAQIA -EGLNYTYGGWADGNSPSDIENSKLVVLFGNNPGETRMSGGGVTYYLEQARQKSNARMIIIDPRYTDTGAG -REDEWIPIRPGTDAALVNGLAYVMITENLVDQAFLDKYCVGYDEKTLPASAPKNGHYKAYILGEGPDGVA -KTPEWASQITGVPADKIIKLAREIGSTKPAFISQGWGPQRHANGEIATRAISMLAILTGNVGINGGNSGA -REGSYSLPFVRMPTLENPIQTSISMFMWTDAIERGPEMTALRDGVRGKDKLDVPIKMIWNYAGNCLINQH -SEINRTHEILQDDKKCELIVVIDCHMTSSAKYADILLPDCTASEQMDFALDASCGNMSYVIFNDQVIKPR -FECKTIYEMTSELAKRLGVEQQFTEGRTQEEWMRHLYAQSREAIPELPTFEEFRKQGIFKKRDPQGHHVA -YKAFREDPQANPLTTPSGKIEIYSQALADIAATWELPEGDVIDPLPIYTPGFESYQDPLNKQYPLQLTGF -HYKSRVHSTYGNVDVLKAACRQEMWINPLDAQKRGIHNGDKVRIFNDRGEVHIEAKVTPRMMPGVVALGE -GAWYDPDAKRVDKGGCINVLTTQRPSPLAKGNPSHTNLVQVEKV - ->TtrA_Wolinella_succinogenes_NP_907142 -MEEGRRRFLLGSGVVAGSAAVVGYKETLGAVALLKDKGERAKDSIYGEAAEPEVRFESGRTLINPKYSIRPSVCNGCTTHCGIRVKINQESGAVERVFGNPYSLLSSDPWLPYNTPLKESLEVLSAQKESGLHHRSTACARGNAVYDKLNDSFRVTKPLKRVGKRGENAWVEISPEQLIQEILEGGNLFGEGEVEGLRSIRQLDKLIDEENPEYGSSANRLCVLGTADEGRQVVMVQRFVQSFGTVNFMGHTSICGLSMRAGEAAYLNDFVGYPHLKPDFKNCKFLLNIGTAPAHAGNPFKRQAKLLAQARTTGECRYVTVTPILANSDNIAVGERSRWLPVAPSGDLALVMGMIRLIIEEKRYLADYLAIPSLESQKALEEVSFTNATHLIIQKGEKEGQILKDSQGSPWVIDVKEGVLRDSKSVLRGELDFAGEVTLEGVSYEVKSAFLLLKESALAYTLEEYASFSGIDSKEIVHLAREFTSYGRSVGVDCHGGTMHTTGFYATYAVMMLGALVGNLNHKGGMSMGGGKFEDFNGEAYNLIAYPNKPKPQGARIDRARMAYEKTSEFKRKVAQGENPYPAKAPWYGLANALESDVITNSEEGYPYKLGALISWCANFIYGQSGSEHLLESLKDPKRAIPLFIAIDPFINETSRWADYIVPDSVMYETWGVVSPWGASLTKASHLRYPILPSPNAKWSNGEPVSMDSFIIELGKALGLPGFGKNGIVAKSGEKFPFDRPEELYLRAFENIALSGKAVPEISDEEIELAGLKEYASKLQAINGENWRRVAYVMARGGRFAPIEDAYKGDSLSRAYPKAISIYNEALGTSKNSLTGERYSGVPRFYAPRFTDGRALEEAGLGDSRSFLAFSYKSNVLSAPTTASRHLKELRYTTFVDMNSQSAKALGIVHGERVRVVSKGGFVIGICRLREGIHPRSIGIEHGAGREGEGAIDLLINGNVIRGEIARRSGVNINKLGLKDASKGKVGTLSDFVIGSNARQGIPVWIEKLS - ->RBG1_855 -MQVTRRDFLTFAGFTLAGITLGEWGRSKILAREEYKDTLYSGIGKEEFRLSICGQCPAGCGIVVRLMDGNPKKIDGNPLCPLSRGKLCPKGQNGLQVLYDPDRLTGPVKRKGKRGENDWEKISWEEAINTVSQKLKELKEKQNSYRLLILTQENKGLSGKLWKQFARAYGTPNLVEGNLLRDPGILWASYLMQGIKDYPAYDIENTKYILCFSPFLEGWYSPTWAQRMYGNFRRKRPEIRGKLVQIEPRLSPTAANADEWIQINTGTEAALVLGLAYLIIKEGRYDENFIREHTFGFEDWTDAQKRTHLGFKNFVLQEYDTEKVSSLTGVPIVTIIRLAREFSELNPALAIAEQRPASGGFYLQMAILALNALVSSLDVKGGVIIQREVPFKEFPEVSGSKKESILNQERFSSQEVFPHLTKAILEEKPYPIEIVLIDKINPFSHCFPIINFKEALEKIPFIVSFSPFLDETSLYADLILPDHTFLEKWQDVVPSATLGSPVLGISRPAVDPFLDTKNTADVILEIAHDRDILAYSTLPWKNYGELLKDSLQGIYLSRRGMTYGTSFQGAWMSQMEKGGWWSPTYTNFEEFWNQLLEKGGWWDPFYEHQKWDRVFKTPSGKFEFYSQIFKNQLASIKPSKENSDFKILPHWESVVWEGDENSFPLYLNVFELLMFSAVLNSNQPYLYEHITPHLSVQWESWVEIHPEKAKALGIEENDEVWVESVLGKIKTKAKLYFGTHPEVVSLPLGLSGLSQSSWIKKEISNPNQLVTGNSGNLENKYLRVKIYKA - ->QrcB_delta_proteobacterium_NaphS2_ZP_07200609 -MTMKITRRNFIAAVVGGVVGIQVTPLPWKFTDDAAIWTQNWPWVPVPAEGAVTEENTVCNLCPGGCGISV -RKVAERAVKIEGRTDYPVNPGGICPVGMGGLQLLYDDDMRFPGPMKRAGARGQGQFVNITWGEAYDILAG -RIAKLRKDGTPEALAAIDGNYAGTTTGLLVERFMRSVGSPNYVKPNAITDTYHMGNLLMMGKSVPMAYDL -ENSDFILSFGCGLLEGWGAPGRVMNAWGMWHDANPKNRKTRVVQVESRASNTASKADFWVAPRPGTDGAL -ALGIAHVLIKKGRVDERFINGFTYGFDDLTSSEGQSQPGFKTIVSNKYSPVQVERITGVDAGTIVALANA -FSKAKAPVAVYGKGKNNLNGSLYEFMAVQSLNAVKGRINRPGGVLVPDPLPLAPLPEFDPDEVAAKGLET -PRIDGAGTKAYPFTDSLINHFADAINQGARSPVDTLLVFSANPFFTVPDGPGFMNALEKIPFIVSFSPYR -DETANMADLILPDHTYLEKIEDIVWPVGLQYPLYGLTKPVVEPVNDTQHAGDVIISLSKAVGEATGSAFP -WENFEEALQARAKGLFDAGGGLVHYDASKPPWKFKPFGNGQKPSYKSFDDMWGEMKSGGMWFQPVKLAGM -DGLFATSSGKFEFVSQKLRQTINETAAQTSQKAALDQMGIRVAGAEAFMGHYAAPKLGVDRSKYPLFMVP -YEMINLSSGWIATPPFLYKTIFASQLLKEESFAAVNPETAAKYKLQQGDRAIVKSPVGELRVRIDLFEGA -MPEMVYMPLGFGHTAYDEYQKDKGVNPNNIVKALNDPVSGYPLWWNTPVTLTKA - ->ACTB1_Geobacter_metallireducens_GS_15_YP_384764 -MKRRTFLQLGTVIAAGAVLDGCRSKNEQLIPYLIPPDEGITPGKGTYYASSCNACPAGCGILVRVSEGRA -KKIEGNPEHPINRGKLCARGQAVVQELYHPDRVPHPLKRNGPRGSGAFTRISWQEGIGLLTDRLKALQRE -QSTNGLALLTPHLRGTLAELTGRFMRTFGSTNHVSYELLTPDLLRIAARRSFGQPTLPYYDIAETRYLLS -FGADFVDSHLSPVKYGSAFGEMRQGRDTVRGHFTYVGGRMSLTAASADRWMPAKPGSEGTLALGIARLIL -AESLYDSGALAMNGLEAKKLLAALDRYDLPRVAQLSGLPQGAIAEVAREFASTRPALALAGEMVAFQSNG -PESVRAVHLLNLLVGSLNRPGGIYPDAGSPSGPENSFAELIALIETMRGGHVKVAMIHGDPLYSVPPATG -FHDALAKVPFIVSFSSLLDDTALHADLVLPDHAALESWGDVIPVAGTREPLVGLMQPVVEPLFDTRQFPE -VLLATAHELGGRMAAALPDESYLELLKGAVRKQAGFGAGVDFEAAWVDLLQHGGLFKTKSVQPTGYRWSS -DAPPPLPEDPDFAGDQKTYPFHLIAYPATAFYDGRGAPYPWLQQLPDPMTTVVWGSWVEINPETAAEHGI -GFGDLVEVSSPQGTLRLPAVVYPGIRPDMVAIPLGQGHRGMGRYAQGQGVNPLALVARQGTKQQPAWNAT -RVRITRISGNGELVTAGHPQGSLRSELVEI - ->ACTB1_Geobacter_uraniireducens_Rf4_YP_001231524 -MKRRTFLQLSGMTAAGTVLSGCQSGNEKLIPYLVPPDEGVTPGKADYYASSCRFCPAGCGILVRVSEGRA -KKIEGNPAHPVNRGKLCAMGQAVLQELYHPDRVPQPLKRSGPRGSGAFTRISWEESLELLAGQLRALQRE -KATDRLALVTPQLNGTLVELTTRFMRVFGSPHHLSFDLLGPDWLRTATRRSFGQPGLPWYDVAETRYLLS -FGADFVEHHLSPVQYGYAFGRMRQGRDTVRGHFTYVGGRMSLTGASADRWMPARPGSEGALALGMARLIL -AESLSDAGSLAVNGLQTEKLLRRLEAYDLPRVAEQTGLPQRIIAEVAREFATTRPALAMAGETVAFQSNG -PDAVRAVQMLNLLVGNLNRPGGVYPDGGSRVGPENSFTELLSLVAAMRDGRFRVAMIHGDPVHAIPPATG -FQEALARVPFIVSFSSLMDDTALQADLILPDHAALESWGDVIPLAGTRDRVIGLMQPVVTPLFDTRQFPD -VLMAMADKLGGKTAAFPYQSYQEMLKGTMEKRVGRAARRDFETVWVELLRQGGLFETRQGQEKGYRRAPG -SSLPNPAEPRFAGDEKRFPLHLLVYPSIAFYDGRGAPLPWLQQLPDPMTTVVWDSWVEINPRTAAEMGIG -FGDLVEVTSPQGAMRLPAVIYPGIRPDMVAIPLGQGHRGMGRYARGRGSNPLVLLALITDGTETRPAWHA -TRVRLTRISEKGELVTAGHPQGSYRSELIEI - ->ACTB1_Geobacter_sp_M18_YP_004200644 -MKRRTFLQISGMTAASALISGCQSANEKLIPYLIPPDEGITPGKAVYYASSCRSCPAGCGILVRVSEGRA -KKIEGNPEHPVNRGKLCARGQALLQELYHPDRVPQPLKRSGPRGSGQFTRISWEEGLNLLTGQLKGLERA -GAAERLALMTPQLRGTLATLAATFMSSFGSPHHLSYELLAPDALRAANRASFGQPSLPWYDIAQTRYLLS -FGAEFVDHHLSPVHYGNAFGRMRQERDTVRGHFTYVGGRLSLTAASADRWMPARPGSEGALALGIARLIL -SESLHDRGALSANGLSATDLLAGLASYDLARVAELTGLSREAIAEVAREFATTRPSLAMAGEGVAFLSNG -PETLRAIGLLNLVTGNLNSPGGVYPDGSFPDGPENSFADLVSLVGAMAGGRIALALIQGDPLHRVPAATG -FPEALAKVPYIVSFSQIMDDTALQADLILPDHAQLESWGDVIPVAGGRFPLTGLMQPVVTPVFDTRQFPD -VLLAAAAALGGKTARALPFPSYQELVKKSVLQRAARVKGEEAEEIWTSLLQKGGDFREGPEQPKGYRWAP -GASLPAPQAPLFAGDERSFPLHLQLYPSTAFLDGRGAPLPWLQQLPDPMSTVVWDSWVEMNPKTAAGLGI -AHGDLVEVSSPQGSLRLPAVVYPGIRPDLVAIPIGQGMRGGGRYARGRGVNPLSLLAAKLKGTGPTPCWS -ATRVKLVRISGDGGLVTNGNPQGSYRSDLVGI - ->TtrA_Photobacterium_profundum_YP_133039 -MAALIMDRRQFLKMGAATTFTGGMAGISKATAGDSNQDISRYAPLSAEPEFILGPDNKLTNNPNQRFAFTKCFGCYNVCGARIRIDNNTDQILRVCGNPYALSTQSGNPVAMEVSPQEAMLQLVGEQGNENRATLCGRGNAVPDAITDSRRVTQCLKRVGKRGENHWQSISYEQLIKEVVEGGNLFGEGHVEGLSDIYDDKTVANPAYPDFGPKKNQLLMTGCSEDPARWGFYKRFSEASWGTPNIGNKDSYCGHQQVAGCALGVEDGANSGALPTTDFEHCEFAIFIGTNPGLSGISLNSASKRLADARTQNPNFKYVVIDPILRSLTSSSTPENCEWVPIRSSGDTALMHAMMQYIINNERYNKSYLASCSQEGAYKVSEINYTNAPYLVVTDKKHPLYRKFLTAAACGKGDADTKMVIDAKSQQLTTSDSSEPCNIKFSGKVTTEDGQAVKVETAFSLLAKRVNEHSMADYAAECQVPEAKIIELAKEFTSHGRRVSIETNTGCNASDGSQFAFAMIMLTTLVGAHNAKGGMLHTGSMGFENTSPLYDMMAFEHAHLSGFNAERSGDYRQSNEFKEKVKNGINPYPSEMPWNETFIQDNAGELLVAHANGNPFKFKAWIAWANNPLYACSGLKDQVEASIKDPKQLGLIIASDPYFNETNVYADYFVPDLAQYEQWGASRQWGSELMGDVVSFPIITPKTPLNAEGNRVCMEQFLIDVAKQIKLNGFGENAFKDTAGNAKAINTPEDYYIPVLANLAHSDEVLPTPTEEDVKFTSVDRIYSQLKERLKAEEIGPTMFLFTRGGRYLTVNSRYEGEFFNEMMRWDAQFQVYNEGLAHITNFHSGEYLDGLPVFDKQRFWDGTAIRDLWSENEYPFYFSTFKHQLRSPYSVALKSITALGVSNFIQMNENDAKKYGLTTGDKARIATPKGAAIEGIVQADTTVAKGCIAVPLGYGHTAFGASDITIDGKTLTGIPERKGGMAVNAFNAVDPTRKGASLYRDVTFGSTARHGIPMKIEKV - ->TtrA_Haemophilus_somnus_gb_ABI25172 -MNKQRRNLIKGALATTAATAFVAGYSPKVKEIAKGVIEGSSGQKTQDNINGNSLLPEYQVKEGNLLTNSQQVVCNTQCMGCWTLCGLRVRIDLEKNKVLRINGNPYHPLSSDHYLDYNQSIKQAELSVSGENGLQQRSTACARGAAFLDGINSPYRITQPLKRVGKRGEGKWKTISFEQLIDEVVNGGDLFGEGHVDGLKAIRDLQTPVNAQHPDFGAKVNQLMVTFAGPEGRQPLLKRFANNSFGTINFASHGSFCGLSYRAGSGAFMNDFANNSHAKPDWDHVEFILFMGTSPAQSGNPFKRQSRQLAKKRTEDNFEYVVIAPRLELTSTAAQDKNRWVPIIPGKDLSLALAMLRWIIENERYNEDYLSIPSEIAMQQANGVSFCNATHLFIADPNHKQYGQAIRNFHIEDLSEPEKLSDSDILVKDRQTGKFIAAKDCQSAVLFVEDRISLKDGSQVLAKSALQLFKESCFSYSIEEYSEQCGVPVDTIIQLAKKFTSHGPRAAVITHGGTMHSNGFYTAWAILLLNAMIGNMNKKGGMSMSGGKFKDFSAGPRYNLANFPNMVKPKGTNLARSKKDYEKSSEFKQKVAQGISPYPAKAAWYPFVGGQMSEMITSALQGYPYSLKAWINHMGNPIYGMTGIHHITQQKLKDPKILPLFISIDAFMNETTALADYIVPDTHNFESWGFSTPWAGVPTKTSTARWPVIASPNEKTSQGDTICMESFVIEIAKMMQLPGFGDNAILDKQNHSYPLNRSEDFFLRAAANIAYDGKQPVQDATQEDLLLTGVQRLMPSLQQVLKPEEIKKVATIYCKGGRFAPHSSAWQEDNMQARWKNCLQIWNENVAKAKHAQTGKNYHGCPTYFEDQFADNSTVESHYPKIQWPFKLISFKSNLMSSITAPLLRLHSIKPNGIVAINQQDATEYGLQHGDLVELNTPGGKAVVQLVVMNGVIKGTIAIEHGYGHKQLGATGYTINGKLIEGNAQIGSGVNINDLGLLDSTKEIASPWVDWVCGSAVRQGIPAKLVKLA - ->TtrA_Yersinia_enterocolitica_YP_001005907 -MAKSTRRQWLKGSLALGGVVAFGASYHAVARKTLAGLVDGSAGKLTLDPISGNALPTEGRVGPQWQANPQQAVSMTQCFGCWTLCGLRVRVDTQQNKILRIAGNPYHPLSHDHHFPYQLPVGEALQHLGGEQGMTGRSTACARGATLLEGVDSPYRITEPMKRVGPRGSGKWQRISFEQLVAEVTEGGDLFGEGPVEGLRAIRDLDTPIDAKQPSLGPKANQLLVTNAGDDGRDAFIQRFANQAFGTKNLGSHGAYCGLAYRAGSGALMGDLDKNAHVKPDWDNVRFALFLGTSPAQSGNPFKRQGRQLANARQRDDFNYVVVAPALPLTTTLANQHNRWVPVLPGTDAALAMGIIRWIIEQHRFNHAYLAIPGEMAMQAAGERSWTNASHLVITTETHPLAGQFLRANMLSGETVAEGEESPVLAQAIDGALQPAAQMLQAELFVTQDLTLHDGQNVQVQSGMTCLQQAAARFTLAEYSQQCGVPEATIIGLAREFTAYQRQAAVISHGGMMGGNGFYTTWAVMMLNAMIGNLNLKGGVSVGGGKFDGFADGPRYQLATFVGMVKPKGLPLSRSKQPYEKSEEYQQKIQQGQSGYPARGPWYPFVGGQLTEQLAPALAGYPYPLKAWISHMTNPLYGVAGLRNLIEERLQDPRQLPLFIAIDAFMNETTALADYIVPDTHNFESWGFSAPWAGVLVKASTARWPVVEPRTARTAQGEPVAMESFLIAVAKAMKLPGFGANAMQDSEGNSLSLDRAEDYYLRAAANIAYGGEKPLPAAVDDELRLTGVDRLWPALQRSLYPDEQRRVAYLLARGGRFAPYEKSWNGDATGSQWKKPLQIWNENVAKHHHAITGERYSGCPTWYPPRLADGSDVFQHYPVSDWPLRLMSFKSHLMSSSTAMIERLRAVKSTNLVAINPQDAQRNGIQHGDIVRLMTPGGQMEVQVSLLDGVMPGVVAIEHGYGHREMGSRAHTLDGVVMASDPRIGQGSNLNDLGFTDPTREIPNTWLDWVSGAAVRQGLPAKLQRIS - ->TtrA_Aeropyrum_pernix_NP_148724 -MVSRRDFVKGSIAIASLLVAGAGLQPVLSQLVRPKFERIAPDLQMGANVRYVYSSCLGCNVRCGIKARVVKVGDLEIVERIEGNPYHPYNRAVSLNGNGKLGSQHLRFYHLPYNTPVKEALTKWHGTLCPRGQDGIYYLYDPYRVLVPLKRAGPRGSGKWKPISWEQLIREVVEGGVIEETGERLPGLRDFFVYGKLREAGFEDPNAILSDMKKDVQEILEYAKKPETSYEDIVMKIEEFKEKWSKILGEKGLKLDDILIDPDRPDLGTKANMVAYLRGRGQGHTDYMSARWIAGFGSVNWLRHTSACQLGYYAANYLWAGYHDIQPDPVSSKVIIMAGASMGRLHPGTTGQGLLISRAGEGDLKIYYVNPTAPRTDAGGNIVWIPIKPGYDAALAFALIRWIIENERYNKEFLEIPNEEAAERKGYPVHSNATWLVIMEEGHEKWGEYLKAKDVGLEDSDKPVVFTGEGLATYDSVDNAEIDWEGEVVLTTGERVKVKTSFRILKDEALSRSIDQWLSVASPYEPGSSEFREWKEKVLEMARDFAEAAPMAGTYVHRGVGMHSNGEYAVWAYRALDTLVGNYHRKGGLLARAGHTKYNSYVYHVDKKGFGEPVKWGPPIDRHKAKYEDTLEYWLKVKKGENPYPAKRPWYPHTPEESYTEIFAGIAEEYPYKMGALILFYANPVLSANYGVKFIEVLKDTKKLPLFIAITTTINETMLYADYIVPDTTYLETGTLGMQYLYASSGGVLLAEAARSPVVMPLTQKIGEPERYASFWEFFIDTGKALGMPGFGKGAIKGLKYHEGKSYDLDSLWDYIMRVYANAAMHAKDMGIIPENVPEEEVKFVEENYPVAKFKHLIPDEWPYVAYMLARGGVFTSYEESFHPNGVSKRKVPSKRKKFKKTLMLWNEDLAKTRNSVTGAKFWGGPKYIPPSTYAPVKGGSKSFYGTPLREIYPESEYPFHLVFTTGPLFTKHRSQFYYAIKQISPENYLVVNPKDAEKLGLETGDVVEVETPTGRFKAPVVVEPTVPPGVIMVPYGMGRWADTVVKKPSYFEVKDSRLASLINELPEREEIPEEAVNPVKKLPELKKKVLFTKSTPAYYNQAEPDKWRFNGITPNVAEMSDPSLGGWPLLSIIGAAQAYYFNVARIRKTGEKHEFEKTYPYIVW - - ->PsrA_PhsA_Archaeoglobus_fulgidus_NP_071207 -MVTRRDFLKATALTATAISAGIKFQPKSYAEATAASGEVKFVPNICAMCPAACSIQVEVRDGKVHRIHGTPDHPINNGKICARGNAGVQRVYNPDRLKKPLIRTGEKGTWSFREASWEEALSLIASKVKEYREMGHPEYIGMLGGWLPCTYYKPFFKAFLAALGTPNGGGVPEALCFLSKALGWKSAYGFGAHPELLTDYENARYVIMLRRNVAGSISVVHGWRLGQNRRKFKLVVLDPRYSETAAKADVWLPIKPGTDLAFLLAMMNVIINEKLYDSNFLAKYSNAPMLLKDGKPFKVWDENGKKKYLVFDLAKGAAVEHDSAMLPALEGEYEVEGEKVIPAFEALKRRVAEYTPEWAEGITDIEAKKIREIAREFALRRGVIDSGWHGPKYRNSLLTWRAAAIVNALVGSVNNDGGLLFTGLAQFVTSKESTTEAPSQSVLRMWAEKRGIATAFLGHTVQAFYDAIVNEDPYPIKMLFVVGHNLLMNMPERQKWEEALKKLDFMVAVDILPQDHLYYADVVLPESTYIEKDDPLFPIAYAPAFGFHTRVKAIEPIYDTKHVIEMMVEIASRLGTEDTFFKALSKGLGVDAEKLKSYYHGEGVAGIRRAQAEAKGVNYNELLSKGYVLKAGRDKIVYNMPYKQPLPTPTGKVEIFSFMLANFASKASEPYWDALIKWVPPKVSERKLGSNEFYLAYSRSPFTTHSSTSDNPLLAKLIDDAELYYKGIWINSERAAELGIRNGDRVVVESVFTGDKTEAIAFVNELVRKDTIFTVSGFGQSSERLTNIPQRGMTMMRLIPLQFDTLSGTIMSQETIVRITKA - ->PsrA_PhsA_Thermus_thermophilus_YP_004130 -MQRREFLKLSALGVGAMALRGSGPAKALKAPWYAQEVKSVYQICEGCFWRCGIVAHAVGNRVYKVEGYEANPKSRGRLCPRGQGAPQTTYDPDRLKRPLIRVEGSQRGEGKYRVATWEEALDHIAKKMLEIREKYGPEAIAFFGHGTGDYWFVDFLPAAWGSPNAAKPSVSLCTAPREVASQWVFGRPIGGHEPIDWENARYIVLIGHHIGEDTHNTQLQDFALALKNGAKVVVVDPRFSTAAAKAHRWLPIKPGTDTALLLAWIHVLIYEDLYDKEYVAKYTVGFEELKAHVKDFTPEWAEKHTEIPAQVIREVAREMAAHKPRAVLPPTRHNVWYGDDTYRVMALLYVNVLLGNYGRPGGFYIAQSPYLEKYPLPPLPLEPAAGGCSGPSGGDHEPEGFKPRADKGKFFARSTAIQELIEPMITGEPYPIKGLFAYGINLFHSIPNVPRTKEALKNLDLYVAIDVLPQEHVMWADVILPEATYLERYDDFVLVAHKTPFIQLRTPAHEPLFDTKPGWWIARELGLRLGLEQYFPWKTIEEYLETRLQSLGLDLETMKGMGTLVQRGKPWLEDWEKEGRLPFGTASGKIELYCQRFKEAGHQPLPVFTPPEEPPEGFYRLLYGRSPVHTFARTQNNWVLMEMDPENEVWIHKEEAKRLGLKEGDYVMLVNQDGVKEGPVRVKPTARIRKDCVYIVHGFGHKAPLMRLAHGRGASDNYLQTRYKLDPISGGAGLRVNFVRLEKAERPRLPSLTGLAKRPFDERRM - ->PsrA_PhsA_Moorella_thermoacetica_ATCC_YP_429324 -[MLEQKITRRTFLKGSLAAGALATFGGKLIPIEPAKAAAAGQAETRVVPTLCEMCGVKCGVLAHVRDGRVWRLTGNPRDPQSGGRLCARGNAGTKTLYDPDRLKGPMKRVGEGQFQPISWEQAFQEIGSKLKELKEQYGPQSLVWLAHPELISPLEKHFMAAFGSPNYTGHGPTCYSSRNVAFEQMYGGVPGVDYRNVRYYIAFGRNLTGGIKNPDVQKIVAAKAEGAHLVAVDPRLSDFAYFADEWLPIRPGTDLAMVLAMINVLINENLYDAAFVAAYTTGFEELKKGVSGYTPAWAAGITGIEAGTISRIARELAAAKPAAAVDPGWHAVTGSQYGNSVQAGRAIAALNALLGNLGARGGLSLPPTIKLGSPAGIMGPKPPAATAPRWDGAGSEKWPLNKDHGMIQTFPERVKQDQPYPVKAVIIQHLNPVRSSTDSLAFIEALKKLDLVVAIDIQMNDTAYYAHYILPEATYLERYDPLMTVGNKVLLRQPAIKPLFDNKGAEEIIAGIGRAAGLSEYFNFTLEQYNDALLGPLGLTQAQLALTGVAEVEASKPDYSKLKTPSGKIELACPAFVKAGSTLTPAWEPPLVEPRDDSFRLIQGHVPMHTHTTTDNNSYLHAIMPENELWIHTSRAGKLGIKTGDLVEVASKVGKVRVKARVTEAIHPEAVFLAHGFGCRVPLRHLAYNRGANGGDLIPIMTAPVSGAAAQCETLVTVRKAG - ->PsrA_Wolinella_succinogenes_NP_906381 -MTRRDFLKSAGAAGAAGLVWSQTIPGTLGALEKQEIKGSAKFVPSICEMCTSSCTIEARVEGDKGVFIRGNPKDKSRGGKVCARGGSGFNQLYDPQRLVKPIMRVGERGEGKWKEVSWDEAYTFIAKKLDEIKQKHGAHTVAFTARSGWNKTWFHHLAQAYGSPNIFGHESTCPLAYNMAGRDVFGGSMNRDFAKAKYIINMGHNVFEGIVISYVRQYMEAIENGAKVVTLEPRLSVMAQKASEWHAIKPGHDLPFVLGFMHTLIFENLYDKKFVQKYCTGFEELKASIEPCTPEKMALECDIPADTIKRLAREFAKAAPKAIFDFGHRVTFTPQELELRRAMMMVNALVGNIERDGGMYFGKNASFYNQFLGEEDPKAKGLKKPKTPAYPKVEVPRIDRIGEKDGEFFLANKGEGIVSLVPKATLNELPGVPCKIHGWFIVRNNPVMTQTNADTVIKALKSMDLVVCVDIQVSDTAWFADVVLPDTTYLERDEEFTAGGGKNPSFGIGRQKVVEPLGDAKPGWKIAKELSEKMGLGEYFPWKDIEDYRLQQVDGDLDLLAKLKKDGSASFGVPLMLQEKKSVAEFVKKFPGAASKVNEEGLIDFPKKIQLFSPKLEEVSGKGGLGYEPFKYKEEDELYFVQGKTPVRSNSHTGNVPWLNNLMEYDAIWIHPKTASKLGIKNGDAIELYNKFSSQKSKALITEGVREDTLFGYFGFGHVSKDLKRAYGKGVNSNALMPSFTSPNSGMDLHVFGVKVKKA - ->PhsA_Wolinella_succinogenes_NP_906934 -MEIEISRRRFLQGSVALTIVGASSGALAVGGSSGNKTESQEKGERSVATLCEMCVNKCAAIARVKDGKVIKLDPNPLFPKSRNMLCARGNAGIKALYDEDRLKYPLIRAGERGDGKFKRVTWDEAYTYIQEKLVKIMDEEQDNRSAIGFCAGEGMGEHHFKEFNKVFGSSNWLNHSSVCLQSTVSGYTLTIGTYGNPDLANAKYVIMAGANRAEAIVTPDTMDLFKRTLGRGCQLVVIDPRYSHTAHKADLWLPIKAGTDLAFVLALTHVVLSEEIYNKKFVEEKFNGFEEYKAHILQQNYTPEWAEPITGISASDIRKVARDFMACAPQAIYYPGRRTTWAKNDFQLRRAMAIFTALGGGVDVKGGICYGKTLPIDEHSIPAPMYANAKSRIEQNKAAIVGGTGSWVAWRDMVAAKETPYPIRGMFIYKQNPMHCVPNTAKTAQMFKNMDLVVTIDTMPSDTAIMSDVILPECTYLERTDPVKSFGGIEPAIAQRNKVIEPLYETKPVLQILRELTAKLSRPLFENSLKHDEDLQEMIEEKASELASSNPNKGEEELKKLAIEEVFEDEMEGWDISQGYAHSEEEMNEHAVAKYAGAHEMLLKHGVFYPGINEQFKQVSANEYVYYPESKKAYSMRNGQFNTPSKKVECVIPSLASKGIDTMPTWREEYLPKTPAGQFRFVTGRHAQFTQSSTANNALLLDTMSENFIWINKRVAKERGIKFGDLLEISSKAGKTRIKAYPTEKIAPDTVFFVHGFGVQSKAMSRAYQNGGHDSMIIEEHIEPVFGAAAAHETLVEIRKV - ->PsrA_PhsA_Thermosinus_carboxydivorans_ZP_01667237 -MKKFSRRTFLKLSGAATAALAAAPTLPRMASLAANIQLEGSAEFKASYCEMCTSRCPIQAKVVDGKTVLI -NGNPEWAATGGTVCARGGSGFSQLYDPQRLKKPLIRTGERGEGKWKEVSYEEAYAYIAEKMQDIKARYGP -EAMAFACRKGPHMGYLYTLAKAYGSPNTFNHESTCPMAKTVALEATFGTAALGIDYANVKYLVTFGRNFF -EGIHVAQTRGVMTAVSKGAKLVSFDPRFSLTSAKAHEWFAIRPGTDLAVVLAINHVLIRDGLYDRDFIDK -YTEGFEAVKASLTACTPAWAEQESGVRAADIERIARELAAARPRAVVEFGWRTTSTPEEFELRRAIIITN -LLLGNLEVPGGTFFVKSANFINSLVGKPVIQPIAGPKLPPFPQPGRPRIDGAGSKGQPYSLVPPIDGVVQ -TIPEAALTGKPYPIRGWFIYRYNPVLTIPDTNRVIEGLKKMDLVVVCDINMSDTAWYADVVLPESTYLER -DEGFNDYSGAVPVYTLRQKVVEPLYDTRPHWQIFKELAEKLGLGAYFPWKDVEELRLIQMGGKADLVRMG -KEKGFVNFGLKPLFLRDRASVAEFVAKFPEAKELVNTQGIIDKPLLNLKTKSKKIELLSTEAEELFGRGV -PVYRPVKLAEAGEAYFVQGKVAVHTNGHTHNVPWLYNLMSENRLWLNPATAAKLGLKDGDKAILKTRTGQ -QQVKVLVTEGVRPDTVFGYFGFGRLSPGLGRAYKKGINSNLALPLVTADVCGSTIQTTGVTISKV - ->PsrA_Carboxydothermus_hydrogenoformans_YP_361367 -MKLTRRSFLKASAATGALAALSGGVMSFERWAAKAAETGEVKLIPSICEMCGTKCGIIVKVKNGRVVKIE -GNKEHPNGKGKICARGNAGMKLLYDPDRLKQPLKKEGDRFVPISWEQAFREIGEKLKEIKAKYGPEALVW -STHPELAYDYEVIFNQAFGSPNLSAHAPTCYSPRNVAYKTMYGEVPTVDYGNVKYYISCGRNLVEGINVS -QVTGIMKAKEKGAKLIALDPRYSNFAALASEWVPIRPGTDLAFLLAMIHLIIKNEWYDKEFVKNYTIGFE -EVAAEVEKYTPKWAEEITGIPAATIERITEEFAKAKPAAVVDPGWHTSRYMNSTEMVRAGAVINALMGNL -GMKGGLKFPKYKFTKVEEREGLWPKLEKPKAKRFDGAGGEKWPLAKGLGMIQMLPEHILSGQPYPIKAYI -VNHHNPVRSAGNSQKWIEALKKLELLVVIDVQMSETAMMAHYVLPESTYLERFDPPQIAGNAVALRQPAV -KPLHNTMGVDDIIKELAHEAGIGQYFNFTLEQFSDQMLKPFNVTFKQLVEKGVIALDDGKTEYKVPEIKT -ESGKIELASSAFEKAGAKKVPTWVPPGVTEGNGKLRFLHGHTAVHTHTSTFNNEYLHALMPENVLWINTR -TAEKLGIKNGDLVEVKSDYGKVTIKAKVTEAIHPDAVFMVHGFGGFSPYQKKAYKKGASTSFIIPCHVEP -VSGASADCEVLVEVRKVGGGANA - ->PsrA_PhsA_Acidiphilium_cryptum_YP_001233491 -MQRRDFIRMSSAVASAALLGPTLAGCSRPAEWQRMMTEAPATETPTVCNICFWACAAKVHTRGERLWKIT -GNPEDAHCEGRLCTRGTGGVGAYYDPNRLVRPLVRMGKGADQRFEVASWDNALGLVAERMEKIAREHGPD -RLAALVHGPGAAHFSHLVRAFGSDSIAEPAFAQCRGPRDTGFFLTFGQGFGSPEQTDMAKARCIVLIGTH -IGENLHNSQVRTFTDGIRNDATIIVVDPRFSVAAGKANHWLPIRPGTDIALLLAWMNVILAERRYDAGYV -ARNTVGLEALCAHVAPFTPEWAYGETGIEPALIRETARLMAAAAPATVVHPGRHSTWWGDDTQRARAMAI -LAGLLGIWGREGGYYLPESVALPAYPVPAYPVPKTSWREIALPVFPLAGAPVTNVILDNAHGADAHYKGL -IVYDTNLPMTMPGIRRTLEAAAQSLELIVAVDVQPAEVTGYADVVLPECSYLERHDPLRNSGERYPALAL -RAPALPPRGESKPGWWIAREIGTRLGLGRYFPWTDYTEVIDWQLRQVGSSLKELETTGIRAFPRRTPAYF -APGETPRFATPSGKIELFSATLQQAGFDPLPRYTRPEAPPADHFHLNYGRAPQHSFSRTQNNPVLYQLMP -ENLVWIHPTAARRFGIRNGTYVRLVNQDGVVSNKVRVRVTERTRPDSVWLVHGFGHTAPGLSLARGRGAD -DSALMTRVLYDPIMGGTGMRGNFVTFRKENA - ->PsrA_PhsA_Geobacter_lovleyi_ZP_01593406 -MPIMSRRSFLKTSGICTAGAIAATYLPDQFLLWAGEKGLAKTEKITTYCEMCFWKCGAIATVVGGRVVKL -EGNPLSATAKGKLCGRGNGGIGLLYDPDRLKHPLIRTGKRGEGQFRKASWDEALTHIADKLKKIKEEHGP -ESLALFTHGSPTEHFMPLLQGFGSNNFAMPSFAQCRGPRVVGYELTYGDDIGSPERLDMANSKVVVLIGS -HLGENMHNSQVQEFTDAIGNGAKIIVVDPRFSVAAGKAHHWLPIKPASDMALILAWINIIIREGWYDREY -VAKYTHGFDKLAAAVQQYTPEWAEKETDIPAAQIMATAREMGLHRPAVCIHPGRHVTWDGKDVQRSRAIA -ILGAILGTWGREGGAYLATRGSFPAVPPPSFPASNRPTLKKGGFPLGGAEGVTNAIREATSIGEPYPVKA -WMVTGTNLLAAMPGQKETIEAISKLDLLVVVDVIPSDTSLYADVVLPECTYLERHDGLIIGKGRALSASI -RQPAVAPMYDSKPAWWIAKELSKKLGLEDYFPWENFEDRLNELCLTYNIDYDELKQKGVISFPDTAKPFI -TADNQPVFKTKSGKIELYSKELEELGFEPIPAYEKNEEPPQGFYRLLYGRSAVHTFSRTVNNPALNELYK -ENELWLSSVQARKMGLTDGQYVALQNQEGITSNRVRLKVTERIREDCVYMVHGFGQQSKGLTKAFRRGAD -DQQLISSYPVDPICGGTGMRCTFVKLVKGA - - ->TtrA_Pyrobaculum_arsenaticum_YP_001152643 -MTSRRTYLKAIAAAAALGVALWGYWPVVDKIIKPKRNPYGPDPQYGKNVRYVHTTCLGCNVRCGIRVRVV -KYGDVEVIERIEGNPYHVYNRAVSFDSQVKRYKQLPYNTPVKEALERWSGTLCPRGVDGIHYVYDPYRVL -KPLKRAGPRGSGKWKVITWEQLNNEVVNGGIIEETGERLPGLKDFFVYGKLKEAGFEDPNAVLSEMKADV -DNIMKIARDPNKTYDELVKAIEGFKAKWSQKLGEKGLKLEDVFIDPDRPDLGTKANMVMYLRGRGQPPTD -YFSQRWIYAFGSVNWTRHTSACQLGFYTGNRIWAGYTDIQADPVGAKVIIGAGWSMGRLHPGATGQGLII -ERACEGDLKLYYINPVAPRTPCNGNIIWIPVKPGEDATLAFAVIRWLIENKRYNEEFLSLPNRDSAKKAG -YPVNTNATWLVITEGQRFGEYLKARDIGLENSDKPVVWTGEKFATYDSVDKADLYYVGKVTLPTGEAVAV -KTAFMILREEAFSRSFEEWLAIASPYEPGTPEFRDYVKKVEQMARDFADAAPRAGTMIHRGVGMHPNGEY -ITWAYRAIDTLIGNFHRMGGLLGRAANTSYLSYVYNVGYSGFGEPPRWGPPIDRHNYAYEATLEYWLRVK -EALKEGKSWEDAVKAAFPTKRPWYPLTPEESYTEIFAGIAEGYPYKIGAFIMFYANPVLATNYGVKFVEV -LKDTSKIPLFIAITTTINETAMYADYIVPDTTYLETGTMGVQFLYATSGGVTLAEPWRSPAIMPLTQRIS -DCPNGHPRYASFWEFFIDTAKALGMPGFGDRAVPGVKGKKYEGRWFPLHCEWEYVMRVFANAALDAKDRG -LIPEQVPEEEVKFVEENYPIAQFKDIIPPEEWKYVAYGLARGGVFTSYEQSFDERGVSKRSVPGRGTLYL -WDETLAKTRNSVTGEKFWGGPKYFPIATYAPAGPAFQKADKWLHGTPLRQLYPEKDWPFMLVFYTGPIYT -KHRSQFYYWIKQIAPENFVLINPEDAAKIGVETGDVVRVETPVGFFEAPAVVEPTVAPGVIMVPYGMGRW -ADTVLVKPKYFELRDAKLKLTVDGLPEKMEVPEDAVNPVKGLPDVVKKILFTKSPAEYYEKGLAPDKWRF -NGVTPNVVQMSDPSLGGWPLLSWLGASQAYFDTPVRITKTGQKHKFETPYIVW - ->TtrA_Pyrobaculum_aerophilum_NP_559177 -MTSRRAYLKAIAAAATLGIALWGYWPVVDKIIKPKRTPYGPDPQFGTNVRYVFSSCLGCNVRCGIVARVV -KYGDVEVIERIEGNPYHVYNRAVSFDKQIKRYAPLPYNTPVKEALEKWSGTLCPRGADGIHYVYDPYRVL -KPLKRAGPRGSGKWKAITWEQLINEVVNGGVIEETGERLPGLKEFFAYGKLKEAGFEDPNAILSEMKIDV -DNIMKVARDPNKTYDDLIKAIEEFKAKWSQRLGEKGLKLEDLLIDPDRPDLGTKANMVMYLRGRGQGHTD -YFSQRWIYAFGSVNWTRHTSACQLGYYAGNSIWAGYHDIQADPIGAKVIIGAGWSMGRVHPGATGQGLMI -ERACEGELKLYYVNPVAPRTTCNGNIIWIPVKPGEDAALAFAVIRWLIENKRYNEEFLSIPNRDSAKKLG -YPVNTNATWLVITEGERFGEFLKARDVGIEDSDKPVVWTGERFATYDSVDKADLYYVGKVTLPSGETVTV -KTAFMIVRDEAFSKSFEDWLAIASPYERNTPEFADYVKKIEQMAKDFADAAPKAATTLHRGVGMHPNGEY -IVWAYRTIDTLVGNFHRMGGLLARAAHTAYENYVYNVGRSGFGEPVRWGPPIDRHRYAYENTLEYWLRVK -KALKEGKSWDEAVKAAFPTKRPWYPHTPEESYTEIFAGIAEGYPYRIGALILFYANPVLATNYGVKFIEV -LKDPAKLPLFIVITTTINETALYADYIVPDTTYLETGTMGIQYLYATSGSVTLAESWRSPVIMPLTQRIS -DCPNGHPRYASFWEFFIDTAKALGMPGHGDKAIPGVKGKKYEGKWFSMHCEWEYILRVFANAALDAKDKG -LIPEDVPEEEVKFVEENYPIAQFRDILPPDEWKYVAYGLARGGVFTKYEESFDERGISKRRVPGRGTLYL -WSEEVAKTRNNVTGEKFWGGPKYFPIATYAPAVPAFQKADEWLHGTPLRQLYPEKEWPFILILYTGPLYT -KHRSQFYYWIKQVVPENFVLINPEDAAKLGVETGDVIKVETPVGAFEAPAVVEPAVAPGVIMVPYGMGRW -ADTVVVKPKYFELKDARAKSLIDELPDKVEIPEDAVNPVKHLPDVVKKLLFTKSPAEYYEKGLAVDKWRF -NGVTPNVAEMADPSLGGWPLLSWLGAAQAYFDTPARIVKTGQRHKFEVPYIVW - ->NarG_Pseudomonas_stutzeri_gb_AAZ43099 -MSHLLDQLRFFNRKQGEFADGHGETRIESRDWENVYRSRWQYDKIVRSTHGVNCTGSCSWKIYVKNGLIT -WETQQTDYPRTRNDLPNHEPRGCPRGASYSWYIYSANRLKYPKVRKPLLKLWREARRNMTPVDAWASIVE -DKAKAESYKSKRGMGGFIRSSWDEVNEIIAAANVYTVKQYGPDRVIGFSPIPAMSMVSYAAGSRYLSLIG -GVCLSFYDWYCDLPPASPQIWGEQTDVPESADWYNSNYIIAWGSNVPQTRTPDAHFFTEVRYKGTKTVAI -TPDYAEVAKLTDLWLNPKQGTDAALAQAFAHVIFKEFHLEKPSEYFRDYAKRYTDLPVLVRLNEKDGSYI -ADRFLRASDLADNLGQENNPEWKTIAVDGSTGELVSPLGSIGYRWGEKGKWNIEAREGKDGRDVDLSLTQ -IEGGETAEVAFPYFGGILHEHFQHAEGESIQLRRVPVRTITLADGSTTKVATVFDLMAANLGIDRGLGGG -NVASSYDDASVPGTPAWQEVITGVSREKAIQIAREFADNADKTHGRSMIIVGAAMNHWYHMDMNYRGLIN -MLMLCGCVGQTGGGWAHYVGQEKLRPQCGWLPLAFGLDWSRPPRQMNGTSFFYNHSSQWRHEKMSIHEVL -SPLADKSQFPEHMLDYNIRAERAGWLPSAPQLNRNPLQICRDAEAAGMSPVDYVTQSLKDGSLKFACEQP -DNPDNFPRNMFVWRSNLLGSSGKGHEYMLKYLLGTKNGVMNEDLGKRADGFKPTEAEWQDEGAIGKLDLV -TTLDFRMSSTCVYSDIVLPTATWYEKDDMNTSDMHPFIHPLSAAIDPAWEAKSDWEIYKGIAKAFSKMAE -GQLGVEKDLVTVPLLHDSPGELAQPFGGTDWKTAGVDPQPGKNCPNMAVVERDYPATYKKFTSLGPLLDK -LGNGGKGINWNTQDEVDFLGELNYKVRDEGVSQGRPQIESAIDAAEVILSLAPETNGHVAVKAWAALSEF -TGRDHSHLALPKEHEAIRFRDIQAQPRKIISSPTWSGLEDEHVSYNAGYTNVHEYIPWRTITGRQQFFQD -HPWMQAFGEQLMSYRPPINTRTIDYVKGKKSNGNPEIVLNWITPHQKWGIHSTYSDNLIMLTLSRGGPIV -WMSEVDAKKAGIEDNDWIECFNANGALTARAVVSQRVMEGMVMMYHAQERIVNVPGAESTKTRGGHHNSV -TRVVLKPTHMIGGYAQQAYGFNYYGTVGCNRDEFVVVRKMAKVDWLDGPNGNDLPQPLPQDI - - ->NarG_Pseudomonas_fluorescens_gb_AEV63780 -MSHLLDQLRFFNRKQGEFSDGHGETRKESRDWENVYRSRWQYDKIVRSTHGVNCTGSCSWKIYVKNGLITWETQQTDYPRTRNDLPNHEPRGCPRGASYSWYIYSANRLKYPKIRKPLLKLWREARQTLPPVEAWASIVEDKAKADSYKSKRGMGGFIRSNWEEVNEIIAAANVYTVKEHGPDRVVGFSPIPAMSMVSYAAGSRYLSLIGGVCLSFYDWYCDLPPASPMVWGEQTDVPESADWYNSNYIIAWGSNVPQTRTPDAHFFTEVRYKGTKTVAITPDYSEVAKLTDLWLNPKQGTDAALAQAFNHVIFKEFHLDKPSAYFTEYAKRYTDLPVLVMLKPMLGAAPGAGYQPDRFLRASDLTDNLGQDNNPEWKTIALDAAGELVSPQGSIGYRWGEKGKWNILPREGGEGREIDLKLSLIGGDVAEVAFPYFAGEAQEYFQHVAGDAVQFRRVPVHSVVLADGSVAKVATVFDLSAANLAIDRGLGGANVAKDYNDASVPGTPAWQEQITGVSREKAIQIAREFADNADKTRGRSMIIVGAAMNHWYHMDMNYRGLINMLMLCGCVGQTGGGWAHYVGQEKLRPQCGWLPLAFGLDWNRPPRQMNGTSFFYGHSSQWRHEKMSMHDVLSPLADKSQFPEHALDYNIRAERAGWLPSAPQLNTNPLHICRDAAAAGMEPKDYVVKSLQDGSLRFACEQPDSPVNFPRNMFIWRSNLLGSSGKGHEYMLKYLLGTKNGVMNEDIGHSTECKPTEAEWVDEGAIGKLDLVTTLDFRMSSTCVYSDIVLPTATWYEKDDMNTSDMHPFIHPLSAAIDPAWESRSDWEIYKGIAKAFSAMSVGHLGVEKDLVTVPLMHDSVGELAQPFGGTDWKSAGVAPVPGKNAPNLQVVERDYPNIYKQFTSLGPMLEKLGNGGKGINWNTDTEVKFLGELNHKEVEAGISQGRPKIDSAIDAAEVILSLAPETNGHVAVKAWAALSEFTGIDHSHLAISKEHEAIRFRDIQAQPRKIISSPTWSGLEDDHVSYNAGYTNVHESIPWRTITGRQQFYQDHPWMQAFGEQLMSYRPPVNTRTIAGVKGKRSNGETEIVLNWITPHQKWGIHSTYSDNLLMLTLSRGGPIVWLSEIDAKRAGIEDNDWIECFNVNGALTARAVVSQRVKEGMVMMYHAQERIVNVPGSETTKTRGGHHNSVTRVVLKPTHMIGGYAQQAYGFNYYGTVGCNRDEFVVVRKMVKVDWLDGSSGDDLPRPLPTDIEEN - ->NarG_Halomonas_maura_gb_AAT47523 -MSHFIDRLNFFRKAREPFANDHGEVRDESRGWEDGYRQRWQHDKVVRSTHGVNCTGSCSWKIYVKNGLVTWETQQTDYPRTRPDLPNHEPRGCPRGASYSWYLYSANRLKHPLVRKPLLKLWREALEEKGDPVDAWASIVEDPAKTKQYKRARGMGGFVRADWNELNELIAASNVYTAKQYGPDRIIGFSPIPAMSMVSYAAGSRYLSLIGGVCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNSGYIIAWGSNVPQTRTPDAHFFTEVRYKGTKTVSVTPDYAEVSKLTDEWLSAKQGTDAALAMAMGHVILKEFHLDRPSAYFTDYVRRYTDMPCLVELEAREDGSYVPGKQLRASDFEASLGQDNNPEWKTVAWDETRDQLVVPRGSIGFRWGEEGKWNLEPRDAEGAEIKTRLSLAEAHDDVARVAFPYFGGIAHEHFDHVKSGGASDELLFHSLPAKRLTLADGREILAVTVFDLMCANYGIDRGFRSQEGKEGEDDGATAYDQVKPYTPAWQEKITGVPAEQCLRIAREFADNADKTHGRSMIIVGAGMNHWYHMDMNYRGLINMLVMCGCIGQSGGGWSHYVGQEKLRPQTGWLPLAFGLDWQRPPRHMNSTSFFYNHSSQWRYXKLEIKEILSPLAKPADYSGSLIDFNVRSERMGWLPSAPQLATNPLSLAGKAAEAGQSTADYVVDQLKAGGLRFAAEDPDDPQNFPRNMFIWRSNLLGSSGKGHEYLLKYLLGTRHGIQGKDLGEDGGQKPEEVVWHEAAPEGKLDLLVTLDFRMSTTCLYSDIVLPTATWYEKDDLNTSDMHPFIHPLTAATDPAWESRSDWDIYKGIARAFSKACVGHLGEETDLVTLPLQHDSPAELAQPEVKDWKRGECEPIPGKTMPALVEVKRDYPATYERFTSVGPLLDSLGNGGKGIGWKTEKEVELLGKLNYVKTEGPAKGRPRIESAIDAAEVILTLAPETNGQVSVKAWEALSKITGRDHRHLAEPKEEEKIRFRDVVAQPRKIISSPTWSGLEDEHVSYNAGYTNVHELIPWRTVSGRQQFYQDHAWMRAFGESLLVYRPPIDTKAAVSLADDKGNGNPEIALNWITPHQKWGIHSTYSDNLLMQTLSRGGPIVWLSKDDARSIGVEDNDWIELYNANGAIAARAVVSQRVKNGMAMMYHAQERILNMPGSEVTGTRGGIHNSVTRVCPKPTHMIGGYAQLAYSFNYYGTVGSNRDEFVIVRKMKKIDWLDGEGNDYEQEAVK - ->NarG_Escherichia_coli_NP_415742 -SKFLDRFRYFKQKGETFADGHGQLLNTNRDWEDGYRQRWQHDKIVRSTHGVNCTGSCSWKIYVKNGLVTWETQQTDYPRTRPDLPNHEPRGCPRGASYSWYLYSANRLKYPMMRKRLMKMWREAKALHSDPVEAWASIIEDADKAKSFKQARGRGGFVRSSWQEVNELIAASNVYTIKNYGPDRVAGFSPIPAMSMVSYASGARYLSLIGGTCLSFYDWYCDLPPASPQTWGEQTDVPESADWYNSSYIIAWGSNVPQTRTPDAHFFTEVRYKGTKTVAVTPDYAEIAKLCDLWLAPKQGTDAAMALAMGHVMLREFHLDNPSQYFTDYVRRYTDMPMLVMLEERDGYYAAGRMLRAADLVDALGQENNPEWKTVAFNTNGEMVAPNGSIGFRWGEKGKWNLEQRDGKTGEETELQLSLLGSQDEIAEVGFPYFGGDGTEHFNKVELENVLLHKLPVKRLQLADGSTALVTTVYDLTLANYGLERGLNDVNCATSYDDVKAYTPAWAEQITGVSRSQIIRIAREFADNADKTHGRSMIIVGAGLNHWYHLDMNYRGLINMLIFCGCVGQSGGGWAHYVGQEKLRPQTGWQPLAFALDWQRPARHMNSTSYFYNHSSQWRYETVTAEELLSPMADKSRYTGHLIDFNVRAERMGWLPSAPQLGTNPLTIAGEAEKAGMNPVDYTVKSLKEGSIRFAAEQPENGKNHPRNLFIWRSNLLGSSGKGHEFMLKYLLGTEHGIQGKDLGQQGGVKPEEVDWQDNGLEGKLDLVVTLDFRLSSTCLYSDIILPTATWYEKDDMNTSDMHPFIHPLSAAVDPAWEAKSDWEIYKAIAKKFSEVCVGHLGKETDIVTLPIQHDSAAELAQPLDVKDWKKGECDLIPGKTAPHIMVVERDYPATYERFTSIGPLMEKIGNGGKGIAWNTQSEMDLLRKLNYTKAEGPAKGQPMLNTAIDAAEMILTLAPETNGQVAVKAWAALSEFTGRDHTHLALNKEDEKIRFRDIQAQPRKIISSPTWSGLEDEHVSYNAGYTNVHELIPWRTLSGRQQLYQDHQWMRDFGESLLVYRPPIDTRSVKEVIGQKSNGNQEKALNFLTPHQKWGIHSTYSDNLLMLTLGRGGPVVWLSEADAKDLGIADNDWIEVFNSNGALTARAVVSQRVPAGMTMMYHAQERIVNLPGSEITQQRGGIHNSVTRITPKPTHMIGGYAHLAYGFNYYGTVGSNRDEFVVVRKMKNIDWLDGEGNDQVQESVK - ->II_OP1_uncultured_candidate_division_UNIPROT_TREMBL_H5SSA4 -MHLRRLSRRTFLKAAVATSAATAVLSHWPRSGRGIQEGATPAQERWVKSVCLQCPAACGI -MVRVVKDSLGERAVKIEGNPNHPSNQGGICPKGHIGLQILYDPDRLQGPLRRVGPRGEGK -WEPISWEEALQIVTERLKKLRERGEPHKLVIMSGRNRGQMGALIDRFLAAFGSPNHVGHS -SICSDGAKLAHYLTQGFKHYAAYDWDNCNYLLSFGAGFIEAWRPTVRLLRAFGHMRRGRP -IRAKIVQIETRFSVTAAKADEWLPINPGTDGALALAIAHVIVREGLYNKKFVEEHTFGFE -DWEDEQGHFHQGFKTLIRQYTPAWAAPITGVPEETIVRIAREFATTPPQIAAGQRGAMMQ -TNGIYNYMAIHALNALVGSIDAPGGVLVQIDPPLTPWPPLAQDEIAQTGVKQPRIDHAGT -EEFPLAANVYAALPDFIINEDPYAIDTLMLYYTNPVFSSPDAPKYSQAFEKIPFIVSFSP -FLDDSSLFADLILPDHTYLERWHDDVIYPSLGYPVYAVRQPVIAPLYNTRNTGDLLIELA -HRLGGTVKESFPWKDFLELIQFRARGIYESGRGNIQANSFEEFWQQLLEVGFWTDPPYPF -GQWERVFKTPSKKFEFFSQKLAHTLEDLAKKKAEHEGIPEEEALDKILTRLKITARGDAA -FMPHYEEPRFVGDPKEYPLYLNTYKLMAHAEGRGANSPWLQEILGTHVGRRWETWVEINP -TTAQKLGITEGDWVWVESPLGKIKVRAKLHPGAKPDVVNIPFERGHRSYGRWAVGFGANP -NEVLAREYDYLGGDAAFFSTRVKVYKAQEGE - ->QrcB_Syntrophobacter_fumaroxidans_YP_844744 -MKVGRRAVLQFMAGAVGGTLLSPLPWKLTDDAAIWSQNWFWRPSPARGEITRKPTVCALCEGGCGVQARL -VDGKRAILLEGNPNHPVNQGGICALGAAGLQFLYAPYRIAQPLKQTKRRGDPTGFQPIAWNEAVGELAKK -LGQMRADGKPNGLAGITRRRCSSMDALLNQFFAAYGSPNLFKMPAHADSLKLAGAVTTGREAPFGCNIED -APYILSFGAGLVEGWGSPGRMQAAFRRWRQGGKSAAKIVQVDSRCSTTAAMADRWIAVPPGTEAALALGI -AHLMVKDKLYDAEFMADRVFGFEDWTDSQGKNHKGFKFLVQTDAYTPEAISKLTGVDPAKIRELAKEFGT -QKGAVAVWGQPQGSVPKDMYNELSFLALNALKGNIKAGGAIGLAPEVPLGALPELPGDPSALKGLKQLRL -DLASSQKGPPPVLPGNNLHGFLDAVSNGGKYPIEVMLVHEANPAYGLCENKLFQQALTKIGTLVSLSSYM -DETAQQADLILPIHTAFEGFDDVIGIPGAPYAYYGVCAPVLKPHLNTKAAGDIVMSVAKQLGGSIAAALP -WASHEEYLKKRAEGLAASARGALADKKGVELWKLQPEEAVKPNYKDGADLWKKLAGGACWYDAPVDPLKD -LKTESGKFELAAQLLLAKGQTGDDDQVYLPHFSQVPPRGSDKDYPLLLVTYQMSALADRDLANPPFMTKT -VFDFILRQNDQFVEINPATASELGMAEGDSAVLKTPQGEVPVRVHLYAGARPKVVYLAQGLGHKAYDEYI -KDKGVNANGVVEVQLDRVTGLGTVWAARAHLRRA - ->ArxA_Ectothiorhodospira_sp_PHS_1_ZP_09695308 -MKLLETLINRRRFLKATGAVAGAGVVAGGAGVVPGLTTLSHARSPAPSADTTITKNICHQCPARCGIDVY -TTGGRVHAIYGTSDHPISNGKLCPKGPLGAYILYDPDRFKGPMKRTNPNKGRDQDPGFVPISWNEALDMV -ADRLNGLREREESHRFALLYGRGWGASCAGLLGNFGKLYGSPNVAIGHSSMCSDGSIISKKAVDGIGGYN -SYDYKNANMLLMFGAGFLEAFRPYNNNMQVWGYIRGVKVPKTRITAVDVHMNTTLAGSDRALLIKPGTDG -ALALAIAHVILVDGLWEKAFVGDFSDGVNRFIPGETVDPDSFEEKWVKGLVEWWNAELKDRSPRWAAQVT -TLYERDILATAREFGTTRPAIALYERGAHAHSNGIFNGMAIHTLNALVGSLYAKGGLAYQVGPSYGPLPV -NADDYLDDWARTGGWKAQPRIDLKGHPDGYLLANNMMQEIGPNSLQGKPYKLDTIMFYLNNAIWTAPDVK -AWEEALKELFVIETSPFPSETAMFADVILPDHTYLERLQDAPTYPFQGWPMTQLRVPAVKPLYDTKYFGD -VLIELGKRIQGSMGEYYQALDNTENVIRHLAKGFESDPGDNGVNSFESWKEKGVWYKRVYPYRQIDGEFY -EWDGQDHTRLMSADEVRGALFKTASGKFEIRSGWLEAHADWIAAKTGRDPSRLMFPIWEEPSHPGGGDLY -MVTPKVALHAEGRGANLPVAIANMQPTLGGRNTIYIEINPKTARARGIPDGSRVRISSDLGAIEGYCKYY -EGVRPDTLVFPMEHGHWAHGRWAKGRKPGHSGEITVNQSDRITGQCSYYTTKVRIERA - ->ArrA_Wolinella_succinogenes_NP_906980 -MEINRRDFLKATALTAGAVGIAQIPEIEANTQVSGEVGKWVASTCQGCTSWCSIQGYVVDGRLVKVRGNPNAKGNHGKICPRPHLAIQQVYDPDRVKTPLKRTNPKKGKGIDPQFVPISWDEAIDTIADKIMALIKSGESHKFALFRGRYTHMNEILYNTFPKLIGSPNNISHSSICAEAEKFGRYYTEALWDYADFDLDNTRYVLGWGADPLASNRQVPHFINIWGKVRDQARIAIIDPRLSATAAKADHWLPIIPGEDSALAVAMAHVILAGGAWNKGYVGDFVDGHNYFKPGELVPESIEVEGKIIPVEFKEKHTYGVVKWWNLELFDKTPEWAEPITGIPAKQIRQVALEFAAAGSRAISWVSPGACMQIRGSYASMAAHALNGLVGSCDSVGGILQGTSVPSGKTPDIKPYLSEEIASALKQKKIDQRGTPKFPALNKKTGGGVVTANVANAILDEKPYDLKMAIGYWNNFVFSINGTHLWEKAMEKLPFYAHITTHMAEMTMYADIVLPAKMHMFERYGFSKNKQNLHGYLSIHQPMVKPLGEAKTDETEIVFMIAQALAKKGHDAPLRYYQENFKDPETGKIPSTPEEFDLFSVKYFTQPIWDGSSNDKGDSINSWKELLEKGVWSTKRYSIGKKIDNFKTETKKFEFYSETLKKVLEEHVEKNKLSSIDEAIEASNNTARGERVFVPHYEPSVRYGDPKIYPLIFAEHRSRLNREGRSQNAPWYYEHKDVDPGDEIEKDVAKINPETAKQFGIKTGDRIRIVGTQASIETEVKLWEGIRPGIVVKCYGQGHWAYGSVASEKFGSKPRGTNNNDIHIHEYDRLSGSTARHGGTARVKIEKI - ->ArrA_Bacillus_selenitireducens_gb_AAQ19491 -EQGEWIASVCQGCTAWCAVQVYRIDGRATKVRGNPNAKANHGHSCVRSHIGLQQVYDPDRVKQPMKRTNPNKGRDEDPEFVPISWEEAMDTIADKIIELRENNETHKFSVWRGRYTSNNGILYGNMPKIIGSPNNISHSSICAESEKFGRYYTERYWGYADYDHENALYEIFWGGDPIATNRXVPHTASIWGELSDRATLACVDPRFSTTAANQMNGCRLIPGEDGAIASAIAHVILTEGVWYKPFVGDFKDGQNRFVEGRDVNEDDFEEIQTHGLVKWWNLELKDKTPEWAAERSGIDADQIYRVARGFANAAPKAISFSSPGSSMTIRGGYTAMTQAALNGLVGSADNLGGVISNGISVPNNGFPDPSDYIDEIAANGLEQDRIDWGGRLEFPALKDSKSGGVKVTNTVADAVLAEDPYEFKSRIELLDELQFLQPRNGSLGQSFGQDSIHGAYDCQSGEQTHFADIVLPVPHSQFERQSPVAGSNGNLHRHLHLQNKVIESPFDIRVDETEIPWMIGESLEKKGYSNLIDYFRNEFRDPETGEAPTNAAEFDEIATKHYTHPVWDPTFEKDGDQIDGWEEYKRLGTWNTNKYEFRQKWDGNWGTETGQFEFYSETLKVALQDHADKHNASIDDVMEATFNTAKGELAFVPHYEPAMRVGDESEYPLIFMEHRSKLNREARSANTSWYQEFKDIDLGDEAWDDVAKLNPKDAAELGIQNGDMVRLVTPEGQIEVKAKLWEGTRPGVVAKCYGQGHWAYGHIASLDRRRQIARGGNNNIILAPVHEALSGSGARHGGQTRVRVEKV - ->ArrA_Chrysiogenes_arsenatis_gb_AAU11839 -MRIKRREFLKASAAVGAVAVASPTLNAFAQTGTGASAMGEAEGKWIPSTCQGCTTWCPVEFLFRMAVRSKYAATQLSKANNGYCCVRGHLMLQQLYDPDRIKTPMKRTNPVKGRKEDPKICPYHMGMKQWDTIADKIMELRKNNETHKYLLMRGRYSDHNSIFYGDLTKMIGSPNNISHSAICAEVEKMGSMATEGFWGYRDYDLDNMKYLIAWACDPLSSNRQIPNAIRKIQGVMDRGKVVAVDPRMNNTASKAQEWLPIKPSEDGALALAMAHVIITKGLWSKEFVGDFKDGKNKFVAGKTVKEEDFEEKLTNGIVKWWNLEVKDRTPKWAAKVTGIDEATIIRVATEFAQAAPACAIWYGPNMQPRGSYAVMCIHALNGLVGASDSEGGLCTGMGSPSSSYPKIDAYQDDVAKAGAKNKKIDQRGTLKFPAMGSAKPGTGVVTNNVADALLAADPYDIKVAIGYFCNFNFSGTDGARWDKALAKVPFFVHCVPMFSEMTYFADIVLPAALHHTEDWAVIRSKANLHGHTSIQQPVVERMFDVKGVETEITWLLAEKLKAKGFENMYNWLYNEYKDPETGKNPTNSLEFALYATKIRSKKCWDPKENAEYKGDKLNGWADFMEKGIVNSPKFKFRQKWEKGFPTETKKFEFYSETLKKGLLAHAEKNKVTVDQVMEATNYEARGELAFIPHYESPKRHGDVKEFPFSLIDMKSRLNREGRSTNATWYHAFKKCDPGDVNQEDVLQINPADAKKLGINEGDMVKVTSVIGSLTVKARLWEGVRPGCVAKCYGQGHFAMGRVSAKDFGKAVARGANFNDIMPADYDRITGATARNGGFTGVKIEKA - ->ArrA_Halarsenatibacter_silvermanii_gb_ACF74513 -MSRNKTSGISRREFLKVMGSTGAALGLGLSATSGNKVLAEEDPYEVLPEGEHKSGEWVPTGCAGCTSWCSLEANVVDGRVIKIRGNSRSKVNGESSCPRSHLSLQQVYDPDRIKRPMKRTNPEKGRDVDPEFVPISWEEAFEEIADKIIELRENGESHKFVLWRGRYTRLRDILYGILPEFVGSPNKISHSSICAEAEKFGPYYTEGYWAYRDYDLQNSDYILIWGTDPIQSNRQVSLYSREWGNILEGARIATVDPRFSRTAAKSNEWLPVKPGEDGALALAMAHVILTEGLWHKEFVGDFVDGENKFTAGEEVDEDEFEENYTHGVVKWWNEELKDRTPEWAADKTGIPAEQIVRVAAEFGEAAPHACVFMGGGGVMQTRGGYNSMAIHGLNGLVGSIDNEGGAVRGASVPNQSFPDHSEFLDDISREGLDHEMIDRRGRLEFPAFKDGESGGGVVTNLSADGIIEEDPYEIKMGIGYWNNFNFAAPETERWDEAMSKLDFYVHLVTHQSEMTQYADIVIPSTHHMFEQWGMLYQKGNLHTHFWLSRPMINRHWELIEPEAEFSWLLAEKLAEKGYSNMLDYFKTIVDPETGEEPEDYREFAKYATKHYMQPVWDPEMESHGDQFDGWEDFKEAGVWNSDEFEFQQYWGEFTNSTGDFEFYSETLKEALEEHAEKHDVSIEEVLEACKYEAEGELAFLPHYEEPYTVGDDEEYPLLLVDSKSALNREGRSANANWYYDLKDIDPGDSTEADVIKIHPRDAEELGLEDGDEVVVSSPAGEITCQLNVWEAVKPGTASKTFGMGHWAYGRVAAEDFADGEPRGGNNNEIIPAEYERLSGSTSFYSHIKVNIERA - ->ArrA_Sulfurospirillum_barnesii_gb_AAU11840 -TSWCPIQGLVVDGKVVKVRGNPNSPSMGRICPRPHLAIQQVYDPDRVKTPLKRTNPKKGKGIDPKFVPISWDEAINTIAEQILGLIKAGESHKFVLMRGRYTHMNEILYNTFPKLIGSPNNISHASICAKTEKFGRYYTEGFWDYADFDLTIPVIFWDGERDMVSSNRQIPWFMNQQGYVKDRAKITIIDPRLSATAAKADRWAPIIPGTDSALAVAIAHVILSEGRWNKSFVGDFQDGKNYFIPGSTVPTEVIVDEKSLPVVFEENHTYGVVAWWNLELKERTPEWAEKITGISAKDIRTIAREFSDAGSKAISWVTTGASMQIRGAYASLAAHALNGLVGSVDAVGGTLQGSXAPSGKTPDIKPYLPAEFEAALKQKKIDQRGTLKLGAFNKKTGGGVVTQQVADSILTDKPYDVKVAIGYWNNFVFSINGANVWEKAMEKLPFYAHITTHLAEMSMXADIVLPAKMHMFERYGFSKNKQNLQGYLTIHQPLVKSFADAKTDETEIPFLIAQALAKKGFDGPLRYFQDNFKDPESGKAPTNPRRVDLYAVKQFTXPIWSGESNEKGDTINSWNELLDKGVWKTKKYKIGKKVDNFATETKKFEFYSETLKKVLIEHAEKNKVTVDEALEALNYTCRGELGFVPHYEEAVRHGDEKTYPFIFAEHRSRLNREGRSQNAPWYYEIKDVDPGDVAGKDVTKINPLDGKKLGLKDGDKIKITSVQGSIESEVKLWEGTRPGT - ->Halorhodospira_halophila_YP_001001949 -MSVLDHLVSRRRFLQATGVGGGAVAAGGVGHLLSFSAGGSHARADGPVGGGETQITKNVCHQCPARCGID -VYTTDGRVHAIYGDPGNPIANGRLCPKGHLGSYILYDPDRFKGPMKRTNPNKGRDEDPQFEAISWDEALG -IVAERLNRLREQEESHRFALMYGRGWGASCAGLLGPFAKLYGTPNVIGHSSMCSDGSMVAKGLTDGNESY -NAYDYRNTNYILNFGAGFLEAFRPYNYLMQVWGHMRTKSPKTRVTAVDVHMNPTLAAADRAVTIKPATDG -AMALAIAHEMLVNGYWDRDFVGDFTDGANRFEAGTEIDPDDFEEVWTQGLIRWWNDELKDRTPEWAESIT -TVPAETIRRVAYEFGTTRPAMAIMERGPTSHSNGTYNGMAIHALNALAGTLFTEGGLFYQMDVPYGDGPA -DPDDYLDDYAGRMQERFDEGEIPRIDKLGTDRWPLARNMMQEVGPNHAAGEPYKLDTILFYLNNPIWTAP -DATAWEEALKDVFIIDTSPFPGETARYADLILPDHTYLERLQDAPTYPFEGYPMTALRTPAVEPLYDTKV -FGDILIEIGKRLDGPAGEYWQAVGDTENLLRHLAEGFRDHPGDNGVEDFESWKAKGVWYKKPYHWKQERG -VFYEWVEDDGDYTHEMSAEEVADKLMPTPSGRFEFFSEKLQEHADFVASEFGIDHERAGLIQWVDPDHPG -GGDLYFSTPKTALHAEGRGANIPHAIAHVQPVMGGRTTVYLEIHPRTARERGIRSGDRVRIVSDVGEIEA -YARLFEGTRPDTVCLPMEHGHWAQGRWAEGRKPGHSGEVTVNQSDRISGLASYYTTKVRVERA - ->Alkalilimnicola_ehrlichii_ABI55571 -MKMILDTLLNRRRFLKATGATGAAAATTAGVGKLAGFTAASTTSTHVNARPGGETRVTKNICHQCPARCG -INVYTTNGRVHAIYGDPGNPIANGKLCPKGHLGTQLLYDPDRFKGPMKRTNPNKGRDEDPEFVPISWDEA -FDIVAERLNRLRERGESHRFAHFYGRGWGSSDAGLYGDFGKLYGTPNSAIGHASMCAEGSKRAKRATDGN -DSYNSYDYRNTNYILNFGAGFLEAFRPYNYLMQVWGHMRTKSPKTRVTTIDVRMNPTMAASDRALMIKPG -TDGALALAIAHVILTEGLWDKEFVGDFEDGRNHFRTGETIIPDAFQANWTHGLAEWWNGELKDRTPEWAE -EITTIPAKHIYTVAREFATTRPAMAIMERGPTAHFNGTYNGMAVHALNALVGSMFAEGGLFYQMGPSYGP -LPVSADDYMDDYAREMQGKHPRIDMAGTEKWPMAGTMMQECAKHHLAGDPYKLDTAMFFVTNPIWTAPDP -RLWEEALKDVFIIDTSPYPGETAMYADIIMPEHTYLERLQDSPTYPFEGWPMAALRTPAVDPVYDTKHFG -DMIIEIGKRINSPMADYYRELGDVENMLRHRAAGFANDPGDNGVNDFESWKEKGVWYKKPYHWRYWRGTF -YEWDGEGYNIEMSEDEVKDKLMPTASGKFEFKSSFLENNANYIAREMGIAEDRVGLIQWVEPRHTGDGDL -HFVTPKTPLHAEGRSANIPQAQAYMQPIVGGRGTCYLEIHPKTAQERGINDGDTVRLSAQVRGETKSILA -VARYMPGHRPDTLVLPMEYGHWAQGRWATAQGRDMKPGHSGDLTENLSDPISGLACYYTAKVRLEKA \ No newline at end of file diff --git a/assets/trees/dmso/dmso.refpkg/dmso_refs.fasta.model b/assets/trees/dmso/dmso.refpkg/dmso_refs.fasta.model deleted file mode 100644 index a39f2545..00000000 --- a/assets/trees/dmso/dmso.refpkg/dmso_refs.fasta.model +++ /dev/null @@ -1,581 +0,0 @@ - - -ProtTest 3.2 Fast selection of the best-fit models of protein evolution -(c) 2009-2010 Diego Darriba (1,2), Guillermo Taboada (2), Ramón Doallo (2), David Posada (1) -(1) Facultad de Biologia, Universidad de Vigo, 36200 Vigo, Spain -(2) Facultade de Informática, Universidade da Coruña, 15071 A Coruña, Spain -Contact: ddarriba@udc.es, dposada@uvigo.es ----------------------------------------------------------------------------------------------- - -Thu Apr 25 13:41:55 MDT 2024 -OS = Linux (3.10.0-1160.88.1.el7.x86_64) - -Citation: Darriba D, Taboada GL, Doallo R, Posada D. ProtTest 3: fast selection of best-fit - models of protein evolution. Bioinformatics, 27:1164-1165, 2011 - - -ProtTest options ----------------- - Alignment file........... : dmso_refs.fasta.phy - Tree..................... : BioNJ - StrategyMode............. : Fixed BIONJ JTT - Candidate models......... : - Matrices............... : JTT LG DCMut MtREV MtMam MtArt Dayhoff WAG RtREV CpREV Blosum62 VT HIVb HIVw FLU - Distributions.......... : Uniform +G +I +I+G - Observed frequencies... : false - - Statistical framework - Sort models according to....: - BIC - Sample size.................: 871.0 (not calculated yet) - Other options: - Display best tree in ASCII..: false - Display best tree in Newick.: false - Display consensus tree......: false - Verbose.....................: false - -********************************************************** -Observed number of invariant sites: 2 -Observed aminoacid frequencies: - A: 0.098 C: 0.011 D: 0.055 E: 0.053 F: 0.033 - G: 0.091 H: 0.024 I: 0.052 K: 0.051 L: 0.078 - M: 0.023 N: 0.041 P: 0.059 Q: 0.032 R: 0.059 - S: 0.052 T: 0.054 V: 0.071 W: 0.025 Y: 0.037 - -********************************************************** - - - -Model................................ : JTT - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 77104.53 - (seconds)) - -Model................................ : JTT+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.004 - -lnL................................ = 77032.91 - (seconds)) - -Model................................ : JTT+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.767 - -lnL................................ = 75965.79 - (seconds)) - -Model................................ : JTT+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.916 - proportion of invariable sites... = 0.003 - -lnL................................ = 75938.30 - (seconds)) - -Model................................ : LG - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 76250.92 - (seconds)) - -Model................................ : LG+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.003 - -lnL................................ = 76186.27 - (seconds)) - -Model................................ : LG+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.812 - -lnL................................ = 75187.90 - (seconds)) - -Model................................ : LG+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.971 - proportion of invariable sites... = 0.003 - -lnL................................ = 75162.49 - (seconds)) - -Model................................ : DCMut - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 77745.30 - (seconds)) - -Model................................ : DCMut+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.004 - -lnL................................ = 77663.69 - (seconds)) - -Model................................ : DCMut+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.545 - -lnL................................ = 76472.93 - (seconds)) - -Model................................ : DCMut+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.719 - proportion of invariable sites... = 0.003 - -lnL................................ = 76442.91 - (seconds)) - -Model................................ : MtREV - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 81641.26 - (seconds)) - -Model................................ : MtREV+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.003 - -lnL................................ = 81620.49 - (seconds)) - -Model................................ : MtREV+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.151 - -lnL................................ = 79797.61 - (seconds)) - -Model................................ : MtREV+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.169 - proportion of invariable sites... = 0.002 - -lnL................................ = 79793.93 - (seconds)) - -Model................................ : MtMam - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 85263.49 - (seconds)) - -Model................................ : MtMam+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.005 - -lnL................................ = 85241.92 - (seconds)) - -Model................................ : MtMam+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 1.35 - -lnL................................ = 82190.94 - (seconds)) - -Model................................ : MtMam+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 1.351 - proportion of invariable sites... = 0.001 - -lnL................................ = 82190.85 - (seconds)) - -Model................................ : MtArt - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 83730.92 - (seconds)) - -Model................................ : MtArt+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.003 - -lnL................................ = 83711.55 - (seconds)) - -Model................................ : MtArt+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 1.408 - -lnL................................ = 80931.73 - (seconds)) - -Model................................ : MtArt+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 1.414 - proportion of invariable sites... = 0.001 - -lnL................................ = 80929.13 - (seconds)) - -Model................................ : Dayhoff - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 77755.96 - (seconds)) - -Model................................ : Dayhoff+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.004 - -lnL................................ = 77674.16 - (seconds)) - -Model................................ : Dayhoff+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.536 - -lnL................................ = 76479.03 - (seconds)) - -Model................................ : Dayhoff+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.709 - proportion of invariable sites... = 0.003 - -lnL................................ = 76448.96 - (seconds)) - -Model................................ : WAG - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 76009.19 - (seconds)) - -Model................................ : WAG+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.003 - -lnL................................ = 75929.91 - (seconds)) - -Model................................ : WAG+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 3.468 - -lnL................................ = 75177.79 - (seconds)) - -Model................................ : WAG+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 3.74 - proportion of invariable sites... = 0.003 - -lnL................................ = 75142.56 - (seconds)) - -Model................................ : RtREV - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 76648.25 - (seconds)) - -Model................................ : RtREV+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.003 - -lnL................................ = 76576.75 - (seconds)) - -Model................................ : RtREV+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 3.027 - -lnL................................ = 75659.47 - (seconds)) - -Model................................ : RtREV+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 3.245 - proportion of invariable sites... = 0.003 - -lnL................................ = 75630.40 - (seconds)) - -Model................................ : CpREV - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 77052.70 - (seconds)) - -Model................................ : CpREV+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.004 - -lnL................................ = 76973.87 - (seconds)) - -Model................................ : CpREV+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 3.08 - -lnL................................ = 76046.86 - (seconds)) - -Model................................ : CpREV+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 3.267 - proportion of invariable sites... = 0.003 - -lnL................................ = 76014.06 - (seconds)) - -Model................................ : Blosum62 - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 75915.50 - (seconds)) - -Model................................ : Blosum62+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.003 - -lnL................................ = 75849.78 - (seconds)) - -Model................................ : Blosum62+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 4.24 - -lnL................................ = 75230.55 - (seconds)) - -Model................................ : Blosum62+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 4.538 - proportion of invariable sites... = 0.003 - -lnL................................ = 75199.67 - (seconds)) - -Model................................ : VT - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 75962.73 - (seconds)) - -Model................................ : VT+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.003 - -lnL................................ = 75896.24 - (seconds)) - -Model................................ : VT+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 3.669 - -lnL................................ = 75166.63 - (seconds)) - -Model................................ : VT+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 3.909 - proportion of invariable sites... = 0.003 - -lnL................................ = 75137.60 - (seconds)) - -Model................................ : HIVb - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 79715.18 - (seconds)) - -Model................................ : HIVb+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.004 - -lnL................................ = 79632.32 - (seconds)) - -Model................................ : HIVb+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.407 - -lnL................................ = 78258.49 - (seconds)) - -Model................................ : HIVb+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.558 - proportion of invariable sites... = 0.003 - -lnL................................ = 78228.20 - (seconds)) - -Model................................ : HIVw - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 83544.07 - (seconds)) - -Model................................ : HIVw+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.005 - -lnL................................ = 83433.56 - (seconds)) - -Model................................ : HIVw+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.2 - -lnL................................ = 81960.13 - (seconds)) - -Model................................ : HIVw+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.373 - proportion of invariable sites... = 0.003 - -lnL................................ = 81919.21 - (seconds)) - -Model................................ : FLU - Number of parameters............... : 169 (0 + 169 branch length estimates) - -lnL................................ = 79156.27 - (seconds)) - -Model................................ : FLU+I - Number of parameters............... : 170 (1 + 169 branch length estimates) - proportion of invariable sites... = 0.004 - -lnL................................ = 79066.08 - (seconds)) - -Model................................ : FLU+G - Number of parameters............... : 170 (1 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.477 - -lnL................................ = 77863.83 - (seconds)) - -Model................................ : FLU+I+G - Number of parameters............... : 171 (2 + 169 branch length estimates) - gamma shape (4 rate categories).. = 2.635 - proportion of invariable sites... = 0.003 - -lnL................................ = 77828.33 - (seconds)) - -************************************************************ -Date : Thu Apr 25 17:59:51 MDT 2024 -Runtime: 4h:17:51 - - - -*************************************************************************** -Best model according to BIC: VT+I+G -Confidence Interval: 100.0 -*************************************************************************** -Model deltaBIC BIC BICw -lnL ---------------------------------------------------------------------------- -VT+I+G 0.00 151432.82 0.99 75137.60 -WAG+I+G 9.91 151442.73 0.01 75142.56 -LG+I+G 49.77 151482.59 0.00 75162.49 -VT+G 51.28 151484.10 0.00 75166.63 -WAG+G 73.60 151506.42 0.00 75177.79 -LG+G 93.82 151526.64 0.00 75187.90 -Blosum62+I+G 124.12 151556.94 0.00 75199.67 -Blosum62+G 179.11 151611.93 0.00 75230.55 -RtREV+I+G 985.58 152418.40 0.00 75630.40 -RtREV+G 1036.96 152469.78 0.00 75659.47 -Blosum62+I 1417.58 152850.40 0.00 75849.78 -VT+I 1510.51 152943.33 0.00 75896.24 -Blosum62 1542.26 152975.07 0.00 75915.50 -WAG+I 1577.84 153010.66 0.00 75929.91 -JTT+I+G 1601.38 153034.20 0.00 75938.30 -VT 1636.72 153069.53 0.00 75962.73 -JTT+G 1649.60 153082.42 0.00 75965.79 -WAG 1729.64 153162.45 0.00 76009.19 -CpREV+I+G 1752.92 153185.74 0.00 76014.06 -CpREV+G 1811.75 153244.56 0.00 76046.86 -LG+I 2090.56 153523.38 0.00 76186.27 -LG 2213.09 153645.91 0.00 76250.92 -DCMut+I+G 2610.62 154043.43 0.00 76442.91 -Dayhoff+I+G 2622.71 154055.53 0.00 76448.96 -DCMut+G 2663.88 154096.70 0.00 76472.93 -Dayhoff+G 2676.07 154108.89 0.00 76479.03 -RtREV+I 2871.53 154304.35 0.00 76576.75 -RtREV 3007.75 154440.57 0.00 76648.25 -CpREV+I 3665.77 155098.59 0.00 76973.87 -JTT+I 3783.85 155216.67 0.00 77032.91 -CpREV 3816.66 155249.48 0.00 77052.70 -JTT 3920.31 155353.13 0.00 77104.53 -DCMut+I 5045.40 156478.22 0.00 77663.69 -Dayhoff+I 5066.34 156499.15 0.00 77674.16 -DCMut 5201.86 156634.68 0.00 77745.30 -Dayhoff 5223.18 156655.99 0.00 77755.96 -FLU+I+G 5381.44 156814.26 0.00 77828.33 -FLU+G 5445.67 156878.49 0.00 77863.83 -HIVb+I+G 6181.20 157614.02 0.00 78228.20 -HIVb+G 6235.01 157667.82 0.00 78258.49 -FLU+I 7850.18 159283.00 0.00 79066.08 -FLU 8023.79 159456.61 0.00 79156.27 -HIVb+I 8982.66 160415.48 0.00 79632.32 -HIVb 9141.61 160574.43 0.00 79715.18 -MtREV+I+G 9312.65 160745.47 0.00 79793.93 -MtREV+G 9313.23 160746.05 0.00 79797.61 -MtArt+G 11581.48 163014.30 0.00 80931.73 -MtArt+I+G 11583.06 163015.87 0.00 80929.13 -MtREV+I 12958.99 164391.81 0.00 81620.49 -MtREV 12993.76 164426.58 0.00 81641.26 -HIVw+I+G 13563.22 164996.03 0.00 81919.21 -HIVw+G 13638.29 165071.10 0.00 81960.13 -MtMam+G 14099.91 165532.73 0.00 82190.94 -MtMam+I+G 14106.49 165539.31 0.00 82190.85 -HIVw+I 16585.14 168017.96 0.00 83433.56 -HIVw 16799.38 168232.20 0.00 83544.07 -MtArt+I 17141.12 168573.94 0.00 83711.55 -MtArt 17173.09 168605.91 0.00 83730.92 -MtMam+I 20201.87 171634.68 0.00 85241.92 -MtMam 20238.23 171671.04 0.00 85263.49 ---------------------------------------------------------------------------- ---------------------------------------------------------------------------- -*********************************************** -Relative importance of parameters -*********************************************** - alpha (+G): 0.000 - p-inv (+I): 0.000 - alpha+p-inv (+I+G): 1.000 - freqs (+F): No +F models - -*********************************************** -Model-averaged estimate of parameters -*********************************************** - alpha (+G): 3.669 - p-inv (+I): NaN - alpha (+I+G): 3.908 - p-inv (+I+G): 0.003 - -*************************************************************************** -Best model according to LnL: VT+I+G -Confidence Interval: 100.0 -*************************************************************************** -Model deltaLnL LnL LnLw -lnL ---------------------------------------------------------------------------- -VT+I+G 0.00 75137.60 0.92 75137.60 -WAG+I+G 4.96 75142.56 0.08 75142.56 -LG+I+G 24.89 75162.49 0.00 75162.49 -VT+G 29.02 75166.63 0.00 75166.63 -WAG+G 40.18 75177.79 0.00 75177.79 -LG+G 50.30 75187.90 0.00 75187.90 -Blosum62+I+G 62.06 75199.67 0.00 75199.67 -Blosum62+G 92.94 75230.55 0.00 75230.55 -RtREV+I+G 492.79 75630.40 0.00 75630.40 -RtREV+G 521.86 75659.47 0.00 75659.47 -Blosum62+I 712.17 75849.78 0.00 75849.78 -VT+I 758.64 75896.24 0.00 75896.24 -Blosum62 777.90 75915.50 0.00 75915.50 -WAG+I 792.30 75929.91 0.00 75929.91 -JTT+I+G 800.69 75938.30 0.00 75938.30 -VT 825.13 75962.73 0.00 75962.73 -JTT+G 828.18 75965.79 0.00 75965.79 -WAG 871.59 76009.19 0.00 76009.19 -CpREV+I+G 876.46 76014.06 0.00 76014.06 -CpREV+G 909.26 76046.86 0.00 76046.86 -LG+I 1048.67 76186.27 0.00 76186.27 -LG 1113.32 76250.92 0.00 76250.92 -DCMut+I+G 1305.31 76442.91 0.00 76442.91 -Dayhoff+I+G 1311.35 76448.96 0.00 76448.96 -DCMut+G 1335.33 76472.93 0.00 76472.93 -Dayhoff+G 1341.42 76479.03 0.00 76479.03 -RtREV+I 1439.15 76576.75 0.00 76576.75 -RtREV 1510.64 76648.25 0.00 76648.25 -CpREV+I 1836.27 76973.87 0.00 76973.87 -JTT+I 1895.31 77032.91 0.00 77032.91 -CpREV 1915.10 77052.70 0.00 77052.70 -JTT 1966.93 77104.53 0.00 77104.53 -DCMut+I 2526.09 77663.69 0.00 77663.69 -Dayhoff+I 2536.55 77674.16 0.00 77674.16 -DCMut 2607.70 77745.30 0.00 77745.30 -Dayhoff 2618.36 77755.96 0.00 77755.96 -FLU+I+G 2690.72 77828.33 0.00 77828.33 -FLU+G 2726.22 77863.83 0.00 77863.83 -HIVb+I+G 3090.60 78228.20 0.00 78228.20 -HIVb+G 3120.89 78258.49 0.00 78258.49 -FLU+I 3928.48 79066.08 0.00 79066.08 -FLU 4018.67 79156.27 0.00 79156.27 -HIVb+I 4494.71 79632.32 0.00 79632.32 -HIVb 4577.57 79715.18 0.00 79715.18 -MtREV+I+G 4656.32 79793.93 0.00 79793.93 -MtREV+G 4660.00 79797.61 0.00 79797.61 -MtArt+I+G 5791.53 80929.13 0.00 80929.13 -MtArt+G 5794.12 80931.73 0.00 80931.73 -MtREV+I 6482.88 81620.49 0.00 81620.49 -MtREV 6503.65 81641.26 0.00 81641.26 -HIVw+I+G 6781.61 81919.21 0.00 81919.21 -HIVw+G 6822.53 81960.13 0.00 81960.13 -MtMam+I+G 7053.25 82190.85 0.00 82190.85 -MtMam+G 7053.34 82190.94 0.00 82190.94 -HIVw+I 8295.95 83433.56 0.00 83433.56 -HIVw 8406.46 83544.07 0.00 83544.07 -MtArt+I 8573.95 83711.55 0.00 83711.55 -MtArt 8593.32 83730.92 0.00 83730.92 -MtMam+I 10104.32 85241.92 0.00 85241.92 -MtMam 10125.88 85263.49 0.00 85263.49 ---------------------------------------------------------------------------- ---------------------------------------------------------------------------- -*********************************************** -Relative importance of parameters -*********************************************** - alpha (+G): 0.000 - p-inv (+I): 0.000 - alpha+p-inv (+I+G): 1.000 - freqs (+F): No +F models - -*********************************************** -Model-averaged estimate of parameters -*********************************************** - alpha (+G): 3.668 - p-inv (+I): 0.003 - alpha (+I+G): 3.896 - p-inv (+I+G): 0.003 diff --git a/assets/trees/dmso/dmso.refpkg/dmso_search_terms.txt b/assets/trees/dmso/dmso.refpkg/dmso_search_terms.txt deleted file mode 100644 index 47ec8bde..00000000 --- a/assets/trees/dmso/dmso.refpkg/dmso_search_terms.txt +++ /dev/null @@ -1,12 +0,0 @@ -K00370 -K00371 -K00374 -nitrate reductase -nar -NAR -narG -narH -narI -narJ -EC: 1.7.99.4 -EC: 1.7.5.1 diff --git a/assets/trees/nar_nxr/nar_nxr-tree-mapping.tsv b/assets/trees/nar_nxr/nar_nxr-tree-mapping.tsv deleted file mode 100644 index d7836d63..00000000 --- a/assets/trees/nar_nxr/nar_nxr-tree-mapping.tsv +++ /dev/null @@ -1,76 +0,0 @@ -gene call -sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_397025_1 other-None -riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.130_k121_990031_60 other-None -providencecreek_2019_sw_WHONDRS-S19S_0007_B_bin.10_k121_1581149_4 other-None -NASQAN2015_111_B_bin.76_k121_226837_116 other-None -NASQAN2014_190_B_bin.96_k121_3766_2 other-None -muddycreek_2019_sw_WHONDRS-S19S_0082_B_bin.95_k121_853774_5 other-None -icacos_2019_sw_WHONDRS-S19S_0094_F_bin.26_scaffold_99_5 other-None -icacos_2019_sw_WHONDRS-S19S_0094_B_bin.166_k121_1114214_14 other-None -greatmiami_2019_sw_WHONDRS-S19S_0099_F_bin.30_scaffold_496_3 other-None -flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_1443778_1 other-None -flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0000472_14 other-None -flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_3 other-None -flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_4 other-None -flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001772_1 other-None -sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_391728_1 nxr-None -riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.137_k121_1578656_32 nxr-Nitrifier -riogrande_2019_sw_WHONDRS-S19S_0066_A_bin.62_Ga0451725_0007910_5 nxr-Nitrifier -flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_237162_4 nxr-Nitrifier -blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1348658_11 nxr-Nitrifier -blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1581374_9 nxr-Nitrifier -NASQAN2011_330_B_bin.17_k121_430440_3 nxr/nar-N utilization -gunnisonriver_2019_sw_WHONDRS-S19S_0062_A_bin.22_Ga0451722_0001801_3 nxr/nar-N utilization -flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001351_7 nxr/nar-N utilization -Yukon_2004-1_F_bin.10_scaffold_25058_1 narG-N reducer -Yukon_2004-1_F_bin.10_scaffold_678_1 narG-N reducer -yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_2728883_1 narG-N reducer -yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_3072591_1 narG-N reducer -whiteclaycreek2_2019_sw_WHONDRS-S19S_0038_B_bin.50_k121_1710496_1 narG-N reducer -watershed3_2019_sw_WHONDRS-S19S_0084_F_bin.6_scaffold_35_30 narG-N reducer -watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_1345490_1 narG-N reducer -watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_924190_1 narG-N reducer -watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.45_k121_975195_1 narG-N reducer -watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.15_k121_1272084_2 narG-N reducer -watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0000093_1 narG-N reducer -watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0001905_7 narG-N reducer -nebranchanacostia_2019_sw_WHONDRS-S19S_0081_B_bin.6_k121_1546998_5 narG-N reducer -NASQAN2016_164_F_bin.17_scaffold_1152_1 narG-N reducer -NASQAN2016_164_F_bin.17_scaffold_8891_2 narG-N reducer -NASQAN2015_227_F_bin.21_scaffold_2406_1 narG-N reducer -NASQAN2015_227_F_bin.21_scaffold_4919_3 narG-N reducer -NASQAN2015_227_B_bin.17_k121_559871_7 narG-N reducer -NASQAN2015_172_B_bin.54_k121_327740_1 narG-N reducer -NASQAN2015_010_A_bin.16_Ga0466474_000034_25 narG-N reducer -NASQAN2011_286_F_bin.29_scaffold_54_27 narG-N reducer -NASQAN2011_286_B_bin.1_k121_764018_13 narG-N reducer -NASQAN2011_265_B_bin.52_k121_465271_4 narG-N reducer -NASQAN2011_265_B_bin.52_k121_959771_6 narG-N reducer -NASQAN2011_028_B_bin.24_k121_53788_5 narG-N reducer -logan1_2019_sw_WHONDRS-S19S_0097_B_bin.20_k121_1372227_2 narG-N reducer -littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_6 narG-N reducer -littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_7 narG-N reducer -lewisrun_2019_sw_WHONDRS-S19S_0014_F_bin.22_scaffold_791_5 narG-N reducer -lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.6_k121_1211148_1 narG-N reducer -lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.30_k121_510322_1 narG-N reducer -lecontecreek_2019_sw_WHONDRS-S19S_0018_F_bin.2_scaffold_1_206 narG-N reducer -lecontecreek_2019_sw_WHONDRS-S19S_0018_A_bin.2_Ga0451754_0000231_3 narG-N reducer -king_2019_sw_WHONDRS-S19S_0016_B_bin.5_k121_1281127_1 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.3_scaffold_11088_2 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.19_scaffold_731_2 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_201_6 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4056_4 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4528_3 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_3271_6 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_493_9 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.12_scaffold_10959_2 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.10_scaffold_7566_1 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.46_k121_495423_17 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_1186915_16 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_2341297_11 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0000931_1 narG-N reducer -flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0004490_1 narG-N reducer -eastforkpoplarcreek_2019_sw_WHONDRS-S19S_0039_B_bin.13_k121_238651_23 narG-N reducer -cobbmillcreek_2019_sw_WHONDRS-S19S_0090_B_bin.15_k121_168873_1 narG-N reducer -cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.23_Ga0451756_0000618_5 narG-N reducer -cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.17_Ga0451756_0000169_17 narG-N reducer diff --git a/assets/trees/nar_nxr/nar_nxr.refpkg/CONTENTS.json b/assets/trees/nar_nxr/nar_nxr.refpkg/CONTENTS.json deleted file mode 100644 index 5050a094..00000000 --- a/assets/trees/nar_nxr/nar_nxr.refpkg/CONTENTS.json +++ /dev/null @@ -1,25 +0,0 @@ -{ - "files": { - "aln_fasta": "nar_nxr_seqs_for_tree_aligned.faa", - "phylo_model": "phylo_modelNQB2rG.json", - "tree": "nar_nxr.tre", - "tree_stats": "RAxML_info.nxr_nar_raxml" - }, - "rollback": null, - "log": [ - "Stripped refpkg (removed 0 files)", - "Loaded initial files into empty refpkg" - ], - "metadata": { - "create_date": "2022-08-01 19:38:05", - "format_version": "1.1", - "locus": "16s_rRNA" - }, - "rollforward": null, - "md5": { - "aln_fasta": "e8299c2a452284b846fbe1954d731e61", - "phylo_model": "8ddf52f289613477eb526cf7accab5f0", - "tree": "21dd28b872d3f481dee55388c088ebc0", - "tree_stats": "0dd942d28693dd101dbc1c19e8e95c30" - } -} diff --git a/assets/trees/nar_nxr/nar_nxr.refpkg/RAxML_info.nar_nxr_raxml b/assets/trees/nar_nxr/nar_nxr.refpkg/RAxML_info.nar_nxr_raxml deleted file mode 100644 index 00d9db3d..00000000 --- a/assets/trees/nar_nxr/nar_nxr.refpkg/RAxML_info.nar_nxr_raxml +++ /dev/null @@ -1,95 +0,0 @@ - - -IMPORTANT WARNING: Sequences g_8 and g_9 are exactly identical - - -IMPORTANT WARNING: Sequences g_11 and g_12 are exactly identical - - -IMPORTANT WARNING: Sequences g_13 and g_14 are exactly identical - - -IMPORTANT WARNING: Sequences g_40 and g_41 are exactly identical - - -IMPORTANT WARNING: Sequences g_43 and g_44 are exactly identical - - -IMPORTANT WARNING: Sequences g_60 and g_61 are exactly identical - - -IMPORTANT WARNING: Sequences g_76 and g_77 are exactly identical - - -IMPORTANT WARNING: Sequences g_82 and g_83 are exactly identical - -IMPORTANT WARNING -Found 8 sequences that are exactly identical to other sequences in the alignment. -Normally they should be excluded from the analysis. - -An alignment file with sequence duplicates removed has already -been printed to file /home/projects-wrighton-2/GROWdb/USAfocus_FinalBins110121/dereplicated_bin_analyses/metabolism/nxr_nar//nxr-nar_seqs_for_tree_aligned.faa.phy.reduced - - -This is RAxML version 7.7.2 released by Alexandros Stamatakis on July 31 2013. - -With greatly appreciated code contributions by: -Andre Aberer (HITS) -Simon Berger (HITS) -Nick Pattengale (Sandia) -Wayne Pfeiffer (SDSC) -Akifumi S. Tanabe (NRIFS) - - -Alignment has 1565 distinct alignment patterns - -Proportion of gaps and completely undetermined characters in this alignment: 40.94% - -RAxML rapid hill-climbing mode - -Using 1 distinct models/data partitions with joint branch length optimization - - -Executing 1 inferences on the original alignment using 1 distinct randomized MP trees - -All free model parameters will be estimated by RAxML -GAMMA model of rate heteorgeneity, ML estimate of alpha-parameter - -GAMMA Model parameters will be estimated up to an accuracy of 0.1000000000 Log Likelihood units - -Partition: 0 -Alignment Patterns: 1565 -Name: No Name Provided -DataType: AA -Substitution Matrix: WAG -Using empirical base frequencies - - - - -RAxML was called as follows: - -raxmlHPC -m PROTGAMMAWAGF -n nxr_nar_raxml -s /home/projects-wrighton-2/GROWdb/USAfocus_FinalBins110121/dereplicated_bin_analyses/metabolism/nxr_nar//nxr-nar_seqs_for_tree_aligned.faa.phy -p 11 - - -Partition: 0 with name: No Name Provided -Base frequencies: 0.073 0.060 0.047 0.065 0.011 0.031 0.053 0.083 0.031 0.048 0.064 0.059 0.031 0.036 0.057 0.050 0.060 0.030 0.049 0.063 - -Inference[0]: Time 7855.233752 GAMMA-based likelihood -104967.862139, best rearrangement setting 5 -alpha[0]: 1.530755 - - -Conducting final model optimizations on all 1 trees under GAMMA-based models .... - -Inference[0] final GAMMA-based Likelihood: -104967.862114 tree written to file /home/projects-wrighton-2/DRAM/scratch_space_flynn/jul_27_22_trees/second_try/RAxML_result.nxr_nar_raxml - - -Starting final GAMMA-based thorough Optimization on tree 0 likelihood -104967.862114 .... - -Final GAMMA-based Score of best tree -104967.862114 - -Program execution info written to /home/projects-wrighton-2/DRAM/scratch_space_flynn/jul_27_22_trees/second_try/RAxML_info.nxr_nar_raxml -Best-scoring ML tree written to: /home/projects-wrighton-2/DRAM/scratch_space_flynn/jul_27_22_trees/second_try/RAxML_bestTree.nxr_nar_raxml - -Overall execution time: 11244.438291 secs or 3.123455 hours or 0.130144 days - diff --git a/assets/trees/nar_nxr/nar_nxr.refpkg/nar_nxr.tre b/assets/trees/nar_nxr/nar_nxr.refpkg/nar_nxr.tre deleted file mode 100644 index 72500eef..00000000 --- a/assets/trees/nar_nxr/nar_nxr.refpkg/nar_nxr.tre +++ /dev/null @@ -1 +0,0 @@ -(OOP57237|Brocadia_caroliniensis:0.010806074,(RIK02127|Brocadia_sp:0.000910858,(KKO18748|Brocadia_fulgida:0.000000005,OQZ00558|Brocadia_sp_UTAMX2:0.000914005)0.781:0.000917034)0.992:0.013579216,(WP_052562588|Brocadia_sinica:0.009341785,(OHB44699|Planctomycetes_bacterium_GWE2_41_14:0.028539476,((WP_070066136|Brocadia_sapporoensis:0.005501886,RZV59451|Brocadia_sp_BROELEC01:0.002673850)1.000:0.025826757,((((OHB72803|Planctomycetes_bacterium_RBG_16_41_13:0.009726587,(WP_099324707|Kuenenia_stuttgartiensis:0.000917459,NxrA_Candidatus_K_stuttgartiensis_CAJ72445:0.000000005)0.998:0.017229244)1.000:0.098072241,((((RBG1_10:0.249943905,((GCA_001803565_00046|MHDQ01000004unannotatedprotein:0.399259377,((BBJ23760|Nitrotoga_sp_AM1:0.0,BBJ23368|Nitrotoga_sp_AM1:0.0):0.003761140,((RFC31618|Nitrotoga_sp_SPKER:0.006020303,((SPS06998|Nitrotoga_fabula:0.0,SPS06751|Nitrotoga_fabula:0.0):0.042255811,(RFC37636|Nitrotoga_sp_CP45:0.000000005,(RFC33776|Nitrotoga_sp_LAW:0.000000005,RFC30723|Nitrotoga_sp_MKT:0.001768416)0.953:0.002651540)0.916:0.006621566)0.695:0.008594937)0.950:0.008908972,BBJ23476|Nitrotoga_sp_AM1:0.013693167)0.440:0.001391552)1.000:0.666812638)1.000:0.321755680,((((greatmiami_2019_sw_WHONDRS-S19S_0099_F_bin.30_scaffold_496_3:0.011379394,(NASQAN2014_190_B_bin.96_k121_3766_2:0.017081478,(NASQAN2015_111_B_bin.76_k121_226837_116:0.021392246,icacos_2019_sw_WHONDRS-S19S_0094_F_bin.26_scaffold_99_5:0.002525334)0.985:0.013886431)0.102:0.014633186)1.000:1.045689577,((flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0000472_14:0.290495020,flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001772_1:0.289900857)1.000:0.977544665,(flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_3:0.182186058,flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_4:0.220237367)1.000:0.733397499)0.485:0.198655286)0.560:0.125080923,(flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_1443778_1:0.429037937,(sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_397025_1:0.433198646,((NASQAN2011_330_B_bin.17_k121_430440_3:0.641466723,(flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001351_7:0.393884505,(gunnisonriver_2019_sw_WHONDRS-S19S_0062_A_bin.22_Ga0451722_0001801_3:0.324547720,((watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_924190_1:0.157095605,((whiteclaycreek2_2019_sw_WHONDRS-S19S_0038_B_bin.50_k121_1710496_1:0.167523285,(NASQAN2011_265_B_bin.52_k121_959771_6:0.026017376,NASQAN2011_265_B_bin.52_k121_465271_4:0.000000008)0.818:0.115349202)1.000:0.087988271,(logan1_2019_sw_WHONDRS-S19S_0097_B_bin.20_k121_1372227_2:0.159911107,(lewisrun_2019_sw_WHONDRS-S19S_0014_F_bin.22_scaffold_791_5:0.020931878,(watershed3_2019_sw_WHONDRS-S19S_0084_F_bin.6_scaffold_35_30:0.032515342,lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.6_k121_1211148_1:0.071100891)0.951:0.024998611)0.985:0.042982912)1.000:0.086501401)0.986:0.042923050)1.000:0.086203118,(((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_3271_6:0.320376687,(flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_493_9:0.147904578,(nebranchanacostia_2019_sw_WHONDRS-S19S_0081_B_bin.6_k121_1546998_5:0.099435688,lecontecreek_2019_sw_WHONDRS-S19S_0018_A_bin.2_Ga0451754_0000231_3:0.013429712)1.000:0.121234242)0.749:0.040234813)0.863:0.055442056,((king_2019_sw_WHONDRS-S19S_0016_B_bin.5_k121_1281127_1:0.156531059,NASQAN2015_010_A_bin.16_Ga0466474_000034_25:0.177178519)0.992:0.044604086,((((NarG_Escherichia_coli_NP_415742:0.203008887,NarG_Halomonas_maura_gb_AAT47523:0.153894902)0.981:0.047232779,watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0000093_1:0.311887965)0.998:0.063567006,((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_201_6:0.106781950,(NASQAN2011_286_B_bin.1_k121_764018_13:0.005660724,NASQAN2011_286_F_bin.29_scaffold_54_27:0.000000005)1.000:0.123919793)1.000:0.131403606,(NarG_Pseudomonas_stutzeri_gb_AAZ43099:0.046987015,(NarG_Pseudomonas_fluorescens_gb_AEV63780:0.078508524,(flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_1186915_16:0.074914222,flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_2341297_11:0.000000008)0.885:0.078978122)0.708:0.032866426)1.000:0.168519259)0.242:0.019184033)0.998:0.047390479,(flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0000931_1:0.199222465,((littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_6:0.090260755,(littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_7:0.175888927,watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.15_k121_1272084_2:0.078834694)0.544:0.015106087)0.765:0.040298684,flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0004490_1:0.189261863)0.493:0.037097247)1.000:0.139855980)0.732:0.020426298)0.995:0.035229012)0.458:0.027215325,((((((NASQAN2015_172_B_bin.54_k121_327740_1:0.048321373,((cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.17_Ga0451756_0000169_17:0.003316375,Yukon_2004-1_F_bin.10_scaffold_678_1:0.110287220)0.999:0.034293344,(cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.23_Ga0451756_0000618_5:0.010147982,(NASQAN2015_227_F_bin.21_scaffold_4919_3:0.024300445,NASQAN2011_028_B_bin.24_k121_53788_5:0.000000005)0.990:0.014294289)0.365:0.007073108)0.988:0.017900532)0.950:0.016382079,(watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.45_k121_975195_1:0.104162330,flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.10_scaffold_7566_1:0.054766712)0.871:0.041502925)1.000:0.076566993,((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4056_4:0.104610952,((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.19_scaffold_731_2:0.070583667,eastforkpoplarcreek_2019_sw_WHONDRS-S19S_0039_B_bin.13_k121_238651_23:0.043655384)1.000:0.048776638,((yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_2728883_1:0.089459252,cobbmillcreek_2019_sw_WHONDRS-S19S_0090_B_bin.15_k121_168873_1:0.023635532)0.326:0.001148673,lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.30_k121_510322_1:0.090302159)0.885:0.013388066)0.878:0.032405321)0.565:0.021969185,((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.12_scaffold_10959_2:0.152164297,(NASQAN2016_164_F_bin.17_scaffold_1152_1:0.081072836,NASQAN2015_227_F_bin.21_scaffold_2406_1:0.055593684)0.976:0.109893377)0.649:0.067627453,flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.3_scaffold_11088_2:0.064995222)0.815:0.039464533)0.963:0.029952893)0.148:0.015135463,flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.46_k121_495423_17:0.129369944)0.861:0.019065424,(((watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_1345490_1:0.392541235,yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_3072591_1:0.171599398)0.840:0.248083204,((Yukon_2004-1_F_bin.10_scaffold_25058_1:0.105822798,NASQAN2016_164_F_bin.17_scaffold_8891_2:0.030238438)0.312:0.015380827,NASQAN2015_227_B_bin.17_k121_559871_7:0.039959075)0.928:0.056585084)0.234:0.007394197,(watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0001905_7:0.604640728,flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4528_3:0.181397923)0.845:0.147304633)0.903:0.041551231)0.908:0.028658570,lecontecreek_2019_sw_WHONDRS-S19S_0018_F_bin.2_scaffold_1_206:0.136445862)1.000:0.145006781)0.508:0.034596552)0.999:0.098317003)0.563:0.079911427)0.999:0.168588838)0.985:0.135263217,(CRI68048|Thiocapsa_sp_KS1:1.094261762,(flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_237162_4:0.488541056,(sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_391728_1:0.401066831,((GCA_003453735_00577|DMNE01000186unannotatedprotein:0.309801231,(((AFN37208|Nitrolancea_hollandica_Lb:0.039042664,AFN37205|Nitrolancea_hollandica_Lb:0.011623567)0.981:0.018883572,(AFN37207|Nitrolancea_hollandica_Lb:0.059889634,AFN37206|Nitrolancea_hollandica_Lb:0.035086850)0.741:0.017421853)1.000:0.237080104,((WP_005004540|Nitrococcus_mobilis:0.005243894,Nitrococcus_mobi_EAR23355:0.002640284)1.000:0.244172179,((WP_011314088|Nitrobacter_winogradskyi:0.002534990,(Nitrobacter_sp_Nb_311A_ZP_01048070:0.009400785,(A_Nitrobacter_hamburgensis_YP_578638:0.031550923,B_Nitrobacter_hamburgensis_YP_578186:0.023740548)1.000:0.053836401)0.978:0.022733577)0.963:0.016265428,Nitrobacter_winogradskyi_gb_ABA05326:0.037260949)1.000:0.216806507)0.880:0.055888930)1.000:0.201356108)0.974:0.063994885,(blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1348658_11:0.000000005,blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1581374_9:0.000000005)1.000:0.282418622)0.992:0.095642727)0.132:0.041822075)0.986:0.188699247)0.017:0.049701189)0.871:0.184584331)0.173:0.116759705)1.000:0.987285179)0.550:0.236304701,(providencecreek_2019_sw_WHONDRS-S19S_0007_B_bin.10_k121_1581149_4:0.472026440,(riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.130_k121_990031_60:0.325258151,(icacos_2019_sw_WHONDRS-S19S_0094_B_bin.166_k121_1114214_14:0.332187014,muddycreek_2019_sw_WHONDRS-S19S_0082_B_bin.95_k121_853774_5:0.705095308)0.418:0.106182937)0.994:0.312896913)1.000:0.774651657)1.000:0.778950754)0.975:0.154198707)1.000:0.231811834,((((cas150m_01921|CAS-150m-3753Perchloratereductasesubunitalphaprecursor:0.000877951,cas50m_02313|CAS-50m-4275Perchloratereductasesubunitalphaprecursor:0.000943888)1.000:0.055806636,(GCA_003523945_00056|DOFS01000023unannotatedprotein:0.004579427,DJ_nxrA:0.006504779)0.999:0.028051194)0.999:0.046515340,(DJ_nxrA2:0.074233359,DJ_nxrA1:0.060036576)0.694:0.026270877)0.990:0.045759227,(((((WP_053378142|Nitrospira_moscoviensis:0.008325164,(riogrande_2019_sw_WHONDRS-S19S_0066_A_bin.62_Ga0451725_0007910_5:0.012480447,GCA_002083555_01644|MSXN01000007unannotatedprotein:0.002680030)0.924:0.008235322)0.880:0.003077004,(((GCA_002420115_02525|DIHK01000043unannotatedprotein:0.012092376,GCA_002483475_03556|DLHZ01000062unannotatedprotein:0.002691200)1.000:0.023236403,(GCA_900078535_00262|FJVM02000053unannotatedprotein:0.014982211,(GCA_001458695_00808|LN885086unannotatedprotein:0.023036213,GCA_002451055_00821|DKBD01000269unannotatedprotein:0.007573759)0.688:0.003976613)0.390:0.001522946)0.694:0.004052451,GCA_002331335_02310|DCZO01000011unannotatedprotein:0.017101140)0.922:0.006393889)0.980:0.016473529,(riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.137_k121_1578656_32:0.002308752,GCA_002737345_00863|NSIK01000010unannotatedprotein:0.006832549)1.000:0.023034521)0.393:0.016407361,WP_080886776|Nitrospira_japonica:0.032980329)1.000:0.048957408,(((Baikal-deep-G159_00763|Baikal-deep-G159-c12unannotatedprotein:0.0,Baikal-deep-G158_01775|Baikal-deep-G158-c18unannotatedprotein:0.0):0.048648714,((CBK42946|Nitrospira_defluvii:0.0,NxrA2_Nitrospira_defluvii_YP_003798871:0.0):0.003132849,GCA_900170025_02937|FWEX01000006unannotatedprotein:0.002326236)1.000:0.046043049)0.987:0.028241355,((CUS31266|Nitrospira_nitrosa:0.032070423,CUS38776|Nitrospira_nitrificans:0.014206130)1.000:0.059565512,(GCA_001567445_02228|JZQY01000048unannotatedprotein:0.031898730,((CBK42928|Nitrospira_defluvii:0.0,NxrA1_Nitrospira_defluvii_YP_003798853:0.0):0.020188049,GCA_003456605_00391|DMQK01000091unannotatedprotein:0.020042828)0.973:0.029005902)1.000:0.049275974)0.916:0.026734542)0.987:0.030138243)0.163:0.019579673)1.000:0.351067665)0.984:0.079553236,((OGW90704|PVC_group_Omnitrophica_bacterium_RIFCSPHIGHO2_02_FULL_63_14:0.144751486,OGW87506|PVC_group_Omnitrophica_bacterium_RIFCSPLOWO2_01_FULL_45_10b:0.164104591)0.967:0.106906909,(((OUC07869|Chloroflexi_Litorilinea_aerophila:0.108541565,RCK74665|Chloroflexi_Anaerolineae_bacterium:0.109258954)1.000:0.169950317,(KRT77589|Armatimonadetes_bacterium_CSP1_3:0.210493116,KRT68888|NC10_bacterium_CSP1_5:0.135568128)0.411:0.038266264)0.915:0.031759119,(GBC85351|bacterium_sp_HR11:0.152552869,(GCA_002328125_01442|DCWK01000050unannotatedprotein:0.001947491,GCA_002685755_01556|NYYB01000002unannotatedprotein:0.001760896)1.000:0.300590274)1.000:0.072067691)0.853:0.038248286)0.986:0.048595639)0.582:0.046460101,((MSP_nxrA:0.025354205,(((MBL09191|Acidiferrobacteraceae_bacterium:0.033838550,TDJ60388|Nitrospina_sp:0.042298150)0.934:0.011901270,((Nitromaritima_KMP11423|SCGC_AAA799_A02:0.031363214,((GCA_002705185_00880|PAJA01000060unannotatedprotein:0.0,MAX17737|Nitrospina_sp:0.0):0.009948403,(GCA_001542995_01387|LFLA01000024unannotatedprotein:0.011368914,(GCA_002453875_01196|DKHT01000003unannotatedprotein:0.0,GCA_002454045_00625|DKID01000024unannotatedprotein:0.0):0.025625262)0.731:0.006753767)0.957:0.010197443)0.837:0.006601827,cas150m-4_02474|CAS-150m-4914Perchloratereductasesubunitalphaprecursor:0.016703925)0.925:0.009659103)0.780:0.008734629,PIQ99248|_Nitrospinae_bacterium_CG11_big_fil_rev_8_21_14_0_20_45_15:0.031915291)0.638:0.007806333)0.907:0.014421329,(WP_042250442|Nitrospina_gracilis:0.018020385,WP_042251421|Nitrospina_gracilis:0.040064063)0.228:0.014895744)1.000:0.388356661)1.000:0.140833958)0.990:0.036064959,((((WP_007222969|Jettenia_caeni:0.0,NxrA_planctomycete_KSU_1_ZP_10101005:0.0):0.002251376,TLD40744|Candidatus_Jettenia_ecosi:0.013337202)0.983:0.006913180,TLD41279|Candidatus_Jettenia_ecosi:0.021669001)0.000:0.000000005,WP_007220240|Jettenia_caeni:0.000000005)0.998:0.026966168)0.882:0.017606145,((WP_070067449|Brocadia_sapporoensis:0.003688908,(OQZ04816|Brocadia_sp_UTAMX1:0.003783493,RZV56287|Brocadia_sp_BROELEC01:0.003479253)0.233:0.001151055)0.997:0.020857077,(KKO18624|Brocadia_fulgida:0.021890769,(OOP55454|Brocadia_caroliniensis:0.024026386,(WP_052561322|Brocadia_sinica:0.000917852,KXK29028|Brocadia_sinica:0.000923980)1.000:0.023040103)0.993:0.017011726)0.725:0.010490186)0.877:0.013675102)0.965:0.015645586)0.779:0.007537636)0.931:0.007662564)0.935:0.007110293); diff --git a/assets/trees/nar_nxr/nar_nxr.refpkg/nar_nxr_seqs_for_tree_aligned.faa b/assets/trees/nar_nxr/nar_nxr.refpkg/nar_nxr_seqs_for_tree_aligned.faa deleted file mode 100644 index 8620f8d1..00000000 --- a/assets/trees/nar_nxr/nar_nxr.refpkg/nar_nxr_seqs_for_tree_aligned.faa +++ /dev/null @@ -1,5425 +0,0 @@ ->RBG1_10 -----------------------------------------------MTLSRRRFLKISSL -SAAGA---------LVDLPELKFLQFLET------VENPLEYYPNR------DW-EKIYR -DQYRY------DSSFTFVCT-PNDTHACRLRAYVRNGIVIRVEQAYDVQNYTDLYGNKAS -VMWSPRGCNKGYNLPRRVYGPYRVKHPMVRKGWKE----------WAE----------AG -FPDPTLPENQQKYF--RRGEDSWVKVSWDEGFELVAKGLLHTMEKYSGEKGAEIL-RKQG -YPEEMIEAM------HGSGAQTIKIRGAMPLLGATRIFGFYRFAN-MLGLYDGK------ ----LGARGWSNFSWHGDLPPGHPMVTGVKCSDPELNDFRHSKLLVFLGKNMVESKMADAH -WWIETIERGGKVVNISPEYSATSSKSDYWIPIRPG-TDTALLLGVTQIIIQEKLY----D -------QDFIKKHTDLPLLIRMDNLKLLRPTDIIKG---YK----------NQILTG--- ---------------YSVKVQKIKPELREKW---------GDFVVWDLKTKK--PQTVT-- --------REDLGEKIERKGL------N---------------------PALEGNY----- -------------------------------------KIKLV-NGKEIEVKTVFQL----- ----YKELLSE-YDLETVS-----------------------------QITGSPKNLIYQL -AQDL-----------ATIKPASIHTGEGVNHFFHCD-LVTRAVWLPLALTGNIGKPGA-N ---VGHWAGNYKGEVFD--------GLG--------------------------------- -------------------------------VYLNE-----DPFNPNLDPSAKLEDIKLKK -YYK------GEEVCYW-----NY---------------EDRPLIVKG----------KCF -TGKTHMPTP---TKAEWVGNGN-LLNNAKWAHN----------------MIANVE--GKV -EMIVYNEIEWTASCEYADVVFPVHSWMELTLPDMTASCSN-PFLQV----W-KGGIKPIF -DTKQDNEVLAGVAAKLSELT---------------------------------------- ----------------HDNRY--KDYWKF-------------------------VLEG--- --------------------------------NNEVYLQRILDACSTTKGYKIDELL-KSD ------RG----WLMNFRT----Y-PRIPFW----EQIQESK--PFYTKT----------- --------------------GRMEFYREEDEFIDYGENLIVHREPVEATPYL--PNVILG- -THKAIR---PNSYGISPESIN---ADERQVRNLKMSWKQVKLSKNPLWEKGFRFYCLTPK -SRHTVHSSWSVLDWNMIWQSNFGDPYRMDNRTPGVGEHQMHMNPLDAKELGINDGDYAYV -DANPEDRPYTGWKEEDPFYKVSRLMVRVKYNPAYPRGITMIKHASFIATHKSVKAHESRP -DKRAVSED-TGYQSSFRYGSQQSIT---RGWLQPTMMTDSLVRKNYMGQEIGEGYEIDVN -APN-TCPKETLVKIIKAE-DGGMGGKGKW---EPARTGYTPAG--ENKDMKKFLEGGFIL -KV-- ->cas150m_01921|CAS-150m-3753Perchloratereductasesubunitalphaprecursor -----------------------------------------------MFLSRRQFLKVTTG -TVAAVA--------LADKALA--LTALQP--VVE-VGNPLGEYPDR------AW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRVRSFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTMHRRVYGPYRLKGPLMRRGWKA----------WMD----------AG -SPEFT-PDVMSKYKFNARYLDDMLRVSWDTAFTYIAKAMLIISERYSGEAGARRL-REQG -YPPEMIEMS------KGSGVRTFKFRAGMPILGVIGKMGITRMNGGCGALLDTYIRKVKP -NQAQGGRYWSNYTWHGDQNPAHPFWSGVQTSDIDMNDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARCVVITPEYNPTAYRADYWIPVRPA-TDAALFLGACKIIFDENMH----D -------HDFCAAYTDMPILVRTDTLQYLDPRDVIQG---YA---------LPDFSKT--- ---------------YSGKVQTLDPAKIARL---------GGFMVWDINKNS--AVPIH-- --------RELVGWHFRNSGI------E---------------------PAMTGSY----- -------------------------------------RVKLL-NGREVDVLPVFQM----- ----YQAHLQD-YDLDTCH-----------------------------QINRAPKDLIVRW -ARDS-----------GTVKPAAIHNGEGTNHYFHQT-IIARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGIWC-ATPWSGGGLG--------------------------------- -------------------------------THTAE-----NPFKITLDPNAHGKEVHVKG -YYY------GEEVAYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNAKHHYD----------------MVKNVD--PHI -ETLITQDVEMTSDVNHNDVAMGVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLTEMT---------------------------------------- ----------------GDKRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYVQRLLDASSTAYGYSVDTML-KSE ------KG----WMVMCRT----Y-PRQPFW----EETNESK--PQWTRT----------- --------------------GRYENYRIEPEAIEYGENFISHREGTEATPYL--PNAIMT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIALPWQEIKRYSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQLHVNPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAFPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAMD-TGYQSNFRYGAQQSFT---RDWLMPMHQLDSLPGKHAVAWKFKFGYQVDNH -AVN-TVPKECLMRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->cas50m_02313|CAS-50m-4275Perchloratereductasesubunitalphaprecursor -----------------------------------------------MFLSRRQFLKVTTG -TVAAVA--------LADKALA--LTALQP--VVE-VGNPLGEYPDR------AW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRVRSFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTMHRRVYGPYRLKGPLMRRGWKA----------WMD----------AG -SPEFT-PDVMSKYKFNARYLDDMLRVSWDTAFTYIAKAMLIISERYSGEAGARRL-REQG -YPPEMIEMS------KGSGVRTFKFRAGMPILGVIGKMGITRMNGGCGALLDTYIRKVKP -NQAQGGRYWSNYTWHGDQNPAHPFWSGVQTSDIDMNDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARCVVITPEYNPTAYRADYWIPVRPA-TDAALFLGACKIIFDENMH----D -------HDFCAAYTDMPILVRTDTLQYLDPRDVIQG---YA---------LPDFSKT--- ---------------YSGKVQTLDPAKIARL---------GGFMVWDINKNS--AVPIH-- --------RELVGWHFRNSGI------E---------------------PAMTGSY----- -------------------------------------RVKLL-NGREVDVLPVFQM----- ----YQAHLQD-YDLDTCH-----------------------------QINRAPKDLIVRW -ARDS-----------GTVKPAAIHNGEGTNHYFHQT-IIARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGIWC-ATPWSGGGLG--------------------------------- -------------------------------THTAE-----NPFKITLDPNAHGKEVHVKG -YYY------GEEVAYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNAKHHYD----------------MVKNVD--PHI -ECLVTQDVEMTSDVNHNDVAMGVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLTEMT---------------------------------------- ----------------GDKRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYVQRLLDASSTAYGYSVDTML-KSE ------KG----WMVMCRT----Y-PRQPFW----EETNESK--PQWTRT----------- --------------------GRYENYRIEPEAIEYGENFISHREGTEATPYL--PNAIMT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIALPWQEIKRYSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQLHVNPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAFPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAMD-TGYQSNFRYGAQQSFT---RDWLMPMHQLDSLPGKHAVAWKFKFGYQVDNH -AVN-TVPKECLMRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->GCA_003523945_00056|DOFS01000023unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------LADKALA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTMHRRVYGPYRLKGPLMRRGWKA----------WMD----------DG -SPEFT-PAVMTKYKFNARYLDDMLRVSWDTAFTYLAKAMIIIAERYSGEAGARRM-REQG -YPPEMIEMT------KGSAIRSFKFRAGMPILGLIGKMGITRMNGGCGALLDTYIRKVQP -DQAQGGRYWSNYTWHGDQNPAHPFWNGVQASDVDMNDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARLVVITPEYNPTAYRADYWMPVRPA-TDGALFLGALKIIFDENLY----D -------YDFCQSYTDMPILVRTDTLQYLDPREVIKD---YA---------FPDFANS--- ---------------YSGKVQTMKPDVIARL---------GGFMVWDLSKNQ--AVPIH-- --------RELVGWHYRKSGI------D---------------------SALTGTY----- -------------------------------------RVTLL-NGREVDVMPIFQM----- ----YQVHLQD-YDLDTVH-----------------------------QINRCPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTNHYFHQT-IIARGAAMVLIVTGNVGKFGT-G ---QHTWAGNYKAGIWN-ATPWGGGGLG--------------------------------- -------------------------------THTGE-----NPFKITTDPNAHGKEIHVKG -YYY------GEEVAYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNAKHHYD----------------MVKNVD--PHI -ETLVNQDVEMTSDVNHNDVSFAVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLSEMT---------------------------------------- ----------------GDGRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYLQRILDASTTAYGYNADVML-KSE ------KG----WMVMCRT----Y-PRHPFW----EETNESK--PQWTRT----------- --------------------GRYENYRVEPECIEYGENFISHREGTEATPYL--PNAIMS- -SNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWQEIKRYSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIALD-TGYQSNFRYGAQQSFT---RDWLMPMQQLDSLPGKHAVGWKFKFGYQVDNH -AVN-TVPKECLIRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->DJ_nxrA -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------LADKALA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTMHRRVYGPYRLKGPLMRRGWKA----------WMD----------DG -SPEFT-PAIMSKYKFNARYLDDMLRVSWDTAFTYLAKAMIIIAERYSGEAGARRL-REQG -YPPEMIEMT------KGSAIRAFKFRAGMPILGLIGKMGITRMNGGCGALLDTYIRKVQP -DQAQGGRYWSNYTWHGDQNPAHPFWNGVQASDVDMNDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARLVVITPEYNPTAYRADYWMPVRPA-TDGALFLGALKIIFDENMY----D -------YDFCQSYTDMPILVRTDTLQYLDPREVIKD---YA---------FPDFANS--- ---------------YSGKVQTMKPDVIARL---------GGFMVWDLNKNQ--AVPLH-- --------RELVGWHYRKSGI------D---------------------SALTGTY----- -------------------------------------RVTLL-SGREVDVMPIFQM----- ----YQVHLQD-YDLDTVH-----------------------------QINRCPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTNHYFHQT-IIARGAAMVLIVTGNVGKFGT-G ---QHTWAGNYKAGIWN-ATPWGGGGLG--------------------------------- -------------------------------THTGE-----NPFKITTDPNAHGKEIHVKG -YYY------GEEVAYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNAKHHYD----------------MVKNVD--PHI -ETLVNQDVEMTSDVNHNDISFAVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLSEMT---------------------------------------- ----------------GDGRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYLQRILDASTTAYGYNADVML-KSE ------KG----WMVMCRT----Y-PRHPFW----EETNESK--PQWTRT----------- --------------------GRYENYRVEPEAIEYGENFISHREGTEATPYL--PNAIMS- -SNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWAEIKRYSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVFV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIALD-TGYQSNFRYGAQQSFT---RDWLMPMQQLDSLPGKHAVGWKFKFGYQVDNH -AVN-TVPKECLIRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->DJ_nxrA2 -----------------------------------------------MLVTKRQFLKITAG -TVAAVA--------LADNALA--LTALQP--VVE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDMYGNRGT -FAHNPRMCLKGYTYHRRVYGPYRLKGPLMRRGWKA----------WMD----------DG -SPELD-PTVMTKYKFSARYLDDMLRVSWDTAFTYLAKAMIVIANRYSGEAGARRL-REQG -YPPEMIEMM------KGSGVRSMKFRAGMPVLGVIGKMGITRMNGGCGALLDSWVRKVGP -DSAQGGRYFNNLTWHGDQDPSQPFWSGAQAIDCDLSDMRFSKMNTSWGKNFVENKMPEAH -WKLESIERGGRVVVITPEYNPTAQRADYWMPVRPE-TDGALFLGACKIILDDGLQ----D -------NDFIRSSTDFPLLIRTDTLQYLDPRDVIKD---YA---------FPDFSKS--- ---------------YSGKVQGLSPSQIARL---------GGFMVWDLNQDK--AVPLH-- --------RELVGWHFKKSGI------D---------------------PALTGSF----- -------------------------------------RVKLL-SGREADVMPLFQM----- ----YQVHLQD-YDLDTVH-----------------------------QINRCPKDLIVRW -ARDN-----------GTIKPAAIHNGEGVCHYFHMT-SMGRAAAMVMTLTGNMGKFGS-G ---CHTWSGNYKVGVWA-ATPWSGEGIG--------------------------------- -------------------------------IHTGE-----NPFKITTDPNAHGKEINYRP -YYY------GEETTYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKLRWVANVN-ILNNSKHHYD----------------MVKNVD--PHI -ETIVTQDIEMTSDVNHADVSFAVNGWMEFTYPEMTATVSN-PWMQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLTEMT---------------------------------------- ----------------GDGRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYVQRLLDAGSTSYGYSADTML-KSE ------KG----WMVMTRT----Y-PRIPLW----EETNESK--PMWTRS----------- --------------------GRLETYRVEPEAIEYGENFISHREGTEATPYL--PNAIMS- -SNPYIR---PDDYGIPITAQH---HDDKTVRNIKLPWAEIKRYANPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQIHVNPSAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAFPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIALD-TGYQSNFRYGAQQSFT---RSWLMPMHQLDSLPGKMANKWKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->DJ_nxrA1 -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------LADKALA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTMHRRVYGPYRLKGPLMRRGWKQ----------WMD----------DG -SPEFT-PAIQTKYKFNARYLDDMLRVSWDTAFTYLAKAMIVIANRYSGEYGARKL-REQG -YPPEMIEMM------KGSGVRAFKFRAGMPVLGIIGKMGITRMNGGCGALLDSWVRKVGP -ENAQGGRYWNNYTWHGDQDPSQPWWNGTQNCDIDLSDMRFCKFNTSWGKNFVENKMPEAH -WKLESIERGARIAVITPEYNPTAYRADYWIPIRPE-SDGSFFLGACKMIVDEGLF----D -------ADFVRANTDMPLLVRTDTLQYLDPRDVIKD---YQ---------FPDFSNT--- ---------------YSGKVQTLKPAEIARL---------GGIMVWDLNKNQ--AVPIH-- --------RELVGWHFKKSGI------D---------------------PALTGTH----- -------------------------------------RVRLL-TGREVDVMPIFQM----- ----YQVHLQD-YDLDTVH-----------------------------QICRSPKDLIVRW -ARDM-----------GTVKPAAIHNGEGVCHYFHMT-QNGRAAALTLIYSGNMGKFGS-G ---CHTWSGNYKAGTWA-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFKITTDPNAHGKEIKTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNSKHHYD----------------MVKNVD--PHN -ECLVHQEVEMTSDVNHFDVSFAVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLTEMT---------------------------------------- ----------------GDGRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYLQRLLDAGNCSYGYNADTML-KSE ------KG----WMVMTRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRVETYRVEPEAIEYGENFIVHREGPEATPYL--PNAIMS- -SNPYIR---PDDYGVPITAQH---HDDKTVRNIKLPWAEIKRYANPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQIHINPSAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAFPYHVTMAKHAPFVSTAKSVKGHETRP -DGRAIALD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHPVAWKFKWGFAIDHH -AVN-TTPKECLIRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->GCA_001567445_02228|JZQY01000048unannotatedprotein ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------MPIFQL----- ----YQVHLQD-YDLDTVH-----------------------------QVNRSPKDLIVRW -ARDC-----------GTIKPAAIHNGEGVCHYFHMT-SMGRAAALVMMLTGNIGKFGT-G ---CHTWSGNYKVGIWQ-AAPWSGAGAS--------------------------------- -------------------------------VYLGE-----DPWNLNLTTDAHGKEIKYRK -YYY------GEEPGYW-----NH---------------GDNALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVVNVN-ILNNSKHHYD----------------MVKNVD--PNI -EMLVTQDIEMTSDVNHADVAFAVNSWMEFTYPEMTATVSN-PWIQI----W-KGGIRPLY -DTRNDADTFAGVSAKLKELT---------------------------------------- ----------------GEARM--ADTYRF-------------------------VYQN--- --------------------------------RMDIYVQRILDASTTFYGYSADVML-KSE ------KG----WMVMCRT----Y-PRHPLW----EETNESK--PHWTRS----------- --------------------GRLESYRIEPEAIEYGENFIVHREGPECTPYL--PNAIMS- -TNPYIR---PDDYGIPITAQH---HDDKTVRNIKLPWQEIKRHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYCFV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHTIAWKFKWGYAIDHH -GIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->CBK42928|Nitrospira_defluvii ----------------------------------------------MMQLSRRQFLKVSAG -TVAVAA--------VADKALA--LTALQP--VVE-VNNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-SDVKRKYKFDSRFLDDMVRVSWDTAFTYVAKGLIVIGTRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPILGMMGKHANTRFNNCVLPLLDSWIRKVNP -DQAQGGRYWNNYTWHGDQDPSQPWWNGTQNCDVDLSDMRFTKLNTSWGKNFVENKMPEAH -WKLESMERGARLVIITPEYNPTASRADYWIPVRPE-TDGALFLGASKIILDENYQ----D -------IDFIKGFTDMPLLVRTDTLQYLDPHEVLKD---YQ---------VPDFTKS--- ---------------YSGRVQGLSQDQVQRL---------GGMMVWDLAKGK--AVPLH-- --------REQVGVHLAQSGI------D---------------------PALTGTY----- -------------------------------------RIKLL-NGREVDVMPIYQL----- ----YTIHLQD-YDLDTVH-----------------------------QVNRAPKDLIVRW -ARDC-----------GTVKPAAIHNGEGVCHYFHMT-SMGRAAALVMMLTGNIGKFGT-G ---CHTWSGNYKVGIWQ-AAPWSGAGAS--------------------------------- -------------------------------VYLGE-----DPWNLNLRDDVHGKEIKYRK -YYY------GEEPGYW-----NH---------------GDNALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVVNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMLVTQDIEMTSDVNHADVAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFAGVAAKLKEMT---------------------------------------- ----------------GEQRM--ADTYKF-------------------------VYHN--- --------------------------------RVDIYVQRILDASTTFFGYSADVML-KSE ------KG----WMVMCRT----Y-PRHPLW----EETNESK--PHWTRS----------- --------------------GRLETYRIEPEAIEYGENFISHREGPECTPYM--PNAIMT- -TNPYVR---PEDYGIPVTAQH---HDDKTVRNIKLPWSEIKQHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYCYV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKQANALKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMVKWLKGEHIK -IKV- ->NxrA1_Nitrospira_defluvii_YP_003798853 ----------------------------------------------MMQLSRRQFLKVSAG -TVAVAA--------VADKALA--LTALQP--VVE-VNNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-SDVKRKYKFDSRFLDDMVRVSWDTAFTYVAKGLIVIGTRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPILGMMGKHANTRFNNCVLPLLDSWIRKVNP -DQAQGGRYWNNYTWHGDQDPSQPWWNGTQNCDVDLSDMRFTKLNTSWGKNFVENKMPEAH -WKLESMERGARLVIITPEYNPTASRADYWIPVRPE-TDGALFLGASKIILDENYQ----D -------IDFIKGFTDMPLLVRTDTLQYLDPHEVLKD---YQ---------VPDFTKS--- ---------------YSGRVQGLSQDQVQRL---------GGMMVWDLAKGK--AVPLH-- --------REQVGVHLAQSGI------D---------------------PALTGTY----- -------------------------------------RIKLL-NGREVDVMPIYQL----- ----YTIHLQD-YDLDTVH-----------------------------QVNRAPKDLIVRW -ARDC-----------GTVKPAAIHNGEGVCHYFHMT-SMGRAAALVMMLTGNIGKFGT-G ---CHTWSGNYKVGIWQ-AAPWSGAGAS--------------------------------- -------------------------------VYLGE-----DPWNLNLRDDVHGKEIKYRK -YYY------GEEPGYW-----NH---------------GDNALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVVNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMLVTQDIEMTSDVNHADVAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFAGVAAKLKEMT---------------------------------------- ----------------GEQRM--ADTYKF-------------------------VYHN--- --------------------------------RVDIYVQRILDASTTFFGYSADVML-KSE ------KG----WMVMCRT----Y-PRHPLW----EETNESK--PHWTRS----------- --------------------GRLETYRIEPEAIEYGENFISHREGPECTPYM--PNAIMT- -TNPYVR---PEDYGIPVTAQH---HDDKTVRNIKLPWSEIKQHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYCYV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKQANALKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMVKWLKGEHIK -IKV- ->GCA_003456605_00391|DMQK01000091unannotatedprotein ----------------------------------------------MMQVSRRQFLKVSAG -TVAAAA--------VADKALA--LTALQP--VVE-VDNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-SDVKRKYKFDSRFLDDMVRVSWDTAFTYVAKGLVVIGTRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPILGMMGKHANTRFNNCVLPLLDSWIRKVNP -DQAQGGRYWNNYTWHGDQDPSQPWWNGTQNCDVDLSDMRFTKLNTSWGKNFVENKMPEAH -WKLESIERGARLVVITPEYNPTASRADYWIPVRPE-TDGALFLGASKIILDENYQ----D -------IDFIKGFTDMPLLVRTDTLQYLDPYEVVKE---YQ---------LPDFTKS--- ---------------YSGRIQGLTQDHIRRL---------GGMMVWDLAKGQ--AVPLH-- --------REQVGLHFAQTGI------D---------------------PALTGTY----- -------------------------------------RVKLL-NGREIDVMPVYQM----- ----YTIHFQD-YDLDTVH-----------------------------QINRAPKDLIVRW -ARDC-----------GTVKPAAIHNGEGVCHYFHMT-SMGRAAALVMMLTGNIGKFGT-G ---CHTWSGNYKVGIWQ-AAPWSGAGAS--------------------------------- -------------------------------VYLGE-----DPWNLNLKDDVHGKEIKYRK -YYY------GEEPGYW-----NH---------------GDNALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVVNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMLVTQDIEMTSDVNHADVAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFSGVAVKLKEIT---------------------------------------- ----------------GDQRM--ADTYKF-------------------------VYQN--- --------------------------------RVDIYVQRILDASSTFFGYSADVML-KSE ------KG----WMVMCRT----Y-PRHPLW----EETNESK--PHWTRS----------- --------------------GRLESYRIEPEAIEYGENFISHREGPECTPYL--PNAIMT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWSEIKQQANPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYCYV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQANFRYGAQQSFT---RSWLMPMHQTDSLPGKQANAMKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMAKWLKGEHIK -IKV- ->Baikal-deep-G159_00763|Baikal-deep-G159-c12unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAAA--------VADKALA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTFHRRVYGPYRLKGPLMRKGWKE----------WMD----------AG -SPELT-PDVKRKYKFDARMLDDMVRASWDTAFTYVAKACILIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIIGKMMNTRFNGGVLPVLDSWIRKVDP -DKAQGGKYYSNYTWHGDQDPSHPWWNGTQNCDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPVRPE-TDGANFLGACKIIIDENMQ----D -------IDYIKGYTDMPLLVRTDTLQYLDPREVIAD---FK---------FPDFSKS--- ---------------YSGRVQSLKPEQIERL---------GGMMVWDNNKKA--AVPLH-- --------REQVGWHYQNSGI------D---------------------AALTGTY----- -------------------------------------RVKLI-NGREVDVAPIWQM----- ----YMVHFQD-YDLDTVH-----------------------------QITRSPKDLIVRY -GRDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAALMMTITGNIGKFGT-G ---CHTWSGNYKAGVWN-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNQTLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIITQDIEMTSDVNHADVAFACNSWMEFTYPEMTATVSN-PWLQI----W-KGGIRPLY -DTRNDADTFGGVAVKLTELT---------------------------------------- ----------------GDARI--RQVFHF-------------------------VYQN--- --------------------------------RVDVYVQRALDASATCYGYNADTML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFVVHREGPECTPYL--PNAIFS- -TNPYVR---PDDYGIPITAQH---HDDKHIRNLKLPWTEIKRQSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYIYV -DGNPVDRPYRGWKPSDPFYKVSRLMIRAKYNPAFPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHAIAWKFKWGYAIDHH -AVN-TTPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->Baikal-deep-G158_01775|Baikal-deep-G158-c18unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAAA--------VADKALA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTFHRRVYGPYRLKGPLMRKGWKE----------WMD----------AG -SPELT-PDVKRKYKFDARMLDDMVRASWDTAFTYVAKACILIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIIGKMMNTRFNGGVLPVLDSWIRKVDP -DKAQGGKYYSNYTWHGDQDPSHPWWNGTQNCDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPVRPE-TDGANFLGACKIIIDENMQ----D -------IDYIKGYTDMPLLVRTDTLQYLDPREVIAD---FK---------FPDFSKS--- ---------------YSGRVQSLKPEQIERL---------GGMMVWDNNKKA--AVPLH-- --------REQVGWHYQNSGI------D---------------------AALTGTY----- -------------------------------------RVKLI-NGREVDVAPIWQM----- ----YMVHFQD-YDLDTVH-----------------------------QITRSPKDLIVRY -GRDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAALMMTITGNIGKFGT-G ---CHTWSGNYKAGVWN-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNQTLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIITQDIEMTSDVNHADVAFACNSWMEFTYPEMTATVSN-PWLQI----W-KGGIRPLY -DTRNDADTFGGVAVKLTELT---------------------------------------- ----------------GDARI--RQVFHF-------------------------VYQN--- --------------------------------RVDVYVQRALDASATCYGYNADTML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFVVHREGPECTPYL--PNAIFS- -TNPYVR---PDDYGIPITAQH---HDDKHIRNLKLPWTEIKRQSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYIYV -DGNPVDRPYRGWKPSDPFYKVSRLMIRAKYNPAFPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHAIAWKFKWGYAIDHH -AVN-TTPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->CBK42946|Nitrospira_defluvii ---------------------------------------------MQVSVSRRQFLKISAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHGCRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PDVKRKYKFDSRFLDDLNRVSWDTAFTYVAKAAVLIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIVGKMMNTRFNGGCLPLLDSWIRKVDA -EKAQGGKYYSNYTWHGDQDPSHPFWNGTQNCDVDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPVRPE-TDGANFLGAAKIIFDENLQ----D -------IDYIKEFTDLPLLVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQVERL---------GGMMVWDLAKGK--AVPLH-- --------REQVGFHFKESGI------D---------------------PALTGTF----- -------------------------------------RVKLL-NSREIDVMPIYQM----- ----YQVHLQD-YDLDTTH-----------------------------QITRAPKDLIVRW -ARDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAAFIMTITGNIGKFGT-G ---CHTWSGNYKAGIWN-AVPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNLTLDPNAHGKEIKTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIVTQDIEMTSDVNHADVAFACNSWMEFTYPEMTGTVSN-PWIQI----W-KGGIRPLY -DTRNDADTFAGVAAKLAEMT---------------------------------------- ----------------GDARF--RGVFHF-------------------------VYMN--- --------------------------------RVDVYPQRMLDASATCYGYSADVML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFISHREGPECTPYL--PNAIFS- -NNPFIR---PDDYGIPITAQH---HDDKHVRNIKLPWAEIKRHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVFV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHTIAWKFKWGYAIDHH -GIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->NxrA2_Nitrospira_defluvii_YP_003798871 ---------------------------------------------MQVSVSRRQFLKISAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHGCRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PDVKRKYKFDSRFLDDLNRVSWDTAFTYVAKAAVLIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIVGKMMNTRFNGGCLPLLDSWIRKVDA -EKAQGGKYYSNYTWHGDQDPSHPFWNGTQNCDVDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPVRPE-TDGANFLGAAKIIFDENLQ----D -------IDYIKEFTDLPLLVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQVERL---------GGMMVWDLAKGK--AVPLH-- --------REQVGFHFKESGI------D---------------------PALTGTF----- -------------------------------------RVKLL-NSREIDVMPIYQM----- ----YQVHLQD-YDLDTTH-----------------------------QITRAPKDLIVRW -ARDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAAFIMTITGNIGKFGT-G ---CHTWSGNYKAGIWN-AVPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNLTLDPNAHGKEIKTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIVTQDIEMTSDVNHADVAFACNSWMEFTYPEMTGTVSN-PWIQI----W-KGGIRPLY -DTRNDADTFAGVAAKLAEMT---------------------------------------- ----------------GDARF--RGVFHF-------------------------VYMN--- --------------------------------RVDVYPQRMLDASATCYGYSADVML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFISHREGPECTPYL--PNAIFS- -NNPFIR---PDDYGIPITAQH---HDDKHVRNIKLPWAEIKRHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVFV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHTIAWKFKWGYAIDHH -GIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_900170025_02937|FWEX01000006unannotatedprotein ---------------------------------------------MQVSVSRRQFLKISAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHGCRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PDVKRKYKFDSRFLDDLNRVSWDTAFTYVAKAAVLIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIVGKMMNTRFNGGCLPLLDSWIRKVDA -DKAQGGKYYSNYTWHGDQDPSHPFWNGTQNCDVDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPLRPE-TDGANFLGAAKIIFDENLQ----D -------IDYIKEFTDLPLLVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQVERL---------GGMMVWDLAKGK--AVPLH-- --------REQVGFHFKESGI------D---------------------PALTGTF----- -------------------------------------RVKLL-NGREIDVMSIYQM----- ----YQVHLQD-YDLDTTH-----------------------------QITRAPKDLIVRW -ARDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAAFIMTITGNIGKFGT-G ---CHTWSGNYKAGIWN-AVPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNLTLDPNAHGKEIKTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIVTQDIEMTSDVNHADVAFACNSWMEFTYPEMTGTVSN-PWIQI----W-KGGIRPLY -DTRNDADTFAGVAAKLAEMT---------------------------------------- ----------------GDARF--RGVFHF-------------------------VYMN--- --------------------------------RVDVYPQRMLDASATCYGYSADVML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFISHREGPECTPYL--PNAIFS- -NNPFIR---PDDYGIPITAQH---HDDKHVRNIKLPWAEIKRHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVFV -DGNPVDRPYRGWKPSDPFYKVSRLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHTIAWKFKWGYAIDHH -GIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->CUS31266|Nitrospira_nitrosa -----------------------------------------------MVITRRQFMKASAG -TIAAIA--------VADKVLA--LTALQP--VTE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLIRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFASRFLDDMLRVSWDTAFTYAAKAMVVIATRYSGEAGARRL-REQG -YAPEMVEMM------KGAGVRCFKHRAGMPILGFIGKHSNTRFNNSVLPVLDTWVRKVGP -DQAQGGRYWNNYTWHGDQDPSQPFWNGTQNCDVDLSDMRFTKFNTSWGKNFVENKMPEAH -WKLESIERGARLAVITPEYNPTAQRADYWIPLRPQ-SDGALFLGACKIILDENMH----D -------VDYLKQFTDMPLLVRTDTLQYLDPREVIPD---YK---------FPDFSHS--- ---------------YSGRIQALKPEYIERL---------GGFMVWDLAKQK--AVPLH-- --------REQVGWHFDSSGI------Q---------------------PALTGTY----- -------------------------------------RVKLL-NGREIDAQPIYQM----- ----YQIHFQD-YDLDTTH-----------------------------QITRSPKDLLVRW -ARDS-----------GTIKPAAIHNGEGVCHYFHMT-SNGRAAALVLTLTGNIGKFGS-G ---CHTWSGNYKVGIWS-ATPWSGSGSG--------------------------------- -------------------------------VHLSE-----DPWQINLDPNAHGKEIKYKS -YYY------GEEPGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKLRWVVNVN-LLNNAKHHYD----------------MVRNVD--PNI -ECLITQDIEMTSDVNHADIAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDADTFAGVAARLAEIT---------------------------------------- ----------------GEKRM--RDVFHF-------------------------VYEN--- --------------------------------RVDVYAQRLLDASSTFYGYSADVLL-KSE ------KG----WMVMVRT----Y-PRHPLW----EETNESK--PMWTRS----------- --------------------GRIESYRVEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPHVR---PDDYGIPVTAQH---HDDKTIRNIKLPWVEIKRHTNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQVHINPQAAKDRGINDGDYVYI -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTPKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKSANGLKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->CUS38776|Nitrospira_nitrificans -----------------------------------------------MLVSRRQFMKATAG -TIAAAA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WAD----------DG -SPELT-PEAKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIVIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRCFKHRAGMPILGFIGKHSNTRFNNSVLPLLDTWIRKVGP -DQAQGGRYWNNYTWHGDQDPSQPFWNGTQNCDVDLSDMRFTKFNTSWGKNFVENKMPEAH -WKLESIERGARIAVITPEYNPTAQRADYWIPLRPQ-SDGALFLGACKIILDENMQ----D -------IDYLKQFTDMPLLVRTDTLQYLDPRDVIQD---YK---------FPDFSHS--- ---------------YSGRIQALKPEYIERL---------GGFMVWDMAKKQ--AVPLH-- --------REQVGWHFDKSGI------E---------------------PALTGTY----- -------------------------------------RVKLL-NGREIDALPIYQL----- ----YLIHLQD-YDLDTTH-----------------------------QITRSPKDLLVRW -ARDS-----------GTIKPAAIHNGEGVCHYFHMT-ANGRAAALVLTLTGNIGKFGS-G ---CHTWSGNYKVGIWN-ATPWSGVGGG--------------------------------- -------------------------------VHLSE-----DPWHINLDANAHGKEIKYRN -YYY------GEEPAYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-LLNNAKHHYD----------------MVRNVD--PNI -ECLITQDIEMTSDVNHADIAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDADTFAGVAAKLAEIT---------------------------------------- ----------------GEKRM--RDVFHF-------------------------VYEN--- --------------------------------RVDVYAQRLLDASSTFYGYSADVLL-KSE ------KG----WMVMVRT----Y-PRHPLW----EETNESK--PMWTRS----------- --------------------GRIESYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYVR---PDDYGIPIAAQH---HDDKMIRNIKLAWQEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQVHINPQAAKDRGINDGDYVYI -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKSANGLKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->WP_080886776|Nitrospira_japonica ---------------------------------------------MTMFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMMRVSWDTAFTYAAKSMIVIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDTWIRKVTS -DQAQGGRYWSNYTWHGDQNPSQPWWCGAQASDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGGRIVVITPEYNPTAYRADYWMPLRPQ-SDGAIFLGAMKIITDENMH----D -------IDFLKGYTDAPVLVRTDTLQFVDPRDVVRD---YK---------FPDFSKS--- ---------------YSGRVQTLKPEQVERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYSNSGI------D---------------------AALTGTY----- -------------------------------------RIKLL-NGREIDVMPVWQL----- ----YLVHFQD-YDLDTVH-----------------------------QICRTPKDLLVRW -ARDS-----------GTVKPAAIHNGEGTNHYFHMT-VNSRGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWV-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVTNVN-VLNNAKHHYD----------------MVRNVD--PSI -ETLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTVTVSN-PWVQV----W-KGGIRPLY -DTRNDLDTFAGVAAKLSEIT---------------------------------------- ----------------GDKRM--RDYFAM-------------------------VYMN--- --------------------------------RVDVYVQRLLDASATFYGYSADTML-KSE ------KG----WMVMVRT----Y-PRVPFW----EETNESK--PMWTRT----------- --------------------GRFETYRTEPEAIEYGENFISHREGTEATPYL--PNAIMT- -SNPYCR---PDDYGIPITAQH---HDDKTVRNIKLPWSEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHANGLKWKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.137_k121_1578656_32 rank: A; nmv:NITMOv2_4538 putative Nitrite oxidoreductase, alpha subunit; K00370 (db=kegg) -----------------------------------------------MFLSRRQFLKVSVG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKE----------WMD----------AG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGVNALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPFWCGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPA-SDGAIFLGAMKIIVDENMH----D -------VDFLKGYTDSPVLVRTDTLQFLDPRDVVAD---YK---------FPDFSKS--- ---------------YSGRVQSLKPEQVERL---------GGMMVWDLNKKA--AVPLH-- --------REQVGWHYQNSGI------D---------------------AALTGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTCH-----------------------------QICRTPKDLLVRW -ARDS-----------GSIKPAAIHNGEGTNHYFHQT-INSRGAAMVLIVTGNVGKFGT-G ---QHTWAGNYKAGTWT-STPWSGAGIA--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFAANSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--RDYFKF-------------------------VYEN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRTPFW----EETNESK--PMWTRT----------- --------------------GRYENYRTEPEAIEYGENFISHREGTEATPYL--PNAIMT- -SNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWQEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVATPKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQLDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002737345_00863|NSIK01000010unannotatedprotein -----------------------------------------------MFLSRRQFLKVSVG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKE----------WMD----------AG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIVIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRTFKHRAGMPVLGIIGKMGNTRMNGGVNALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPFWCGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPA-SDGAIFLGAMKIIVDENMH----D -------VDFLKGYTDSPVLVRTDTLQFLDPREVVAD---YQ---------FPDFSKS--- ---------------YSGRVQSLKPEGIARL---------GGMMVWDLNKKA--AVPLH-- --------REQVGWHYQNSGI------D---------------------AALTGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTCH-----------------------------QICRTPKDLLVRW -ARDS-----------GSIKPAAIHNGEGTNHYFHQT-INSRGAAMVLIVTGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGIA--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFAANSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--RDYFKF-------------------------VYEN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRTPFW----EETNESK--PMWTRT----------- --------------------GRYENYRTEPEAIEYGENFISHREGTEATPYL--PNAIMT- -SNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWAEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTPKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQLDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002420115_02525|DIHK01000043unannotatedprotein -----------------------------------------------MFLSRRQFLKVSVG -TVAAAA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDSWIRKVSP -DQAQGGRYWSNYTWHGDQNPSQPFWSGVQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPQ-SDGALFMGAMKIIIDENMH----D -------VDFLKQFTDAPILIRTDTLQYLDPRDVVPD---YK---------FPDFSKS--- ---------------YSGRIQALKPQDVERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYMNSGI------D---------------------AALNGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTTH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGVTHYFHMT-PNGRAAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGAWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTITVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSEMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGVPITAQH---HDDKTIRNIKLSWHEIVRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTPKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002483475_03556|DLHZ01000062unannotatedprotein -----------------------------------------------MFLSRRQFLKVSVG -TVAAAA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDTWIRKVSP -EQAQGGRYWSNYTWHGDQNPSQPFWSGVQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGALFLGAMKIIVDENMH----D -------VDFLKQFTDAPILVRTDTLQYLDPRDVVAD---YK---------FPDFSKS--- ---------------YSGRIQALKPQDIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYMNSGI------D---------------------AALNGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTTH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGVTHYFHMT-PNGRAAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGCWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNL -ECLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTITVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSEMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIVRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_001458695_00808|LN885086unannotatedprotein -----------------------------------------------MFLSRRQFLKVSVG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -APELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDTWIRKVGP -DQAQGGRYWSNYTWHGDQNPAHPWWSGVQGSDVDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPQ-SDGALFLGAMKIIVDENMH----D -------VDFLKSFTDAPILVRTDTLQYLDPRDVIPD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQIQRL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYVNSGI------D---------------------AALTGTY----- -------------------------------------RVKLL-NGREIDAMPIWQM----- ----YMVHFQD-YDLDTVH-----------------------------QITRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGAWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIHTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVTNVN-VVNNAKHHYD----------------MVKNVD--PNI -ECLITQDIEMTSDINHADIAFACNSWMEFTYPEMTITVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRPEAEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIKLSWDEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPFVATPKSVKGHETRP -DGRAIAID-TGYQSNFRYGCQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_900078535_00262|FJVM02000053unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------IADNVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIGTRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRSGMPVLGIIGKMGNTRMNGGINALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPFWSGVQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGSLFLGAMKIIVDENMH----D -------SDFMKQFTDAPILVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQTLKPEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYTNSGI------D---------------------AALTGSY----- -------------------------------------RVKLL-NGREIDAMPIWQM----- ----YMVHFQD-YDLDTVH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKQ -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNI -ECLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYVR---PDDYGIPITAQH---HDDKTIRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMSKHAPYVATPKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQLDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002451055_00821|DKBD01000269unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRRYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPFWSGVQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGALFLGAMKIMVDENMH----D -------IDFMKSFTDAPILVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKGEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYANSGI------D---------------------AALTGSY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTVH-----------------------------QITRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-ANARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VVNNAKHHYD----------------MVRNVD--PNI -ECLITQDIEMTSDINHADIAFACNSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAVAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002331335_02310|DCZO01000011unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVIMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRSGMPVLGIIGKMGNTRMNGGINALLDTWIRKVGP -DQAQGGRYWSNYTWHGDQNPAHPWWSGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGSLFLGAMKIIVDENMH----D -------IDFMKSFSDAPILIRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKAEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYANSGI------D---------------------AALNGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YMVHFQD-YDLDTVH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INSRGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGAWT-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVTNVN-VLNNAKHHYD----------------MVRNVD--PNL -ECLITQDVEMTSDVNHNDIAFACNTWVEFTYPEMTITVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--RDYFAM-------------------------VYSN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMTKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->WP_053378142|Nitrospira_moscoviensis -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIVATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGILGKMGNTRMNGGINALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPWWSGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGSLFLGAMKIIVDENMH----D -------IDFLKSFTDAPILVRTDTLQYLDPRDVVAD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYVNSGI------D---------------------AALTGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTVH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNITTDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKLRWVTNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGTAAKLSEMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYLN--- --------------------------------RVDVYAQRMLDASSTFYGYSADTML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->riogrande_2019_sw_WHONDRS-S19S_0066_A_bin.62_Ga0451725_0007910_5 rank: A; nmv:NITMOv2_4538 putative Nitrite oxidoreductase, alpha subunit; K00370 (db=kegg) -----------------------------------------------MFLSRRQFLKISAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKA----------WMD----------DG -SPELT-PDTKRKYKFDSRFLDDMLRVSWDTAFTYAAKAYIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGILGKMGNTRMNGGINALLDTWIRKVNP -EQAQGGRYWSNYTWHGDQNPAHPWWSGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGALFIGAMKIIVDENMH----D -------IDFLKSFTDAPILVRTDT------------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->GCA_002083555_01644|MSXN01000007unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKA----------WMD----------DG -SPELT-PDTKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMVIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGILGKMGNTRMNGGINALLDTWIRKVSP -EQAQGGRYWSNYTWHGDQNPAHPWWSGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGALFLGAMKIIVDENMH----D -------IDFLKSFTDAPILVRTDTLQYLDPRDVVKD---YA---------FPDFSKS--- ---------------YSGRMQSLKPEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYTNSGI------D---------------------AALNGTF----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTTH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNITTDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVTNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYTN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPSYPYHVTMAKHAPYVATPKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002328125_01442|DCWK01000050unannotatedprotein -----------------------------------------------MKLSRRKFLAASGS -GLLA----------WSGRGLA--LAALHP--TGE-MGNPLTNYPNR------GW-EKVYR -DQYKV------DGSFTWVCS-PNCTHECRLKAFTRNGIVLRTEQNYDKHRITDIYGVKAT -HHWNPRGCPNGFTFQRRMYGPYRLRYPMVRRGWKR----------WAD----------DG -FPELN-EANKKKYKFDSRGTDTFVRVKWDDAFTYASKGFIQISKTYSGDAGKKRL-LDQG -YDPASLTHW------DGAGTRTMKFRGGMGLLGVIGKYGMYRFAN-TMSLLDTHTRGVGP -KKARGGRAWSNYTWHGDQAPGHPFVHGLQASDCDFNDLRNSKLHIHMGKNLVENKRPDSH -FFMESMERGAKIIVVAPEYSPPATKADYWIPIRPQ-TDTALLLGVTKILIDRGWY----D -------AKFVKEFTDFPLLVRTDNLRRLRPQDVIPG---YK---------NQDISGG--- ---------------PSFKIHGLTPKYRDAA---------GDFMIWDKGKNA--PAPIT-- --------RDDVGKHIGAKNL------D---------------------PALEGKY----- -------------------------------------TVKLV-SGVEIEVMPVFEM----- ----YKSHHLKDYDLDTVH-----------------------------EITHSPKDLIERF -AKDV-----------ATIKPAALHVGEGVNHWFHAT-MTNRAQYLPMTLTGNIGKLGA-G ---CHTWAGNYKAALFQ-GSGWSGPGFK--------------------------------- -------------------------------GWIAE-----DPFNPNLDPKADGKNIKVRG -TIK------DEEPAYW-----NY---------------GDKPLVVDTP-----KYGRKVF -TGKTHMPSP---TKSLWFTNVN-IFNNAKWLYE----------------MVKNVN--PKI -EMIICSEIEMTSTAEYSDILLPANTWMEFEQPEITGSCSN-PFLQI----W-KGGVKPIY -DTKDDILIMAEMAKKLGEIL---------------------------------------- ----------------KDKRF--EKYWKF-------------------------ALDK--- --------------------------------KAEVYIQRLLDSSTPTRGYKYDDIM-AGK ------YGESGTALMLFRS----Y-PRVPFL----EQIEESV--PFYSPT----------- --------------------GRLQAYNDEPGVIEYGENLIVQREGPEGTPYL--PNVIIS- -SSPFIR---PEDYGIPENHMG---WDERQVRNIKLPWKEAKDTKNPLWEAGYRFFCLTPK -SRHLTHSSWQVTDWNFIWSTSFGDPYRMDRRQPGVGENQVQMNPETAKDLGFNEGDYVYV -DANPADRPYIGWKPSDPFYKVARLMLRVKYNPSYPYDVVMIKHGAWCATEKSVKGHETRK -DGRAVSAD-TGYQASYRYGSHQSIT---RGWLMPMHQLDSLFHKKKVFMGFMLGGEADNH -AIN-TVPKETLVKLTKAE-DGGLGGRGVW---APATTGFSVGN--ENKFMQSYLQGT-VK -VKRG ->GCA_002685755_01556|NYYB01000002unannotatedprotein -----------------------------------------------MKLSRRKFLAASGS -GLLA----------WSGRGLA--LAALHP--TGE-MGNPLTNYPNR------GW-EKVYR -DQYKV------DGSFTWVCS-PNCTHECRLKAFTRNGIVLRTEQNYDKHRITDIYGVKAT -HHWNPRGCPNGFTFQRRMYGPYRLRYPMVRRGWKR----------WAD----------DG -FPELN-EANKKKYKFDSRGTDIFVRVKWDDAFTYASKGFIQISKTYSGDAGKKRL-LDQG -YDPASLTHW------DGAGTRTMKFRGGMGLLGVIGKYGMYRFAN-TMSLLDTHTRGVGP -KKARGGRAWSNYTWHGDQAPGHPFVHGLQASDCDFNDLRNSKLHIHMGKNLVENKRPDSH -FFMESMERGAKIIVVAPEYSPPATKADYWIPIRPQ-TDTALLLGVTKILIDRGWY----D -------AKFVKEFTDFPLLVRTDNLRRLRPQDVIPG---YK---------NQDISGG--- ---------------PSFKIHGLTPKYRDAA---------GDFMIWDKGKNA--PAPIT-- --------RDDVGKHIGAKNI------D---------------------PALEGKY----- -------------------------------------TVKLV-SGVEIEVMPVFEM----- ----YKSHHLKDYDLDTVY-----------------------------EITHSPKDLIERF -AKDV-----------ATIKPAALHVGEGVNHWFHAT-MTNRAQYLPMTLTGNIGKLGA-G ---CHTWAGNYKAALFQ-GSGWSGPGFK--------------------------------- -------------------------------GWIAE-----DPFNPNLDPKADGKNIKVRG -TIK------DEEPAYW-----NY---------------GDKPLVVDTP-----KYGRKVF -TGKTHMPSP---TKSLWFTNVN-IFNNAKWLYE----------------MVKNVN--PKI -EMIICSEIEMTSTAEYSDILLPANTWMEFEQPEITGSCSN-PFLQI----W-KGGVKPIY -DTKDDILIMAEMAKKLGEIL---------------------------------------- ----------------KDKRF--EKYWKF-------------------------ALDK--- --------------------------------KAEVYIQRLLDSSTPTRGYKYDDIM-AGK ------YGESGTALMLFRS----Y-PRVPFL----EQIEESV--PFYSPT----------- --------------------GRLQAYNDEPGVIEYGENLIVQREGPEGTPYL--PNVIIS- -SSPFIR---PEDYGIPENHMG---WDERQVRNIKLPWKEAKDTKNPLWEAGYRFFCLTPK -SRHLTHSSWQVTDWNFIWSTSFGDPYRMDRRQPGVGENQVQMNPEAAKDLGFNEGDYVYV -DANPADRPYIGWKPSDPFYKVARLMLRVKYNPSYPYDVVMIKHGAWCATEKSVKGHETRK -DGRAVSAD-TGYQASYRYGSHQSIT---RGWLMPMHQLDSLFHKKKVFMGFMLGGEADNH -AIN-TVPKETLVKLTKAE-DGGLGGRGVW---APATTGFSVGN--ENKFMQSYLQGT-VK -VKRG ->WP_042250442|Nitrospina_gracilis -----------------------------------------------MRLNRRKFLQVSAG -VASAMA--------LSSKRVG---AQLKP--VVK-VGNPLESYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKIRDLYGNQAD -AAWNPRMCLRGMTFPRRVYGPYRNKYPMLRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRMTWDDTFTYLAKGHVAVGKAYSGQRGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVVGKYGIYRLAN-MVGLLDAIIRGRGP -GQVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVTVCPEYNPPSTKADYWIPCRAGASDISIFLGCAKIIMDEGLV----D -------VDYVKDYTDMPLLVRTDNLIRLHPDDYIPG---YK---------NQPLPKD--- ----------------GFTTKWMKNFNRDKM---------PDFVVWDTNTDK--PVAVT-- --------REDIGAKMRKKNI------D---------------------PALDGVY----- -------------------------------------DIKLV-SGKTITVMPLYEM----- ----YKIHLKD-YDLDSVN-----------------------------QISHAPKDLVVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------SMVAE-----DPFNPVLDISKNVDWANVKG -YLK------GEEVGYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---SKLIWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYADFVLAANSWAEFESYEITSACSN-PFHQI----WGGTGIKPVF -DTIDDNLIHREFAKRLSQVT---------------------------------------- ----------------GDKRF--ADYVK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTAGMGYNIDDII-NGK ------YGEPGACLLLYRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEWGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYVYV -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTAMMKHSCWTSTERSVKAHEERP -DGRALSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKSKMKFMFGYEADNH -AIN-ATPKETLVKFSKAE-DGGMHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQY-- ----- ->WP_042251421|Nitrospina_gracilis -----------------------------------------------MRLNRRKFLQVSAG -VASAMA--------LSSKRVG---AQLKP--VVK-VGNPLESYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTFPRRVYGPYRNKYPMLRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRVTWDETFTYLAKGHVAIGKAYSGSRGAQRL-KNEG -YQPEMIEAM------GGSGSRSMKYRGGMGLLGVVGKYGIYRLAN-MMGLLDAIIRGRGP -GQVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVTVAPEYNPPATKADYWIPTRAGLADISIFLGVAKILMDEGLV----D -------GEYVKEYTDMPLLVRTDNLIRLHPEDYIPG---YK---------NQPLPKD--- ----------------GFTTKWMKNYDRDKM---------PDFVVWDTNTDK--PVALT-- --------REDIGAKMRRKNI------D---------------------PALDGVY----- -------------------------------------DIKLV-SGKTITVMPLYEM----- ----YKIHLKD-YDLDTVN-----------------------------QICHAPKDLVVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASFVPLMLTGNVGPKGS-G ---SHTWSGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPVLDVTKNVGWENIKA -YAK------GEEPGYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLLWFVNVN-VINNAKWFYE----------------MVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAANSWAEFESYEITSACSN-PFHQI----WGGTGIKPVF -DTIDDNLIHREFAKRLSQIT---------------------------------------- ----------------GDKRF--ADYMK--------------------------VYEG--- ----------------------------EAPNRTKAQIRRLFTTSTSGMGYNIDDII-NGK ------YGEPGCCLLLYRT----Y-PRSPFW----EMYTESK--PFYTAH----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYVYV -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTSMMKHSAWQSTERSVKAHEERP -DGRALSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKSKTKMKFVHGYEADNH -AIN-ATPKETLVKFSKAE-DGGMHGKGLW---EPARTGYTPESPLKDRFAEMYLAGQY-- ----- ->MBL09191|Acidiferrobacteraceae_bacterium -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LSSKKVG---AQLKP--VVK-VGNPLESYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVKDLYGNQAD -AAWNPRMCLRGMTFPRRAYGPYRNRYPMIRVGWKQ----------WAD----------DG -FPYLD-KANREKYKMTSRGTDEFVRMSWDDTFTYLSKGHIAVGRAYSGPRGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-MVALLDSIIRGRGP -GQVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDISVFLGCAKIIMDEGLV----D -------IEYVKDYTDMPLLVRTDNLKRLHADDFIPG---YK---------AQALPKD--- ----------------GFTTKWMKNFSRDQM---------PDFAVWDANTNK--PVAVT-- --------REDIGAKMRKKNI------D---------------------PVLDGVF----- -------------------------------------DVKLT-NGKTITVMPLYEM----- ----YKIHLKD-YDLDTVN-----------------------------QISHAPKDLVVRV -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPILDPAQNTDWKNVKG -YLK------GEEVSYW-----AH---------------RDEALIVNTP-----RYGRKVF -TGRSHMPTP---TKLFWFVNVN-VINNAKWFYE----------------LVFNTD--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFARRMSEVT---------------------------------------- ----------------GDKRF--GEFMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLMLFRT----Y-PRSPFW----EMFTESK--PYYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPYMGWKPSDPRYKVGRLMLRAKYNPAYPYHTTMMKHATWIGTERTVKAHEERP -XGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKFGYEADNH -AVN-ATPXEXLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYVR -VKI- ->TDJ60388|Nitrospina_sp -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LSSKRVG---AQLKP--VVK-VGNPLDSYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVKDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRLSWDQTYTYLAKGHIAVAKAYSGARGAQRL-KNEG -YQPEMIEAM------SGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-MMALLDSIIRGRGP -GQVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVTVAPEYNPPATKADYWIPVRAGLSDISVFLGAAKIIMDEGLV----D -------VPFVKEYTDMPLLVRTDTLVRLHPDDYIPG---YK---------VQALPKD--- ----------------GFTTKWLKNFNRSKM---------PDYTVWDTNTNK--PVAIT-- --------REDIGAKMLKKKI------D---------------------PALDGVY----- -------------------------------------DIKLV-SGKTITVMPMYEM----- ----YKIHLKD-YDLDTVN-----------------------------QISHAPKDLIIRL -SRDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---AHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFHIILDPAKNVDWKNVKG -YLK------GEEISYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLMWYVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIIAQDIEFTGSCEYSDIILAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLMHREFGKRMAQIT---------------------------------------- ----------------GDKRF--ADFMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRTPFW----EMYTESK--PYYTPN----------- --------------------GRLQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEEEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPYMGWKPSDPRYKVGRLMLRAKYNPAYPYHTTMMKHATWIGTERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-ATPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYTR -VKI- ->MSP_nxrA ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------MPLYEM----- ----YKIHLKD-YDLETVN-----------------------------QISHAPKDLVVRL -ARDM-----------GTIKPVEIHYGEGINHYFHAT-MHNRASFVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPEMDPAKNTTWAQIKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPVF -DTIDDNLIHREFAKRMAEVT---------------------------------------- ----------------GDKRF--ADYVK--------------------------VYEG--- ----------------------------EAPNRTKAQIRRLFTTGTTGMGYNIDDII-NGK ------YGEPGCCLMLFRT----Y-PRSPFW----EMFTESK--PYYTPH----------- --------------------GRLQFYNDEPEAIEWGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYVYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWTGTERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKSKMKFMHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->PIQ99248|_Nitrospinae_bacterium_CG11_big_fil_rev_8_21_14_0_20_45_15 -------------------------------------------------------MQVSAG -VATAMA--------LTSKKVG---AQLKP--VVK-VGNPLEAYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTFPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRMTWDQTFTYLAKGHVAVGKAYSGARGAQRL-KNEG -YQPEMIEAM------GGSGSRVMKYRGGMGLLGVVGKYGIYRLAN-MVALLDAIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDIALFLGCAKIIMDEGLV----D -------VNFVKEYTDMPLLVRTDTLMRLHPDDFIPG---YR---------NQDLPKD--- ----------------GFTTKWMKNFNRDKM---------PDFVVWDANTDK--PVAIT-- --------REDIGSKMKKKNI------D---------------------PVLDGVF----- -------------------------------------DIKLV-SGKTIPVMPLYEM----- ----YKVHLKD-YDIDTTN-----------------------------QICHAPKDLIVRL -ARDI-----------GTIMPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPVMDIAKNTDWANVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRSHMPCP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNCWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHRQFARRLAEVT---------------------------------------- ----------------GDKRF--SDYMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRSPFW----EMYTESK--PYYTPN----------- --------------------GRIQFYNDEPEAIEWGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWASTERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKSKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->Nitromaritima_KMP11423|SCGC_AAA799_A02 -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LTGKKVG---AQLKP--VVK-VGNPLDTYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKMTSRGTDEFVRLSWDQTFTYLAKGHVAVGKAYSGARGAQRL-KNEG -YQPEMIEAM------GGSGPRTMKYRGGMGLLGVVGKYGVYRLAN-QVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKMTIQWGKNLIENKMPEAH -WYTEIMERGGTLVAIAPEYNPPATKADYWVPVRAGLSDIALFLGVNKIIMEEGLV----D -------VDYVKDYTDMPLLVRTDNLIRLHPDDFIPG---YK---------AQQLPKD--- ----------------GFTTKWMKNYNRNQM---------PDFTVWDTNTNK--PVAIN-- --------REDIGAKMRKKNI------D---------------------PALDGVY----- -------------------------------------DVKLV-NGKTITVMPLYEM----- ----HKIHYKD-YDIDTVN-----------------------------QISHAPKDLIIRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASFTPLMLTGNVGPKGS-G ---SMTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----TPFDTELDPAKNIDWNRVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHRQFSRRLAEVT---------------------------------------- ----------------GDKRF--ADHMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRTPFW----EMYTESK--PFYTPN----------- --------------------GRTQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPFMGWKPSDPRYKVGRLMLRAKYNPAYPYHTTMMKHATWTATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYVR -VKI- ->cas150m-4_02474|CAS-150m-4914Perchloratereductasesubunitalphaprecursor ---------------------------------------------------------MSAG -VATAMA--------LSSKKVG---AQLKP--VVK-VGNPLDSYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRMTWDQTFTYLAKGHVAVGKAYSGVRGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVIGKYGVYRLAN-QVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDISIFLGVAKIIMDEGLV----D -------IDYVKDYTDMPLLVRTDNLIRLHPEDFIPG---YK---------VQPLPKD--- ----------------GFTTKWMKNFNRDKM---------PDFTVWDINTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVY----- -------------------------------------DIKLV-NGKTITVMPLYEM----- ----YKVHLKD-YDIDTVN-----------------------------QISHAPKDLILRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNTVLDASKNIDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHRQFSRRLAEVT---------------------------------------- ----------------GDKRF--ADHMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGACLLLFRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEFGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYVYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWTGTERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKSKMKFLHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->GCA_002705185_00880|PAJA01000060unannotatedprotein ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------------------------MTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDIALFLGVAKIIMDEGLV----D -------VDFVKDYTDMPLLVRTDTLVRLHPDDFIPG---YK---------AQALPKD--- ----------------GFTTKWMKNFNRDMM---------PDFTVWDTNTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVF----- -------------------------------------DIKLV-SGKTITAMPLYEM----- ----YKVHLKD-YDVDTTN-----------------------------QICHAPKDLIVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNTILDASKNVDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFSRRLAEVT---------------------------------------- ----------------GDKRF--ADHMK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRSPFW----EMYTESK--PYYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPXIR---PDXYGIPEDEQD---PDLRHVRNIKXPWSAVRTTXNFLWXXGXRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIXC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->MAX17737|Nitrospina_sp ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------------------------MTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDIALFLGVAKIIMDEGLV----D -------VDFVKDYTDMPLLVRTDTLVRLHPDDFIPG---YK---------AQALPKD--- ----------------GFTTKWMKNFNRDMM---------PDFTVWDTNTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVF----- -------------------------------------DIKLV-SGKTITAMPLYEM----- ----YKVHLKD-YDVDTTN-----------------------------QICHAPKDLIVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNTILDASKNVDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFSRRLAEVT---------------------------------------- ----------------GDKRF--ADHMK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRSPFW----EMYTESK--PYYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPXIR---PDXYGIPEDEQD---PDLRHVRNIKXPWSAVRTTXNFLWXXGXRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIXC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->GCA_001542995_01387|LFLA01000024unannotatedprotein -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LTSKRVG---AQLKP--VVK-VGNPLEAYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKMTSRGTDEFVRMTWDQTFTYLAKGHIAVAKAYSGARGAQRL-KNEG -YQPEMIEAM------SGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-QVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVAVAPEYNPPATKADYWIPVRAGLSDISLFLGVAKIIMDEGLV----D -------IDYVKDYTDMPLLVRTDTLIRLHPDDFIPG---YK---------AQSLPKD--- ----------------GFTTKWMKNFNRDMM---------PDYTVWDANTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PVLDGVF----- -------------------------------------DIKLV-SGKTITVMPLYEM----- ----YKVHLKD-YDIDTTN-----------------------------QICHAPKDLIVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNIVMDPSKNIDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLCWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFSRRMAEVT---------------------------------------- ----------------GDKRF--MDHMK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGACLLLFRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->GCA_002453875_01196|DKHT01000003unannotatedprotein -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LTSRRVG---AQLKP--VVK-VGNPLEAYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKMTSRGTDEFVRMTWDQTFTYLAKGHIAVAKAYSGARGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-MVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKMTIQWGKNLIENKMPEAH -WYTEIMERGGTLVAIAPEYNPPATKADYWVPVRAGLSDIALFLGCAKIIMDEGLV----D -------IDYVKDYTDMPLLVRTDTLIRLHPDDFIPG---YK---------AQSLPKD--- ----------------GFTTKWMKNFNRDMM---------PDYTVWDTNTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVF----- -------------------------------------DIKLV-NGKTITVMPLYEM----- ----YKIHLKD-YDLDTVN-----------------------------QICHAPKDLTLRL -ARDM-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPILDITKNVDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLCWYVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIILAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFGKRMAEVT---------------------------------------- ----------------GDKRF--SDFLK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLMLYRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINEGDYVYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-ATPKEVLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYVR -VKI- ->GCA_002454045_00625|DKID01000024unannotatedprotein -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LTSRRVG---AQLKP--VVK-VGNPLEAYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKMTSRGTDEFVRMTWDQTFTYLAKGHIAVAKAYSGARGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-MVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKMTIQWGKNLIENKMPEAH -WYTEIMERGGTLVAIAPEYNPPATKADYWVPVRAGLSDIALFLGCAKIIMDEGLV----D -------IDYVKDYTDMPLLVRTDTLIRLHPDDFIPG---YK---------AQSLPKD--- ----------------GFTTKWMKNFNRDMM---------PDYTVWDTNTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVF----- -------------------------------------DIKLV-NGKTITVMPLYEM----- ----YKIHLKD-YDLDTVN-----------------------------QICHAPKDLTLRL -ARDM-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPILDITKNVDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLCWYVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIILAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFGKRMAEVT---------------------------------------- ----------------GDKRF--SDFLK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLMLYRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINEGDYVYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-ATPKEVLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYVR -VKI- ->GBC85351|bacterium_sp_HR11 -----------------------------------------------MKLTRREFMQTTAA -GAAALV--------LDDALRG--LRLLQP--VVE-VGNPLAAYPNR------DW-EAVYR -DQYRY------DRSFTWVCS-PNCTHECRLRAFVRNGIVLRSEQNYDLHRISDLYGNKAT -AHWNPRGCLNGYTFQRRVYGPYRLKYPMIRRGWKQ----------WAD----------DG -FPELT-PENMAKYKFDSRGTDTFVRVSWDEAYTYVARGMIAIARRYSGEEGRRRL-LEQG -YPEEMLEHW------EGSGVRTFKLRGGMGLLGVIGKYGLYRFAN-MLALLDAHVRKVPP -EEAKGARIWSNYTWHGDQAPGQPFVHGLQTSDVDMNELRFARLHIQCGKNLVENKRPESH -FFIELMERGAKIVAIIPEYGPQATKADYWIPIRPA-TDAALWLGITRVMIDNGWY----D -------VDFLKKWSDMPLLIRTDTLRRLRAHEVFPG---YR---------GGLDPKG--- ---------------PSFQVQDLKPDQYEKI---------GDFVVFDEKSQS--LKPLT-- --------RDDVGGRLTAKGI------D---------------------PALSWRG----- -------------------------------------KVRLV-DGTEVECMTLWEA----- ----YKIHLQD-YDLDTVC-----------------------------EITHAPKELVLRL -ARDIWETTQEVRRQNPDMGAVAIHIGEGLNHWFHAT-EMNRAVYLPLILTGNIGKPGA-G ---CHTWAGNYKAALFQ-GSPWTGPGFL--------------------------------- -------------------------------GWIAE-----DPFHPLLDPKADGTQVKVKK -YTH------DEEPAYW-----NY---------------DDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKLMWFTNVN-LLNNAKWVYE----------------MIKNVN--PKV -ELIIAQDIEMTSSCEYADVILPANSWMEMETYEITASCSN-PFLQI----W-KGGIRPIF -DTKDDVLIMAELAKKLGEIL---------------------------------------- ----------------KDRRF--ADYWKF---A----------------------LER--- --------------------------------KTEVYIQRLLDTCTTTKGYRVEDIL-AGK ------YGEPGAALMLFRT----Y-PRVPFW----EQVHDDL--PFFTPT----------- --------------------GRLQAYNDEPEVIEYGENFIVHREGPEATPYL--PNVIVS- -SNPLIR---PEDYGIPLDHMG---RDERQVRNVKLPWSEVKKTKNPLWEKGYRFYCLTPK -TRHATHSSWQVTDWHLLYNNDFGDPYRLDKRSPGVGEAQLHMNPQAAKDLGINNGDYVYV -DANPADRPYVGWKPGDPFYRVARLMLRVKYNPAYPYHVVMMKHAAWIATEKSVRAHETRP -DGRALSED-TGYQASFRYGSQQSVT---VGWLMPMHQLDSLFHKAKAKVGFIFGGEADNH -AVN-TTPKETLVKVTKAE-DGGLGGKGVW---EPARTGYTAGD--EDDFMKRYLNGELVE -IVGE ->WP_099324707|Kuenenia_stuttgartiensis -----------------------------------------------MKLTRRAFLQVAGA -TGATLT--------LAKNAMA--FRLLKP--AVV-VDNPLDTYPDR------RW-ESVYR -DQYQY------DRTFTYCCS-PNDTHACRIRAFVRNNVMMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKR----------WAD----------DG -FPELT-PENKTKYMFDNRGNDELLRASWDEAFTYASKGIIHITKKYSGPEGAQKL-IDQG -YPKEMVDRM------QGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-CLAIVDAHNRGVGP -DQALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLLIQTGKNLIENKMPEAH -WVTEVMERGGKIVVITPEYSPSAQKADYWIPIRNN-TDTALFLGITKILIDNKWY----D -------ADYVKKFTDFPLLIRTDTLKRVSPKDIIPN---YK---------LQDISDG--- ---------------PSYHIQGLKDEQREII---------GDFVVWDAKSKG--PKAIT-- --------RDDVGETLVKKGI------D---------------------PVLEGSF----- -------------------------------------KLKTI-DGKEIEVMTLLEM----- ----YKIHLRD-YDIDSVV-----------------------------SMTNSPKDLIERL -AKDI-----------ATIKPVAIHYGEGVNHYFHAT-LMNRSYYLPVMLTGNVGYFGS-G ---SHTWAGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFKPNLDPYASAKDLNIKG -RAL------DEEVAYW-----NH---------------SERPLIVNTP-----KYGRKVF -TGKTHMPSP---TKVLWFTNVN-LINNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEITGSIEYADFAFPANSWVEFQEFEITNSCSN-PFIQI----WGKTGITPVY -ESKDDVKILAGMASKLGELL---------------------------------------- ----------------RDKRF--EDNWKF-------------------------AIEG--- --------------------------------RASVYINRLLDGSTTMKGYTCEDIL-NGK ------YGEPGVAMLLFRT----Y-PRHPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNAIVS- -TNPYIR---PDDYGIPENAEY---WEDRTVRNIKKSWEETKKTKNFLWEKGYHFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHIHPQAARDLGIEDGDYVYV -DANPADRPYEGWKPNDSFYKVSRLMLRAKYNPAYPYNCTMMKHSAWISSDKTVQAHETRP -DGRALSPS--GYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFIFGFEADNH -CIN-TVPKETLVKITKAE-NGGMGGKGVW---DPVKTGYTAGN--ENDFMKKFLNGELIK -VDA- ->NxrA_Candidatus_K_stuttgartiensis_CAJ72445 -----------------------------------------------MKLTRRAFLQVAGA -TGATLT--------LAKNAMA--FRLLKP--AVV-VDNPLDTYPDR------RW-ESVYR -DQYQY------DRTFTYCCS-PNDTHACRIRAFVRNNVMMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKR----------WAD----------DG -FPELT-PENKTKYMFDNRGNDELLRASWDEAFTYASKGIIHITKKYSGPEGAQKL-IDQG -YPKEMVDRM------QGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-CLAIVDAHNRGVGP -DQALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLLIQTGKNLIENKMPEAH -WVTEVMERGGKIVVITPEYSPSAQKADYWIPIRNN-TDTALFLGITKILIDNKWY----D -------ADYVKKFTDFPLLIRTDTLKRVSPKDIIPN---YK---------LQDISDG--- ---------------PSYHIQGLKDEQREII---------GDFVVWDAKSKG--PKAIT-- --------RDDVGETLVKKGI------D---------------------PVLEGSF----- -------------------------------------KLKTI-DGKEIEVMTLLEM----- ----YKIHLRD-YDIDSVV-----------------------------SMTNSPKDLIERL -AKDI-----------ATIKPVAIHYGEGVNHYFHAT-LMNRSYYLPVMLTGNVGYFGS-G ---SHTWAGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFKPNLDPYASAKDLNIKG -RAL------DEEVAYW-----NH---------------SERPLIVNTP-----KYGRKVF -TGKTHMPSP---TKVLWFTNVN-LINNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEITGSIEYADFAFPANSWVEFQEFEITNSCSN-PFIQI----WGKTGITPVY -ESKDDVKILAGMASKLGELL---------------------------------------- ----------------RDKRF--EDNWKF-------------------------AIEG--- --------------------------------RASVYINRLLDGSTTMKGYTCEDIL-NGK ------YGEPGVAMLLFRT----Y-PRHPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNAIVS- -TNPYIR---PDDYGIPENAEY---WEDRTVRNIKKSWEETKKTKNFLWEKGYHFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHIHPQAARDLGIEDGDYVYV -DANPADRPYEGWKPNDSFYKVSRLMLRAKYNPAYPYNCTMMKHSAWISSDKTVQAHETRP -DGRALS-P-SGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFIFGFEADNH -CIN-TVPKETLVKITKAE-NGGMGGKGVW---DPVKTGYTAGN--ENDFMKKFLNGELIK -VDA- ->OHB72803|Planctomycetes_bacterium_RBG_16_41_13 -----------------------------------------------MKLTRRAFLQVAGA -TGATLT--------LAKNAMA--FRLLKP--AVV-VDNPLDTYPDR------RW-ESVYR -DQYQY------DRTFTYCCS-PNDTHACRIRAFVRNNVMMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKR----------WAD----------DG -FPELT-PENKAKYMFDNRGNDELLRASWDEAFTYASKGILHITKKYSGPEGAQKL-IDQG -YPKEMVDRM------QGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-CLAIVDAHNRGVDP -DQALGGRNWTNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKIVVITPEYSPSSQKADYWIPIRNN-TDTALFLGITKILIDNKWY----D -------ADYVKKFTDFPLLVRTDTLKRVSPKDIIPN---YK---------LQDISEG--- ---------------PSYQIHGLKDEQREII---------GDFVVWDAKSKG--PKAIT-- --------RDDVGETLVKKGI------D---------------------PALEGSF----- -------------------------------------KLKTV-DGKEIEVMTLLEM----- ----YKIHLRD-YDIDSVV-----------------------------DMTNSPKDLIERL -AKDI-----------ATIKPVAIHYGEGVNHYFHAT-LMNRSYYLPVMLTGNVGYFGS-G ---SHTWAGNYKAANFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFKPNLDPYASAKDLNIKG -RAL------DEEVAYW-----NH---------------SERPLIVNTP-----KYGRKVF -TGKTHMPTP---TKIMWFTNVN-LINNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEITGSIEYADFAFPANSWVEFQEFEITTSCSN-PFIQI----WGKTGITPVY -ESKDDVKILAGMASKLGELL---------------------------------------- ----------------RDKRF--EDNWKF-------------------------AIEG--- --------------------------------RASVYINRLLDGSTTMKGYTCEDIL-NGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEVIEYGENFIVHREGPEATPYL--PNAIVS- -TNPYIR---PDDYGIPENAEH---WDDRTVRNIKKSWEETKKTKNFLWEKGYHFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHIHPQAARDLGIEDGDYVYV -DANPADRPYEGWKPNDAFYKVSRLMLRAKYNPAYPYNCTMMKHSAWISSDKTVQAHETRP -DGRALS-P-SGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -CIN-TVPKETLVKITKAE-NGGMGGKGVW---DPVKTGYTAGN--ENDFMKKFLNGELVK -VDA- ->WP_070066136|Brocadia_sapporoensis -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------IVNKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ERVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGSKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLLDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQGSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDVFSD---YK---------LEDISHG--- ---------------ASYKIQGLHDDQREII---------GDFVVWDAKTNG--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGIF----- -------------------------------------KVKTV-DGKEIEVMSLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIQRL -AHDI-----------AAIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYNGS-G ---SHTWAGNYKAANFQ-SAKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPSAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----RYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITNSCSN-PFVQI----W-KGGIRPVN -DSKDDVVIIAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIV-SGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTIRNIKKSWAETKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQVNINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYDVAMIKHSSWIATERTVKAHETRS -DGRALAAG-TGYQSSFRYGSQQSVT---RDWSMPMHQLDSLFHKSKIGMKFVFGFEGDNH -GIN-TVPKETLVKITKAE-DGGLGGKGLW---DPAKTGYTTGN--ENDFMKKYLSGELIK -IEKA ->RZV59451|Brocadia_sp_BROELEC01 -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------IANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ERVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLLDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQGSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDVFPD---YK---------LEDISHG--- ---------------ASYKIQGLHDDQREII---------GDFVVWDAKTNG--PKTIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGIF----- -------------------------------------KVKTV-DGKEIEVMSLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIQRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYSGS-G ---SHTWAGNYKAANFQ-SAKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPSAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----RYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEITGSIEYADFAFPANSWMEFETHEITNSCSN-PFVQI----W-KGGIRPVN -DSKDDVVIIAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIV-SGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQVNINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYDVAMIKHSSWIATERTVKAHETRS -DGRALAAG-TGYQSSFRYGSQQSVT---RDWSMPMHQLDSLFHKSKIGMKFVFGFEGDNH -GIN-TVPKETLVKITKAE-DGGLGGKGLW---DPAKTGYTTGN--ENDFMKKYLSGELIK -IEKA ->OHB44699|Planctomycetes_bacterium_GWE2_41_14 -----------------------------------------------MKLTRRTFLQIAGA -TGATFT--------IANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -DQYRY------DRTFTFVCS-PNDTHGCRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGALGIIGKYGMYRFNN-MLSLVDSHHRGVGA -DKALGGRNWSNYTWHGDQAPGHSFSHGLQASDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSSQKADYWIPIKCN-TDTALFLGVTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQPKDIFPD---YK---------LEDISHG--- ---------------ASYKIQGLHDDQREIV---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLVAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEVEVMPLFEM----- ----YKIHLRD-YDIDTVV-----------------------------EITNSPKELIQRL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LMNRSTYLPLMLTGNVGYNGS-G ---SHTWAGNYKAGNFQ-SAKWCGPGFY--------------------------------- -------------------------------GYVAE-----DAFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LINNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEVTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMVLAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYINRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGVPENAEH---WDERTIRNIKKSWSDTKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYGVTMIKHSSWIATERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKITKAE-DGGIGGKGVW---DPVKTGYTTGN--ENDFMKKYLNGELIK -VEKA ->WP_052562588|Brocadia_sinica -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------LANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGILHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKLHGLHDDQREII---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGTF----- -------------------------------------KVKTV-DGKEVEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIIRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYMGS-G ---SHTWAGNYKAGNFQ-SAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPDAPAMDLKIKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSNDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRAKYNSSYPYGVTMIKHSSWIATERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTTGN--ENDFMTKYLNGELIK -VEKA ->OOP57237|Brocadia_caroliniensis -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------VANKAMA--FRLLKP--AVE-VGNPLDAYPDR------TW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGSKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGLGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKIHGLHDDQREIL---------GDFVVWDAKTNG--PQPIT-- --------RDDVGDKLTAKGI------D---------------------PVLDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDVDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYMGS-G ---SHTWAGNYKAGNFQ-SAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFYQI----W-KGGIRPVN -DSKDDVMVIAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYINRLLDGSTTAKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGVPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYDVTMIKHSSWIATEKSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKVTKAE-DGGIGGKGLW---DPAKTGYTTGN--ENDFMKKYLNGELIK -VEKS ->RIK02127|Brocadia_sp -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------VANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDENLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDITHG--- ---------------PSYKLHGLHDDQREII---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLTAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDVDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYKGS-G ---SHTWAGNYKAGNFQ-AAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPSLDPTAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKVMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMVLAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYEVTMIKHSSWISTEKTVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKVCKAE-DGGIGGKGLW---DPAKTGYTTGN--ENDFMKKYLGGELIK -VEKA ->KKO18748|Brocadia_fulgida -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------VANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDENLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDITHG--- ---------------PSYKLHGLHDDQREII---------GDFVVWDAKTKG--PKPIT-- --------RDDVGDKLTAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDVDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYKGS-G ---SHTWAGNYKAGNFQ-AAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPTAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKVMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMVLAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYEVTMIKHSSWISTEKTVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKVCKAE-DGGIGGKGLW---DPAKTGYTTGN--ENDFMKKYLGGELIK -VEKA ->OQZ00558|Brocadia_sp_UTAMX2 -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------VANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDENLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDITHG--- ---------------PSYKLHGLHDDQREII---------GDFVVWDAKTKG--PKPIT-- --------RDDVGDKLTAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDVDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYKGS-G ---SHTWAGNYKAGNFQ-AAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPTAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKVMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMVLAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYEVTMIKHSSWISTEKTVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKVCKAE-DGGVGGKGLW---DPAKTGYTTGN--ENDFMKKYLGGELIK -VEKA ->TLD40744|Candidatus_Jettenia_ecosi ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------MLRCKYNPAYPYGVTMMKHSAWISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RNWSMPMHQLDSLFHKSKTSMKFIFGYEADNH -GIN-TTPKETLVKITKAE-DGGLGGKGLW---DPAKTGYTAGN--ENDFMKKYLSGELIK -VEKA ->TLD41279|Candidatus_Jettenia_ecosi ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------------------------MKHSACISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMKKYLSGELVK -MEKA ->WP_007220240|Jettenia_caeni -----------------------------------------------MKLTRRTFLQVTGA -TGATFT--------LANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -EQYRY------DRTFTYCCS-PNDTHACRVRAFVRNEVLMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGARKL-LDQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-SLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLVIQTGKNLIENKMPEAH -WLTQVFERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITRILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKIHGLHDDQREII---------GDFVVWDAKTKS--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LMNRSTYLPLMLTGNIGYPGS-G ---SHTWAGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPDAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSNDIEMTGSIEYADFAFPANSWAEFETHEITTSCSN-PFIQI----W-KGGIKPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDMRF--HDVWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTTKGYSFVDII-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQGYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPEDAEH---WDERTVRNIKKSWAETKKTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHMNPEAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMKKYLSGELIK -VEKA ->WP_007222969|Jettenia_caeni -----------------------------------------------MKLTRRTFLQVTGA -TGATFT--------LANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -EQYRY------DRTFTYCCS-PNDTHACRVRAFVRNEVLMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGARKL-LDQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-SLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLVIQTGKNLIENKMPEAH -WLTQVFERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITRILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKIHGLHDDQREII---------GDFVVWDAKTKS--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYPGS-G ---SHTWSGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPDAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSNDIEMTGSIEYADFAFPANSWAEFETHEITTSCSN-PFIQI----W-KGGIKPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDMRF--HDVWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTTKGYSFVDII-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQGYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPEDAEH---WDERTVRNIKKSWAETKKTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHMNPEAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RNWSMPMHQLDNLFHKSKTSMKFVFGYEADNH -GIN-TTPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMKKYLNGELIK -VEKA ->NxrA_planctomycete_KSU_1_ZP_10101005 -----------------------------------------------MKLTRRTFLQVTGA -TGATFT--------LANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -EQYRY------DRTFTYCCS-PNDTHACRVRAFVRNEVLMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGARKL-LDQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-SLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLVIQTGKNLIENKMPEAH -WLTQVFERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITRILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKIHGLHDDQREII---------GDFVVWDAKTKS--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYPGS-G ---SHTWSGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPDAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSNDIEMTGSIEYADFAFPANSWAEFETHEITTSCSN-PFIQI----W-KGGIKPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDMRF--HDVWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTTKGYSFVDII-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQGYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPEDAEH---WDERTVRNIKKSWAETKKTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHMNPEAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RNWSMPMHQLDNLFHKSKTSMKFVFGYEADNH -GIN-TTPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMKKYLNGELIK -VEKA ->WP_052561322|Brocadia_sinica -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------LTSKAMA--FRLLKP--AVE-VGNPLDVYPDR------AW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITRKYSGEEGAKKL-IGQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-TLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRADTLKRLQAKDIFPD---YK---------PEDISHG--- ---------------PSYKIHGLHDDQREMI---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGTF----- -------------------------------------EVKTV-GGKVIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPRELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNVGYKGS-G ---SHTWSGNYKAGNFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVSE-----DVFNPNLDPYAPATDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDLRF--RDYWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTLKGYTFEDIV-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNVIAS- -TNPYIR---PDDYGIPEGAEH---WDERTVRNIKKSWGEVKLTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHESRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TTPKETLVKITKAE-DGGMGGKGLW---EPAKTGYTPGN--ENDFMRRYLNGELIK -IEKE ->KXK29028|Brocadia_sinica -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------LTSKAMA--FRLLKP--AVE-VGNPLDVYPDR------AW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWIYAAKGIIHITRKYSGEEGAKKL-IGQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-TLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------PEDISHG--- ---------------PSYKIHGLHDDQREMI---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGTF----- -------------------------------------EVKTV-GGKVIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPRELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNVGYKGS-G ---SHTWSGNYKAGNFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVSE-----DVFNPNLDPYAPATDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDLRF--RDYWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTLKGYTFEDIV-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNVIAS- -TNPYIR---PDDYGIPEGAEH---WDERTVRNIKKSWGEVKLTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHESRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TTPKETLVKITKAE-DGGMGGKGLW---EPAKTGYTPGN--ENDFMRRYLNGELIK -IEKE ->OOP55454|Brocadia_caroliniensis -----------------------------------------------MKLTRRTFLQVAGA -TGATFS--------LADKTMA--FRLLKP--AVE-VGNPLDAYPDR------TW-ESVYR -DQYRY------DRSFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGFTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-TLALVDSHNRGLGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGLTRILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISQG--- ---------------PSFKMHGLHDDQRETI---------GDFVVWDAKTNG--PSPIT-- --------RDDVGDKLTAKGI------D---------------------PVLDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPRELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYKGS-G ---SHTWSGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPYAPATDLKVRG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKVMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEVTGSIEYADFAFPANSWAEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DSRDDVMILAGMAAKLGDLL---------------------------------------- ----------------RDMRF--RDYWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTLKGYTFDAIV-NGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATPYL--PNVIAS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAEVKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHINPQAAMDMGINDGDYVYV -DANPADRPYEGWKPSDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHESRP -DGRALSAD-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFIFGYEADNH -GIN-TTPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMRRYLSGELIK -IEKA ->KKO18624|Brocadia_fulgida -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------LADKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVLMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRRGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDEAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-TLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSAQKADYWIPVRCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDVFLN---YQ---------LEDISQG--- ---------------ASFKIHGLHDDQREII---------GDFVVWDTKTNS--PKPIT-- --------RDDVGDKLVGKGI------D---------------------PALDGTF----- -------------------------------------MVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNVGYKGS-G ---SHTWSGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEVTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DTKDDVMILAGMATKLGELL---------------------------------------- ----------------RDMRF--RDYWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIV-NGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRMQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDNYGIPESAEH---WDERTVRNIKKSWSDTKQTRNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRAKYNPSYPYGVTMMKHSAWISTERSVKAHESRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFIFGYEADNH -GIN-TTPKETLVKITKAE-DGGMGGKGVW---DPAKTGYTAGN--ENDFMKRYLNGELIK -IEKA ->WP_070067449|Brocadia_sapporoensis ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------------RGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGITKILMDEKLY----D -------ADYVKKFTDFPMLVRTDTLKRLQAKDIFPN---YQ---------LEDISQG--- ---------------VSYKIHGLHDDQREII---------GDFVVWDTKTNG--PKAIT-- --------RDDVGDKLVAKDI------D---------------------PALDGIF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYKGS-G ---SHTWSGNYKAANFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLRNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DTKDDVAILAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIM-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNVIVS- -TNPHIR---PDDYGIPENAEH---WDERTVRNIKKSWSDTKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQVNINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRAKYNSSYPYGVTMMKHSAWISTEKSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TVPKETLVKITKAE-DGGMGGKGLW---DPAKTGYTTGN--ENDFMKKYLNGELIK -IEKA ->RZV56287|Brocadia_sp_BROELEC01 -----------------------------------------------MKLTRRTFLQVTGA -AGATFT--------IANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRAFKGRGGMGLLGVIGKYGMYRFNN-MLSLLDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGITRILMDEKLY----D -------ADYVKKFTDFPMLVRTDTLKRLQAKDIFPN---YQ---------LEDISQG--- ---------------VSYKIHGLHDDQREII---------GDFVVWDTKTKG--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PALDGIF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYKGS-G ---SHTWSGNYKAANFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DTKDDVAILAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIM-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATPYL--PNVIVS- -TNPHIR---PDDYGIPESAEH---WDERTIRNIKKSWSDTKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQVNINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRAKYNSSYPYGVTMMKHSAWISTEKSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TVPKETLVKITKAE-DGGMGGKGLW---DPAKTGYTTGN--ENDFMKKYLNGELIK -IEKA ->OQZ04816|Brocadia_sp_UTAMX1 -----------------------------------------------MKLTRRTFLQVTGA -AGATFT--------IANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRAFKGRGGMGLLGVIGKYGMYRFNN-MLSLLDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLVENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGITKILMDEKLY----D -------ADYVKKFTDFPMLVRTDTLKRLQAKDIFPN---YQ---------LEDISQG--- ---------------VSYKIHGLHDDQREII---------GDFVVWDTKTKG--PKAIT-- --------RDDVGDKLVVKGI------D---------------------PALDGIF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYKGS-G ---SHTWSGNYKAANFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DTKDDVAILAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIM-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATPYL--PNVIVS- -TNPHIR---PDDYGIPENAEH---WDERTVRNIKKSWSDTKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRVKYNSSYPYGVTMMKHSAWISTEKSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TVPKETLVKITKAE-DGGMGGKGLW---DPAKTGYTTGN--ENDFMKKYLNGELIK -IEKA ->KRT68888|NC10_bacterium_CSP1_5 -----------------------------------------------MEITRRTFLKAAAT -GATAF---------LADDAWA--LRLLQP--AVE-VGNPLSEYPDR------GW-ERIYR -DQYGY------DRTFTFVCS-PNDTHACRLRAYVRNGVVMRIEQNYDVSRYADLYGNKAT -PHWNPRGCLKGYTLHRRVYGPYRVKYPLVRKGWKR----------WAD----------DG -FPDLT-PANKTKYRFDSRGTDELMRISWDDAYSYIAKGMIQIARRYSGEEGVRRL-REQG -YPEEMIRET------HGAGTRTFKCRGGMGLLGVIGKYGMYRFAN-TLALLDVHVRGVGP -DQALGGRTWSNYTWHGDQAPGHPYSHGLQGSDVDLNDFRFSKLHIQCGKNLIENKMPESH -FFNELMERGAKIVVITPEYSPPAAKADYWIPIRPN-TDTALFLGLTKILMEERHY----D -------AAFVKRFTDFPLLVRTDTLKRLRAHEVFPG---YR----------GRLPEN--- --------------GPSFTIQGLTKEQYEKL---------GDFVVFDAKSQS--LKPLT-- --------REDVGDRLAQQGT------D---------------------PTLDWQG----- -------------------------------------KVKLA-DGTEVEAMTLWAM----- ----YTIHLKD-YDLDTVH-----------------------------EITHSPKELIQRL -ARDI-----------ATIKPVAIHIGEGINHWFHAT-LSNRAFYLPLMLTGNIGVPGA-G ---SHTWAGNYKAALFQ-GSSWSGPGFK--------------------------------- -------------------------------GWVAE-----DPFNPNLDPNAPGQAVKVKG -YTK------DEEPAYW-----NH---------------GDLPLIVNTP-----KYGRKVF -TGLTHMPTP---TKVMFFNNVN-LINNAKHVYE----------------MLKNVN--PRV -EMIISVDIEMTASIEYADFALPANSWMEFQTPEITASCSN-PFLQI----W-KGGIKPLY -DSKDDVTILAELAQKLGAIV---------------------------------------- ----------------NDHRF--AAYWRF-------------------------ALEG--- --------------------------------RPEVYIQKLLDTSSTTAGYRVDEIM-AGK ------YGEPGACLMLFRT----Y-PRVPFW----EQVHDSD--PFYTDT----------- --------------------GRLHAYCDIPEAIEYGENFIVQREGPEATPYL--PNVIVS- -TNPYIR---PEDYGISPDAMH---WDERTVRNIKMAWADAKRTTNPLWEKGYRFFFLTPK -TRHRVHSQWSVCDWNQIWDSNFGDPYRMDKRMPGVGDHQLHMNPQAAKDLGINDGDYVYL -DANPADRPYIGWKPSDPFYRVSRCMVRVRYNPAYPYQVVMMKHAPYIATERTVKAHETRP -DGLALSE--TGYQANLRYGSQQSLT---RNWHMPMHQTDTLFHKAKATMSFLFGGEADNH -ALN-TVPKETLVKVTKAE-DGGMRGKGIW---EPARTGFTPGN--ESDFMKRYLAGEIVQ -IKKR ->OGW90704|PVC_group_Omnitrophica_bacterium_RIFCSPHIGHO2_02_FULL_63_14 ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------MIWDSNFGDPYRMDKRTPWVGENQLHINPQAGKALGINDGDYVYV -DANPADRPYIGAKPEDPFYKVARLMLRAKYNSAYPYHIVMMKHAPNIATERSVKAHETRP -DKRALS-E-LGYQSNFRYGSQQSIT---RNWHMPMHQTDSLFHKAKVFMGFLFGGEADNH -AVN-TVPKETLVRVTKAE-DGGLGGKGVW---APATTGYTPGA--ESEAMRKYIDGGFVS -T--- ->OGW87506|PVC_group_Omnitrophica_bacterium_RIFCSPLOWO2_01_FULL_45_10b -----------------------------------------------MNESRRDFLKISAV -TAVTLA--------LSNKPFL--LWALEP--VAN-VENPLAYYPNR------DW-EKIYR -DQYRY------DRTFSWVCS-PNDTHACRALAYVRNGIIIRSGSEYNYETYGDLYGNKAT -QNWNPRQCAKGFTFHRLMYGPYRLKYPLVRRGWRE----------WAD----------AG -FPDLT-PENKTKYKFDSRGTDQLEKATWDEAYTYIANGIMSIAKRYSGVEGKRKL-LAEG -YPEEMLAPM------KGAGTRTMKFRGGMGLLGVFGKYGMYRLAN-TMALLDVNIRGVSE -EGAMGGRAWSNYTWHGDQAPGHPWVHGLQNADCDFNDLRFSKLIIQDGKNLVENKLTDSH -WFIECMERGAKLVTISPEYSPPASKSDYWIPIRPQ-TDAALFLGITRLMIDQGWY----D -------KEFVAQFTDFPLLVRTDNLKRLRAADIFPD---YK---------LGLSKNG--- ---------------PSFKYQGLKQEQYEKL---------GDFVVWDETKGA--PVAIT-- --------RDDVGKNLSKKGI------N---------------------PALEGSY----- -------------------------------------KVKTV-DGKEIEVTTLFSL----- ----YKIHLRD-YDLDSVV-----------------------------EITKAPKDLIEQL -AKDI-----------AAIKPVAIHQGEGINHWFHAT-EMNRAAYLPLMLTGNIGQKGA-G ---AFGWAGNYKAALFQ-GSAWTGPGFK--------------------------------- -------------------------------GWVAE-----DPFHPNLDPQTPGKAINAHA -YFR------DEEPAYW-----NH---------------GDRALIVDTP-----AEGKKVF -TGSTHMPTP---TKAMLFTNVN-LINNAKHTYD----------------MLKNVN--PNV -EMILSIDIQMTASIEYADIALPANTWMESEGLEVTASCSN-PFLQI----W-KGGIPPIF -DSKDDLVILSEIAAKLGDLT---------------------------------------- ----------------GDARF--RDYWKF-------------------------ALEG--- --------------------------------KREVYIQRLLDSSTTTTGYKLDDIM-KGK ------YGPPGGALMLFRT----Y-PRIPFW----EQVHEDQ--PFYTDH----------- --------------------GRLQAYTDVPEAIEYGENFIVHREGPEATPYL--PNVIVS- -SNPYIR---PKDYGIPLDAEH---WDERTIRNVKLPWSEVKNTKNFLWEKGFQFFCLTPK -SRHRVHSLWSNVDWHQIWDSNFGDPYRMDKRTPGVGEQQIHLNPQAAKDLGINDGDYVYV -DANPADRPYRGAKPGDPFYKVARLMLRAKYNSAYPYHVAMMKHGTYIATEKSVKAHETRA -DKRALSEG-GAYQANFRYGSQQSVT---RNWHMPMHQTDTLFHKAKVFMSFIFGGEADNH -AVN-TVPKETLVRISKAE-DGGLGGKGLW---EPVKTGYTPAH--ENDVMKQYLHGGFIK -T--- ->KRT77589|Armatimonadetes_bacterium_CSP1_3 ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------MDFNELRHARLHIQVGKNLIENKMPESH -FFNELMERGAKIAVITPEYSPPAAKADYWMPIRPQ-TDAALFLGITRLMMDRRWY----D -------EAFVKQFTDFPLLIRKDTLKRLRAAEVFPG---YK----------PGLDPD--- --------------GPSFKRHNLKLDQYEKL---------GDFVVFDRKTRK--LQAIT-- --------RDQVGERLAQAGL------D---------------------PDLRWRG----- -------------------------------------KVKLI-DGREVECLTLWEA----- ----HRDHLRD-YDLDTVA-----------------------------EITQTPRAMIERL -ARDI-----------ATIKPVSIHIGEGINHWFHAT-LANRAFYLPLMLTGNIGKPGA-G ---CHTWAGNYKAGIFQ-GSPWTGPGIT--------------------------------- -------------------------------GWLFE-----DPFHAALDPATSGTEIKVKK -YLK------DEEPAYW-----DH---------------GDVPLIVNTP-----KAGRRVF -TGTTHMPTP---TKVMWYNNVN-IINNAKWAYG----------------VIKHVN--PNV -ELIINQDIEMTASAEYADIILPANSWVEFETPELTASCSN-PFLQI----W-KGGIKPLF -DTKDDGVIIAEVAAQLTAQT---------------------------------------- ----------------GDRRF--RDYFKY-------------------------LLER--- --------------------------------RPEVYIQRILDSSTSTVGYRVADVV-NGK ------YGEPGAALMLFRT----Y-PRIPFY----EQVHDSE--PFYTDT----------- --------------------GRLNSYCDIPEAIEYGENFIVHREGPEATPYL--PNVIVT- -TNPLVR---PEDYGIPLDALH---WDQRTVRNVKLAWRDVKKTKNPLWEQGYRFYLLTPK -TRHRVHSSWSTVDWNMIWDSNFGDPYRLDKRAPGVGEHQLHIHPQAARDLGINDGDYVYV -DAYAADRPYIGWKPSDPFYRVARCMVRVRFNPAYPYSVLMMKHAPFMATEKSVRAHETRP -DKLARSAD-TGYQANLRYGSQQSVT---RDWLMPMHQTDTLFHKSKGTMAFIFGGEADNH -AVN-TVPKETLVKITKAE-DGGIGGKGLW---EPARTGFSPGR--EGDFMKRYLAGTLVK -VTKR ->OUC07869|Chloroflexi_Litorilinea_aerophila ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------EITASCSN-PFLQI----W-KGGIPPLY -NTRDDARILAEVSAALADEI---------------------------------------- ----------------GEPRL--RDYWRF-------------------------ILEG--- --------------------------------RPEIYIQRLLDSSLTTSGYRVEDII-AGK ------YGEPGAALMLFRT----Y-PRIPFW----EQIHDSV--PFYTDT----------- --------------------GRLNSYCDIPEAIEYGENIISHREGPEATPYL--PNVIVT- -RSRFVR---PEDYGIPADHMG---WEERTVRNIALPWNQVKETKNPLWAQGFHFYCLTPK -TRHRVHSSWSTVDWTIILDSNFGDPYRADKRLPGPGDHQLHMNPQAAKDLGIEDGDYVYV -DANPADRPYIGWKPDDPFYKVARLMLRVKYNPAYPYHIVMLKHGPFMATEKSVKAHETRP -DGLAKSEG-TGYMANLRYGSQQSVT---RDWSMPMHQTDTLFHKQKTGMQFIFGGEADNH -ALN-TVPKETLVRIVKAE-DGGLDGKGPW---EPTKTGYTPAH--ENEFMLRYLAGETIE -VTT- ->RCK74665|Chloroflexi_Anaerolineae_bacterium ----------------------------------------------MSHLSRREFLKLSSV -AALGTV--------INDLD----WKLLDP---IQ-VDNPLAAYPSR------DW-EAVYR -NQYRY------DSSFTFVCS-PNDTHACRLRAFVRNGIILRAEQNYDVERYSDLFGNTAT -AHWHPRGCKKGQTFHRRLYGPHRLKGPLMRKGWKE----------WAD----------AG -FPELD-EENKTKYKFNARGQDELLPVSWETAYDYIARGMIAIARRYSGEEGARLL-RKQG -YPEEMIQAM------SGAGTRTFKCRGGMGLLGVIGKYGMYRFAN-MLALLDVHVRNVPP -EEAKGGRTWSNYTWHGDQAPGIPFVTGLQASDEDLNDLRNSRLHIQCGKNLVENKMAESH -FFIEAMERGAKIVTITPEYSPPATKSDYWIPIRPA-TDTALFLGLARWIIENQKY----D -------EQFVKRFTDFPTLVRADTLKRLRADEVFSN---YQ---------PGLDPQG--- ---------------ASFTLQGLKPEQYEKL---------GDYVVINEKTGR--PQAIT-- --------RDQVGEVMDKAGI------Q---------------------PLLDWKG----- -------------------------------------KLRLV-DGSEVEVLTVWSM----- ----YLEHLKD-YDLETVL-----------------------------EITHVPKDLFLRL -AEDI-----------TTLSPVALHIGEGINHWFHAT-LANRAQFLPLMLTGNIGKPGA-G ---LYTWAGNYKAALFQ-GSAQSGPGFK--------------------------------- -------------------------------GWVGE-----DPFAPNLDENASGKEIKVHA -YTK------DEEPAYW-----NH---------------SERPLIVDTP-----KYGRKVF -TGQTHMPTP---TKVQFFTNVN-LLNNAKHHYE----------------MIKNVN--PNV -ELIISVDIEMTSTVEYADFALAANTWAEFETYEITASCSN-PFLQI----W-KGGIPPLY -DSRDDARILGELAARLGELL---------------------------------------- ----------------EDNRF--RDYWKF-------------------------ILEG--- --------------------------------RPEVYIQRLLDSSITTSGYRFTDII-EGK ------YGEPGAALMLFRT----Y-PRIPFW----EQIHDSI--PFYTDT----------- --------------------GRMNTYCDIPEAIEYGENLISHRESPEATPYL--PNVIVT- -SSRFVR---PEDYGIPPDATG---WEERTVRNLKMPWSEVKNTRNFLWEAGYHFYCLTPK -TRHRVHSSWSTVDWTLILDSNFSDPYRVDRRQPGVGEHQLHINPQAAKDLGLEDGDYVYV -DANPADRPYIGWKAEDPFYRVARLMLRVKYNPAYPYHIVMLKHGPFMATEKSVLAHETRP -DGLARSAD-TGYQANLRYGSQQSIT---RDWSMPMHQTDSLFHKQKTAMQFIFGGEADNH -ALN-TVPKETLVRIVKAE-DGGIEGKGIW---EPAKSGYTPAH--ENEFMSLYLQGKTIE -IKR- ->GCA_001803565_00046|MHDQ01000004unannotatedprotein --------------------------------------------MSFDRVSRRQFLETLAA -TATAAL--------VSKPAIGLALEKLQP--IPE-IKNPLEHYPPR------EW-EKIYR -DIYNP------DSSYIFACT-PNDTHNCYLRAYIKNGIVTRIGPSQRYRDATDIYETKAS -ARWDPRICNKGVAMVGRFYGDRRVKYPTVRKGFKE----------WVE----------KG -FPRD--ENGQPPLKYFKRGEDQWEKVSWDEAYTIVAQSMIDTVKTYSGTKGAELL-QKQG -YDAKMIEKM------MGAGTQAMKFRGGMPLLGVIKLFGLYRMAN-SMALLDSYIRGVGP -DKAIGGIGFDNYSWHTDLPPGHPMVTGQQTIDFDLVNAEYANIILCWGMNWICTKMPDGH -WLSEARLKGAKVVTITTDYNSTSSKADEIVIIRPG-TDPAFALGLAQVIINERLY----D -------EEFVEGFTDLPFLVRMDTRELLRAHEIISG---YN---------NAELKYT--- -RVIKKEEKPPPPFATNLGMPAVSSDMRQEW---------GDFVVWDSNAKK--ATPVS-- --------RDDTGERFTNKGV------K---------------------PALEGEF----- -------------------------------------EISLT-NGEKIKVRPIFDI----- ----IKQHLEDTWNVDSTS-----------------------------KITWAPKEAIINL -AREI----------AANKEKVLFTVGMGPNQLFNAD-QKDRAIFLVAALTRNVGFFGG-N ---VGSYAGNYRAALFN--------GMP--------------------------------- -------------------------------QYIAE-----DPFNIILDPTKPA---KVKP -YFK------MQSAHFY-----AH---------------GDTPLKVHDI----------YF -NGETHMPTP---TKFFWFAASNSILGNSKGMYD----------------VVMNLLRNRKI -EAVVVNEWWWSASCEYADVVLPADSWGEYNVHDMTASVTN-PFVMV----MPLTGVSRIW -DTKSDSETYAGVSEKLGELT---------------------------------------- ----------------GDSRF--KDYWRF-------------------------IADG--- --------------------------------KAKPYLQRIIDHSNTMKGYQIDNLISKAK ------DGIP--ALLMSRT----Y-PKFIGY----DQSVESA--PWYNKT----------- --------------------GRLEFYREEPEFLDYGENLPVHREPVDATFYE--PNVIVAK -GHPLIKPKTPTDYGWPMDDLS---GETRQVRNVVYTPDELLNTKHPLRKEGFTHIYLTPK -FRHAVHTFGVDLDLLSIWFGPFGDMYRRDKRKPWVNEGYVEINPDDARELGIEDGDYIWV -DPDPKDRPFKGWQDKPADYKVARCLLRARYHPNLPKGITRTWFNMYQATHGSVRGHESRK -DGLARNPD-TNYQSMYRYGGHQSST---RSWLRPTLLTDTLVRKNLMGQMIGKGFEPDVH -CAN-GAPRESFVKFTRAE-DGGESGKGKW---RPAVLGFRTGY--ENVAMKKYIKGGFIS -KGGK ->SPS06998|Nitrotoga_fabula ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRLGFKA----------WCD----------AG -YPRTG-ANGFPDPKFLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGVKTMKFRSGMAALGVLRIYTLKRFAQ-GLALLDAYVRNVGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMAYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGAHIVDISIDYHATANKADDVIILRPG-TDPALGLGVCHYLIKHNYY----D -------EDYLRANTDMPLLVRTDNWKNLKASDIIPN---YE---------LAELTHH--L -KVMKPGEKPTQPVAFQ-ATAFVAEDVRKFW---------GDNVVWDLNTNK--AVPLT-- --------RDECGARYAAKGV------K---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTPENTS-----------------------------IMTGVPVEAIVDL -SNLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLAALTDNVGHVGGCS ---YGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QFLME-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPMRRVQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADFFKF-----------------VGTNPAGNPSDR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENITVYRTPIDSSHYE--PNVIVGH -CRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRIYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ENKQMRTYLQGAFTR -R--- ->SPS06751|Nitrotoga_fabula ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRLGFKA----------WCD----------AG -YPRTG-ANGFPDPKFLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGVKTMKFRSGMAALGVLRIYTLKRFAQ-GLALLDAYVRNVGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMAYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGAHIVDISIDYHATANKADDVIILRPG-TDPALGLGVCHYLIKHNYY----D -------EDYLRANTDMPLLVRTDNWKNLKASDIIPN---YE---------LAELTHH--L -KVMKPGEKPTQPVAFQ-ATAFVAEDVRKFW---------GDNVVWDLNTNK--AVPLT-- --------RDECGARYAAKGV------K---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTPENTS-----------------------------IMTGVPVEAIVDL -SNLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLAALTDNVGHVGGCS ---YGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QFLME-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPMRRVQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADFFKF-----------------VGTNPAGNPSDR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENITVYRTPIDSSHYE--PNVIVGH -CRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRIYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ENKQMRTYLQGAFTR -R--- ->RFC37636|Nitrotoga_sp_CP45 ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAD----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSMKRFAQ-GLALLDAYVRNIGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATSNKADDVIILRPG-TDPALGLGVCHLLIKNNHY----D -------ENYLRANTDLPLLIRTDNWKNLKASDIIAD---YK---------LADLTHH--L -KVMKPGEHPTMPPAFQ-ATAFVAEDVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTAENTS-----------------------------IMTGVPVEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATNHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GSPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLKGGFIS -R--- ->RFC33776|Nitrotoga_sp_LAW ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAD----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSMKRFAQ-GLALLDAYVRNVGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATSNKADDVIILRPG-TDPALGLGVCHLLIKNNHY----D -------ENYLRANTDLPLLIRTDNWKNLKASDIIAD---YK---------LADLTHH--L -KVMKPGEHPTMPPAFQ-ATAFVAEDVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTAENTS-----------------------------IMTGVPVEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NF---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATNHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLKGGFIS -R--- ->RFC30723|Nitrotoga_sp_MKT ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAD----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSMKRFAQ-GLALLDAYVRNVGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATSNKADDVIILRPG-TDPALGLGVCHLLIKNNHY----D -------ENYLRANTDLPLLIRTDNWKNLKASDIIAD---YK---------LADLTHH--L -KVMKPGEHPTMPPAFQ-STAFVAEDVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTPENTS-----------------------------IMTGVPVEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NF---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATNHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLKGGFIS -R--- ->RFC31618|Nitrotoga_sp_SPKER --------------------------------------------------------KLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAE----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSLKRFAQ-GLALLDAYVRNIGA -DEASGAKVLDSYSWHTDLAPGCPMVTGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATSNKADDVIILRPG-TDPALGLGVCHLLIKNNHY----D -------ENYLRANTDMPLLIRTDNWKNLKASDIIPD---YK---------LAELTHH--L -KVMKPGEGPTMPPAFQ-STAFVSEEVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGEY----- -------------------------------------EVTLV-DGKKIKVTPVFQL----- ----QKEYLEE-YTAENTS-----------------------------IMTGVPSEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KMAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTALT---------------------------------------- ----------------GDQRF--ADFFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--TIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGH -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GSPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLQGGFIS -R--- ->BBJ23760|Nitrotoga_sp_AM1 ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAE----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSLKRFSQ-GLALLDAYVRNIGP -DEASGAKVLDSYSWHTDLAPGCPMVTGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATANKADDVIIIRPG-TDPALGLGVCHLLIKNNQY----D -------ENYLRANTDMPLLIRTDNWKNLKASDIFPD---YK---------LAELTHH--L -KVMKPGENPTQPVAFQ-STAFVSEEVRKFW---------GDNVVWDRKTNK--AVPLT-- --------RDECGARYAAKGV------D---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVTTVFQL----- ----HKEYLEE-YTAENTS-----------------------------IMTGAPMEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTALT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGVP--TIFMART----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GSPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLQGGFIS -R--- ->BBJ23368|Nitrotoga_sp_AM1 ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAE----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSLKRFSQ-GLALLDAYVRNIGP -DEASGAKVLDSYSWHTDLAPGCPMVTGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATANKADDVIIIRPG-TDPALGLGVCHLLIKNNQY----D -------ENYLRANTDMPLLIRTDNWKNLKASDIFPD---YK---------LAELTHH--L -KVMKPGENPTQPVAFQ-STAFVSEEVRKFW---------GDNVVWDRKTNK--AVPLT-- --------RDECGARYAAKGV------D---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVTTVFQL----- ----HKEYLEE-YTAENTS-----------------------------IMTGAPMEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTALT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGVP--TIFMART----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GSPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLQGGFIS -R--- ->BBJ23476|Nitrotoga_sp_AM1 ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRAGFKA----------WVE----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYAGDKGAALL-TRQG -YDPEMIASM------HGCGCKVMKFRAGMAALGVLRIYSLKRFAQ-GLALLDAYVRNIGS -DEASGAKVMDSYSWHTDLAPGCPMVSGHQQLDYEFMAYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATANKADDVIIIRPG-TDPALGLGVCHLLIKNNQY----D -------ENYLRANTDMPLLIRTDNWKNLKASDIFPD---YK---------LAELTHH--L -KVMKPGEEPTQPVAFQ-ATAFVSEEVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGEY----- -------------------------------------EVTLV-DGKKIKVAPVFQL----- ----QKEYLEE-FTAENTS-----------------------------IMTGAPMEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTALT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGVP--TIFMART----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HVAAKGYRPTY--ESLQMRTYLQGGFIS -R--- ->blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1348658_11 rank: C; deu:DBW_2564 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------KEIGIVDNDWV-- ----------------EAYNDHGVTVTRAIVSARIPSGICILYHAPE-------------- ---RTISVPKSPMRGNKRAGGHNSPT---RVHLKPSLMVGGYGQ---------FTYSFNYW -GPT-GVNRDTFILVRKLP------GKPEF------------------------------- ----- ->CRI68048|Thiocapsa_sp_KS1 ------------------------------------------------------------- -------------------MSK--TKDDNG--NGG-SRWFRELDEPR------KW-EDFYR -RRWQY------DKSVRTSHS-VNCSGSCSWEVFVKNGMITWELQKTDWPQI-----NDET -PNYEPRGCQRGISASWYPYSPVRPKYPYVRAVLLDFWRAERAAGKDPI----------AA -WGAIVENPERSKAYRNARGKAGWRRTTWDEATEIIAAAKIYTIKEH-------------- ----------GADHLASFSPIPAMSMVSFLSGHRL-------------------------- -SNLLGGTMLSFYEWYHDLPHVMPMIWGDQTDVHESADWYQSAYWIVMGSNLPMTRTADAH -FASEHKYNGGKLVNLSPDYSDVTKFADLWVPVRPG-TDTAFILSCIHVILQEFHV----N -RRSEYFHSYVAQYTNLPFLVILD-----QEGDHFASGRFLR---------ASDVAAY--- ---------------------AD--EELADW----------KLPCFD-KEGE--LRLPGGT -LGFRWEEKNTGRWNLKNEDAVTAQPFD---------------------PLLTLMDGEFEE -VIVEYADFTHTFNVEFGTTALRGEKARKSLRGVPSRVLTKK-DGTK---VRVATA----- ----YDLLLAS-FGVNRGLSGSGYPKDYDDASEAYTPAWQE-------QETGVDRNLAIRV -AREW------ADTAEKTKGKCLFITGSGILHWYHGGSLTYRSEAVMGILTGCQGRNGG-G ---FAHYVGTEKIRNMA---AIGTIGNAADWGNVGRQQNSTSYFYFHTDQWR-YDGMSLDP -LWAPRAKEMPARANHAADMNAVAVRNGWLPFFPQF-----DERNPTDVMQDARKAGCKSL -EDVK-----TWVAQQF-----KE---------------RKLKFALPNVDAPK-NHPKVLW -IYRGNLIGT---SMRGHELNLKHMLGTHNNVLGGETRA----KDMVNEIDWTENAPLGKL -DLIYNVNLRMDSSANYSDIVLPTAHWYEKFDLTCTD--LH-SFLHP----F-TPAHDPAY -ESKHDWEAFRLIAEKISELAKVHLPDPIEDLVMTALSTDTPDEMAQPM---GELRDWWKG -ESEPIPGKTFPNVSVVTRDY--TKIHDMYTTLGPAVTKPNSYGAKGIKGDLAEVYEQMKE -SYLVGEKQGRPNMETAAKVCEVILRISPESDGELSY-----------QIFKNLEKR---- ------CGVPLAHIVEPER----E-TAYHYP-DLISQPRRALTSPHWSAIETKGRTYSPWT -LNIEALKPFHTLT------GRQEIYYDHRMFRDLGEDFPVYKPPVDMV--S--IGDVAQ- -------------------------KDIKMKGAKLFRF-------------------ITPH -QKWGIHSMFGDSWQMQNMFR---------------GGPTVWINDDDARDIGVKDNDWV-- ----------------EIFNENGIQVARAVVSHTVPRDMSIVYHQTERH-------VNVP- ---FSSLAR-ERGASDLRGGNNNATT---RIMMNPATMVGGYANWTYWLNYQGTS------ -----PSERDCVVLIRKKP-METRGRKVIY---QESQL--------NVGA----------- ----- ->NASQAN2011_330_B_bin.17_k121_430440_3 rank: A; amyy:YIM_22320 narG; Nitrate reductase alpha subunit; K00370 (db=kegg) -----------------------------------------------------MFHNASLG -HTATMGRTDDVPNGTEEALIK--FGRFFAGGEVSKDLLSVTKAGGR------EG-DVFYR -DRWSH------DKVVRSTHG-VNCTGSCSWKVYVKDGIITWETQQTDYPSVG-----PDS -PEYEPRGCPRGAAFSWYTYSPTRIRFPYIRSVLLE---------MYREAKGRL-GDSVLA -WADVVDNSENRQRYHRARGKGGLVRVSWSEVSEIIAAAHVHTIKKY----GPDRI-FGFS -PIPAMSMAS------HAAGARFISL----------------------------------- ----MGGSMLSFYDWYADLPVASPQVFGDQTDVPESADWFNASYLIMWGSNVPVTRTPDAH -FMTEARYKGQKVIAISPDYADNTKFADEWVAPHPG-TDGALGMAMGHVILKEFFV----D -KQVPRFQDYVKKFTDLPYLVSLRK----KDGSWVPDKFLVASD-------LGDVSEG--- -----SRFKTVVLDSSTGETFVPNGSLGHRY-------NDSSTGKWNLDLEGVDPLLSV-- --------YGKKGAVSAPVLM----------------------------PRFDQGQ----- -------------------------------------EVSES-GGVLARGVPVIEIAGKTV -TTVYDLMLAQ-YGVAREG--------LDGDWPEGYDDRSPYTPSWQEEITSVPAVQAIRI -AREF------AQNAIDSEGRSMILLGAGTNHWFHSD-TMYRTFLALVTLTGCQGVNGG-G ---WAHYVGQEKCRPVT---GWAQLAFGADWSRPARQMIGTAFWYVSTDQWRYDALGSDLL -------ATPLGEGRFKDMTAIDVIAQSARMGWMPS-----YPSLN-RNSLDLVDEAREKG -VDPA-----QHVINEL-----KS---------------GDLQFAIENPDAPE-NWPRVLT -VWRANILGS---SSKGNEYFLKHLLGTDNSVRA----NENEPDARPKDVKWHEDAPEGKL -DLLVSVDFRMTSTGLFGDILLPAATW--YEKHDLSSTDMH-PFVHA----F-TPAINPPW -ETKTDYEIFQMLGRQVSEQAKGHLGER-EDLVVVPLLHDTPDAMATPG---GVVLDWKKG -EVEPIPGVTMPKLVVVKRDY--SQIGEKMAALGPLIDTLGTNTKGVPVSVLPEIELL--- -------RHSNGVASTGVGAGRPSLARDVDACEAILALSGTTNGRVAVAGFRALEKR---- ------TGQKLTDLALDNE----G-KRITFA-DTQARPVPVITSPEWSGSEHGGRRYTAFA -INVERLKPWHTLT------GRQHFFIDHDWMSELGEQLPVFRPPLNMHRIF--GS----- -------------------------QGDGVAKEVTVRY-------------------LTPH -SKWSIHSEYQDNLFMLSLSR---------------GGQEIWMSVEDAEIIGVKDNEWI-- ----------------EAYNRNGVVVARACISHRMPSGTVFMYHAKD-------------- ---RVVDVP-LAETSGKRGGIHNSLT---RLVIKPTHLIGGYAQ---------LTFAFNYL -GPT-GNQRDEVTVIRRRS--------------------------QDVEY----------- ----- ->GCA_003453735_00577|DMNE01000186unannotatedprotein ------------------------------------------------------------- --------------------MG--------------WIKDIFDPKAR------LW-EEFYR -SRWQY------DKKVRSTHG-VNCTGGCSWEVYVKDGIITWEMQETDYPLLE-----PGL -PHYEPRGCQRGITFSWYIYSPLRIKYPYIRGVLLD---------LWRKAKSIH-TDTVAA -WESVVENEESRRSYQKARGKGGLRRTTWEEALEIIAASTIYTAKKY----GPDRV-IGFT -PIPAMSMLS------YASGTRFLQL----------------------------------- ----FGGVALSFYDWYADLPPASPEVWGEKTDVAESADWYNSKYIVAMGANLSMTRTPDVH -FVAEARNNGTKLVVLSPDFSQVSKYADWWLPVTAG-HDGAFWMAVDHVILKEFFV----D -RQVQYFSDYLKRYSDAPFLVEIE-----GGEGSLRAGRFLR---------ANTLSRY--R -DAENGEWKLLVFDGKAKEPRMPNGSVGFRW--------QERKGQWNLEM----------- --------KDGADDTIIQPLLSLFEDRD---------------------AAVSINF----- ---------------------TEFASGRTFKRAVPVKYLQTE-KGR----VLVATV----- ----FDLLMAQ-MGVGRGL--------EGDFAEDYNDAERPYTPAWQEQFTGVSRDTLVCF -AREW------AVTAEKTKGKCTIIVGSGVNHWYHSN-LNYRAGITALILCGCVGVNGG-G ---MNHYTGQEKVAPEA---SWKSIAFALDWIKPPRLQNTPSFHYVHSDQWRYAE------ --------PENGIKVLEYMHPMDVLVNAVRMGWLPF-----YPQFN-RNPIDLVREAEESG -AKS------EQEIIEWLVLQLKD---------------KKIRFAVEDPDAPE-NWPRVWY -IWRGNAILA---SMKGHEYVLKHYLGTSTNAVA-----DEIVSASIKEVHSKGSAPEGKL -DLVIDINFRMDTSALFSDIILPAATW--YEKDDLNTTDLH-SFIHP----L-SAAVPPCW -EAKNDWDIFKEIALKISQLAPAHFSEPFREIVATPLMHDTRQEISQPQ-----VKDWHKD -KCQAIPGKTMPKFSVVERDY--TNLFKQFISYGHKEKEEGMGERGIQWKIGDMYDEF--- --------MKGVPVEQWGGERYPSLSEARDAANVILHFAPETNGEIAYRGFKALEEI---- ------TGMPLSDLAERQR----S-VRTIFP-DLLDQPKRILTSPCWSGITNGGRAYAPYC -INVERLMPWRTLTGRQHXAGRQHFYLDHEGYISFGENLPTFKSRVLLQN----------- ----------SGDIG----------KSTAIEKSLVLNF-------------------LTPH -GKWHMHTTYYDNLLMLTLSR---------------GVEPFWLNSKDAEDIGVKDNDWV-- ----------------EVYNDNGVVVTRAVVSARTPAGVGIFYHAPERT------------ ----ISFPK-SPLRNMKRGGGTNSLT---RIRLKPVLMVGGYAQ---------FSYAFNYW -GPI-GPDRDTYAYVHKLD------GKPVF------------------------------- ----- ->sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_391728_1 rank: A; deu:DBW_2564 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ---------------MRGALLD-------------------------------LW-QEARR -QH-------------------------------------------------------PDD -PV--------------------------------------------------------AA -WASITDDPARRKRYQEARGKGGFRRVSWSEAQELIAAANLHTVKKY----GPDRL-VGFS -PIPAMSMIS------YAAGARFLQL----------------------------------- ----MGGLCLSFYDWYCDLPPASPEIWGEQTDVAESADWFHSKFIATVGSNVLMTRTPDAH -FLVEARHKGAKVVVFSPDFSQTSKVADEWIPINQG-SDTAFWMAVNHVILREFHA----E -RSVPYFQTYLRENTDAGFLVVMKA----DAQGNYRPGSLLR---------ASQLAET--Q -GEENAEWKSFVLD-TQGNLRVPVGQVGHRW--------QKSKGQWNIKQED--ARTGE-- --------AFEAALTLRDSAT----------------------------GAVKAVF----- ------------------DDFSEGRTDRVRVREVPVREVQTV-EGP----VYVTTV----- ----YDLHLAQ-HGVNRGF--------GGDWPTGYADDTHPFTPAWQEQYTGIKAETVINF -ARQW------ATTAEKSQGKCTVIIGAGVNHWYHNN-LIYRACINALIYCGCVGRNGG-G ---LNHYVGQEKLVPQA---SWGPIAFGTDWSAPPRLQNAPSFHYMHSDQWRYDRKFDEMC -------PVADKSHLMASGHTADKQALAVRSGWLPC-----YPQFTEHN-FKLVQEAEDRG -ADPV-----QHVVGRL-----KD---------------RSLKFAMEDVDNPA-CFPRVWY -IWRGNAIQA---SAKGHEYFLKHYLGTHHNSIA-----VEHAREDVKEVTWHDKLELGKM -DLIVDVNFRMDTSALYSDIVLPTASW--YEKDDLSSTDMH-SFIHP----L-QAAVPPCW -EAKSDWKIFRGIAEETSRMAQRYLPEPVKDFVCTPLMHDTPAEIAQPT-----VKDWAKG -ECEAIPGKTMPNMKVVERDY--TKIFQKYITLGRNFRNNGLGIHGTTYPVDDLYDAY--- --------LQDHPVEEVDGERYPSLRADRSVCEAILHFAAETNGELAYRAYEAESHK---- ------TGIDHTHLAAPTR----G-VRYNFA-DLCTQPRRSLTTPFWTGITNGSRTYSAYC -QNVEERIPWRTLT------GRQHLYFDHEAYVAYGEHLPTFKPRADLRTTR--DLDMTG- ----------------------------VESGALVLNY-------------------LTPH -GKWHIHSTFGDTLRMETLSR---------------GIEPFWMNEQDAGLLGIHDNDWI-- ----------------EVLNDHGTVVTRACVSARIPRGICFIYHATERT------------ ----IGNPK-SKHRGMRRAGGHNSLT---RARLKPLFMIGGYAQ---------FTYAFNYW -GPQ-GVNRDTFVVVKKLD-------KPEW------------------------------- ----- ->blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1581374_9 rank: A; deu:DBW_2564 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ---------------------------------MN-WIEEISNPHAR------QW-EEFYR -NRWQH------DRVVRSTHG-VNCTGSCSWMIYVKDGIVTWELQALDYPVLN-----NGL -PPYEPRGCQRGISFSWYQYSPIRVKHPYMRGVLMD---------LWRKAKETH-QDPVEA -WTAVVEDEAARKSFHQARGKGGFRRASWDEVTEIIAASTMYTIKKY----GPDRI-IGFS -PIPAMSMLS------YAGGSRLMQL----------------------------------- ----LGAVSMSFYDWYSDLPPASPETWGEQTDVAESADWFNSKYIVSVGSNMSMTRTPDVH -FAAEARHNGTKLVVFAPDFNQVAKYADWWVPVNAG-QDGAFWMAVNHVIMNEFHY----Q -NPTPYFLDYMKRYTDSPFLVELN-----EVDGKFVPGRMVR---------AGQVERT--K -DVENGEWKFLVWDELSNAPRMPQGSLGFRW--------QQQKGQWNLEPKD--G------ --------LDGSEIRPQLTFL---GATD---------------------EQLSVSF----- ---------------------AEFGEGKSFQRNIPVRTIETA-NGK----VAVATI----- ----YDLLMAQ-YGVGRGL--------EGDYPASYDDENLSYTPAWQERYTGIDRQTVIQF -AREW------ATTAEKTEGKCMIIIGAGVNHWYHNN-LIYRACIGALMLTGCVGRNGG-G ---LNHYVGQEKLAPAA---PWASIAFALDWQKPPRQMNSPSFHYINSDQWRYERTYTEPQ ---PVSRPDSESHRDMTQEHTLDANIRAVRMGWLPS-----YPQFN-VSSLEIIRKAEQAG -AKS------DAEIRQWVVNQLKS---------------GELKFAVQDPDAPE-NWPRLWF -IWRGNALNA---SAKGQEYFFKHYLGTHHQIIS-----EEVDKSHFNEVTYRDEAPEGKF -DLVVDINFRMDTSALYSDIVLPTASW--YEKDDLNSTDMH-SFIHP----L-QMAVPPSW -ESKSDWDIFKILAEKFSELAPTHFPEPVRDLVAMPLQHDTPAEMAQAH-----IRDWAKG -ECEPIPGVTMPNFIVTERDY--VNLGKRFVSLGPKVEKEGFAIHGIHMEVGDLYREL--- --------LKSKPTVTWNGQTYPSLTVARDAANIILNLAPETNGEVAYRAFKAEEER---- ------IGLKLTDLAEPTR----A-VRTDFK-DVVRQPRRLLNSPIWTGIMTDGRPYAAYT -LNVERLVPWRTLT------GRQHFYLDHEGYLAYGEHLPTYKPRPD-------------- ----------PLAFGDLEKSHS-------EGKTIQLNY-------------------LTPH -AKWHIHSNYFDNDRMLTLSR---------------GLEPLWISEKDAKEIGIVDNDWV-- ----------------EAYNDHGVTVTRAIVSARIPSGICILYH----------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->gunnisonriver_2019_sw_WHONDRS-S19S_0062_A_bin.22_Ga0451722_0001801_3 rank: A; htq:FRZ44_42870 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------ILDKLMF--FKAGTE--RFA-DGYGAVTEESR------AW-EDGYR -QRWQY------DKVVRSTHG-VNCTGSCGWQVYVKSGFVTWETQVLDYPLTR-----PDL -PNHEPRGCARGASASWYLYSSNRIKYPLMRRQLMD---------LWREARRRH-KDPVEA -WRSIVETPELARRYKQARGRGGFVRAEWDEANELIVASNTYTIKEY----GPDRV-VGFS -PIPAMSMVS------YSAGSRYLSL----------------------------------- ----LGGVCLSFYDWYCDLPPASPQTWGEQTDVPESADWYNSNFLIVWGSNVPQTRTPDAH -YFAEVRYKGTKTVVVTPDFSEAAKFADLWLDPKQG-TDAAMAMAMGHVILKEFHA----D -NPEPYFRDYCQQYSDLPFLVRL-----VKQGEHYVPERFVR---------ASDFADG-QG -QDNNPEWKTLGFDELTDELVVPNGSIGFRW---------GEDGRWNLEQKD--A------ --------RSGVAAKLRLSLL------EAPSEAPGPKSERSTQVANVAFPYFGGRH----- -----------------HEFFESSPQDEIQVRNVPARTLALK-DGE----YLVATV----- ----FDLMLAH-YGIDRGL---------GGVAASSYDDDVPYTPAWQERITGVSRDKVIAV -ARGF------ADNAAKTRGRSMVIIGTGVNQWFNND-MTYRAVINMLILCGTVGRSGG-G ---WAHYVGQEKLRPQP---GWQTLAFALDWSRPPRLMNGTSFWYAHTDQWRYEKVQASEL -------LSPTREQGDWDVSLIDYNVRSERMGWLPS-----APQLE-KNPLRLGREIHEQK -LDAP-----TAVAHQL-----ET---------------RTLRLSCEDPDNPR-NFPRNLF -VWRSNLLGS---SSKGHEYFLKHLVGAKHGVLG--ADLKELGERLPTEVDFHDEAPEGKL -DLLVTIDFRMSSNCMYSDIVLPTATW--YEKNDLSTTDMH-PFIHP----L-TGAVDPLW -ECKSDWEIFRGFAEKFSEVCEGHLGTE-YDVVLQPLQHDAPGELGQAL----GVVDWKKG -ECRAIPGKTMPNVQLVERDY--PATYKRFVSLGPLVNSLGMSTKGLKWDATEEVELL--- ------KEKNGEVAEAGVGHGRPRIQTDLHACETILALSPETNGRVAVKAWKALEVR---- ------TGRQHAHLAEGRA----A-ERITFD-DVVAQPRKVITSPTWSGAESEKVTYSAGY -INVEEQVPWRTLT------GRQQTYQDHPWMRAFGEHFPSYKPPIDTK--T--VGTLLR- -------------------------SQENGNPQLVLNF-------------------LTPH -QKWGIHSSFTDTQMMLTLSR---------------GGPNIWVSEQDARRLGISDNDWI-- ----------------EAYNSNGALVARAVVSQRIKAGCAFMYHSQD-------------- ---KTVNAP-GTETTGTR-GIHNSIS---RIVVKPTHMIGGYAH---------QSYGFNYY -GTV-GANRDDFVVIRKVR-----------------NLDFMDGTPVRILAPAVSVGGAE-- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001351_7 rank: A; ddz:DSYM_27970 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLKF--FERVQS--TFS-GGHGIVTNEDR------KW-EDAYR -NRWRH------DKIVRSTHG-VNCTGGCSWKIFVKNGLVAFEMQQTDYPRTR-----DDL -PNHEPRGCQRGASFSWYLYSPHRIKHPLVRGRLLD----------LYRAERKSGKDPVEA -WEAIQADPAKRIQYTAVRGLGGFVRTNWDEVTEIAAAANVYTIKKW----GPDRI-YGFS -PIPAMSMLS------YAAGSRYLSL----------------------------------- ----IGGACGSFYDWYCDLPAASPQTWGEQTDVPEAADWYNSTYLIICGANLPMTRTPDAH -FATEVRYKGAKVVSMAPDYAEFVKFADLWMPVKQG-TDSAAFLAMGHVALKEFHV----K -RQDPYFQEYIRKYTDLPMLVMLR-----KTDDGYASDRTLR---------ASDFTGN-LG -ESNNPEWKTIVYDEKTKSYVAPNGSVGFRW---------GEEGKWNLLPKNAANQEEILA -ELTCIDSRDDV----ASVGF----------------------------PHFNAGE----- --------------------------PGLLYRNVPVRKLKLA-SGEDVLVSSV-------- ----YDLQVAQ-YGIDRGL-------GGGNVTDSYEDDKVAYTPAWAEKVTGVKRADLIRT -GREF------AENASKTKGKSMVIMGAAINHWYHND-LSYRAIMNLLHMCGCVGQSGG-G ---WAHYVGQEKLRPQA---GWAPIAFATDWHRPPRHMNSTTFWYFQTDQWRYEKVSADGL -------LADNAKSKYKGYQLADYNVVSQRLGWLPS-----APHFN-KNPIDIVTEAEKAG -ATD------EASIAKHMVEQLKS---------------GKLYFASEDVDAPE-NFVRNLF -VWRSNLLGC---SAKGHEYFLKHLIGAQNGVLQ-----EGVEGRACKEIKWHENGPTAKL -DLMVDINFRLNSTGAYSDIILPTATW--YEKHDLNTTDMH-PFVHP----L-SEAVSPGW -ESKSDWQIFQNIAKAFSKLAEKHLGTK-KDVVALPMQHDSPFELAQAM----GVKDWKKG -ECEPIPGKTLPLLKVVSRDY--PNTLKKFQAIGPLLNKLGNNVKGIDWNTDQELNEL--- ------KSLNGEILEDGISKGMPSIAADIAACDAVLRMAPETNGEVAHKSWSALSKK---- ------TGIDHHHLYAGRH----E-DKITFR-DIQAQPRKIITAPTWSGIESETVSYTAGY -TNIHEHIPFRTLT------GRAQFYQDHEWMLDFGEGFCAFRPGLDMKAIEATPKSVLA- ------------------------------KPHLVLNW-------------------ITPH -SKWGIHSSYQDNLRMLNLFR---------------GGPYFWIAEDDAKSIGLEDNDWV-- ----------------EAVNGNGATVARVVVSQRVPRGMALMYHAQE-------------- ---KIVNVP-GSPTTGKRGGILNSVT---RVVVKPTNMVGGYAQ---------LSYGFNYY -GTV-GTQRDEFVVVHKIE-----DKDVDW-----LERPLTPER--EGKLNPPGVGPR--- ----- ->NASQAN2011_286_B_bin.1_k121_764018_13 rank: A; sdf:ACG33_10925 nitrate reductase alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ---------------MSNLLNR--LNFLKPAAVPFSDGHGATRDDDR------GW-EDAYR -QRWQY------DKIVRSTHG-VNCTGSCSWKVYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRVKYPLMRSALLK---------LWRE--ARKTLAPVDA -WGSIVQDQTKAKSYKSKRGMGGFVRVDWDEANELIAASNLYTTKTF----GPDRV-IGFS -PIPAMSMVS------YAAGARYLSL----------------------------------- ----LGGACLSFYDWYCDLPPASPQVWGEQTDVPESADWYNSRYIIAWGSNVPQTRTPDAH -FFTEARYNGTKTVSITPDYSEVAKLTDHWLHPKQG-TDAALAFAFGHVILREFHL----D -NPSEYFTDYCRQYSDMPMLVRLDP----RDDGSYATSRYLR---------ASDLDGA-LG -EANNPEWKTLAFDENSGGLVVPHGSVGFRW---------GEKGRWNIEERD--------- --------SQGRDTRLVLSLK------D-----------AHDGFVNVCFPYFGGVE----- -----------------HEGWTSSPREDILKRHIPTRKIMQA-DGSEVLVASV-------- ----YDLLLAQ-YGLDRGF--------GGEHVAGSFDDDVPGTPAWQERITGVPRAEVIEI -AREF------ARTADKTRGRSMIIVGAAMNHWYHND-MNYRGLINMLVMCGCIGQTGG-G ---WAHYVGQEKLRPQS---GWAPLAFGTDWVKPPRQMNGTSFFYFNSDQWRYEKLDVSEI -------ISPLADPKKYSGSLVDFNLRAVRMGWLPS-----APQLN-MNPLAFVRDAEAKG -LDPV-----KHAVDQF-----KS---------------GGLDFAYADPDAPE-NFPRNMF -IWRSNLFGS---SGKGHEYMLKHLLGTRHGLQG--KDLGQRGAVKPQDVKWRDEATEGKL -DLVVTLDFRMCTTALYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWDIFKGIARTVSALAPGVLGVE-KDLVLTPVLHDTPNELAMPF----GVTDWKKG -ECEAIPGKTMPSMTVVERDY--PNLYKKFTSLGPLLDKQGNGGKGMSWDTQDEVDFL--- ------TQLNHPVLAEGISKGRPQIESAIDACEVILHLAPETNGHVAVKAWESLGTF---- ------TGRDHTHLAVGKE----H-EAIRFR-DVQAQPRKIISSPIWSGLEDEHVSYNAGY -TNVHELIPWRTLT------GRQQFYMDHEWMLAFGEGFMGYRPPVNTKTIA--P--MLG- -------------------------AKPNGNKEIVLNW-------------------ITPH -QKWGIHSTYSDNLIMQTLSR---------------GGPIVWLSEDDAKRAGIEDNDWI-- ----------------ELFNVNGAIAARAVVSQRVMSGMAMMYHAQE-------------- ---RIINTP-GAEITGTRGGIHNSVT---RVVVKPTHMIGGYAQ---------FSYGFNYY -GTT-GTNRDEFVIVRKMD-------KVEWHDGEPVPNNVEVAR----------------- ----- ->NASQAN2011_286_F_bin.29_scaffold_54_27 rank: A; sdf:ACG33_10925 nitrate reductase alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ---------------MSNLLNR--LNFLKPAAVPFSDGHGATRDDDR------GW-EDAYR -QRWQY------DKIVRSTHG-VNCTGSCSWKVYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRVKYPLMRSALLK---------LWRE--ARKTLAPVDA -WGSIVQDQTKAKSYKSKRGMGGFVRVDWDEANELIAASNLYTTKTF----GPDRV-IGFS -PIPAMSMVS------YAAGARYLSL----------------------------------- ----LGGACLSFYDWYCDLPPASPQVWGEQTDVPESADWYNSRYIIAWGSNVPQTRTPDAH -FFTEARYNGTKTVSITPDYSEVAKLTDHWLHPKQG-TDAALAFAFGHVILREFHL----D -NPSEYFTDYCRQYSDMPMLVRLDP----RDDGSYATSRYLR---------ASDLDGA-LG -EANNPEWKTLAFDENSGGLVVPHGSVGFRW---------GEKGRWNIEERD--------- --------SQGRDTRLVLSLK------D--------AHDGFVNVCF---PYFGGVE----- -----------------HEGWTSSPREDILKRHIPTRKIMQA-DGSEVLVASV-------- ----YDLLLAQ-YGLDRGF--------GGEHVAGSFDDDVPGTPAWQERITGVPRAEVIEI -AREF------ARTADKTRGRSMIIVGAAMNHWYHND-MNYRGLINMLVMCGCIGQTGG-G ---WAHYVGQEKLRPQS---GWAPLAFGTDWVKPPRQMNGTSFFYFNSDQWRYEKLDVSEI -------ISPLADPKKYSGSLVDFNLRAVRMGWLPS-----APQLN-MNPLAFVRDAEAKG -LDPV-----KHAVDQF-----KS---------------GGLDFAYADPDAPE-NFPRNMF -IWRSNLFGS---SGKGHEYMLKHLLGTRHGLQG--KDLGQRGAVKPQDVKWRDEATEGKL -DLVVTLDFRMCTTALYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWDIFKGIARTVSALAPGVLGVE-KDLVLTPVLHDTPNELAMPF----GVTDWKKG -ECEAIPGKTMPSMTVVERDY--PNLYKKFTSLGPLLDKQGNGGKGMSWDTQDEVDFL--- ------TQLNHPVLAEGISKGRPQIESAIDACEVILHLAPETNGHVAVKAWESLGTF---- ------TGRDHTHLAVGKE----H-EAIRFR-DVQAQPRKIISSPIWSGLEDEHVSYNAGY -TNVHELIPWRTLT------GRQQFYMDHEWMLAFGEGFMGYRPPVNTKTIA--P--MLG- -------------------------AKPNGNKEIVLNW-------------------ITPH -QKWGIHSTYSDNLIMQTLSR---------------GGPIVWLSEDDAKRAGIEDNDWI-- ----------------ELFNVNGAIAARAVVSQRVMSGMAMMYHAQE-------------- ---RIINTP-GAEITGTRGGIHNSVT---RVVVKPTHMIGGYAQ---------FSYGFNYY -GTT-GTNRDEFVIVRKMD-------KVEWHDGEPVPNNVEVAR----------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_201_6 rank: A; thes:FHQ07_07000 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSY--------FLDRLNF--FKPAPE--PFA-DGHGAARREDR------SW-EDSYR -RRWQY------DKIVRSTHG-VNCTGSCSWKVYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRVKYPLIRAALLK---------LWREARKS--KSPVEA -WASIVSDPVKAKSYKQKRGMGGFVRSTWDEVNEIIAASNLYTVKEF----GPDRV-VGFS -PIPAMSMVS------YAAGARYLSL----------------------------------- ----LGGGCLSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSRYIIAWGSNVPQTRTPDAH -FFTEARYNGTKTVAITPDYSEVAKLTDHWLHPKQG-TDAALAFAFGHVILREFHV----D -QPSQYFTDYCRQYSDMPMLVRLER----RADGRLVPERYLR---------AADLGGL--G -ETNNPEWKTLAIDDNSGDITVPNGSVGFRW---------GEKGKWNIEEKD--------- --------SAGRETRLRLSLK------D--------HADGVESVSF---PYFGGIE----- -----------------NEYWTESKFSDVLERNVPVKRLNLA-DGKEWVVASV-------- ----YDLLLAQ-YGVDRGL--------GGGNVASSYDDNVPGTPAWQEKITGVPRAEVIQI -AREF------ARTADKTHGRSMVIVGAAMNHWFHND-MNYRGLINMLVMCGCVGQTGG-G ---WAHYVGQEKLRPQS---GWAPIAFGTDWSKPPRQMNGTSFFYFNSSQYRYEKLGVEEI -------LSPLADKSKYSGSLADYNLRAVRMGWLPS-----LPQLN-TNPMKLVREAEAAG -VAPV-----DYAVGKL-----KD---------------GSLDFAFADPDAPE-NYPRNLF -IWRSNLLGS---SGKGHEYMLKHLLGTRHGLQG--KDLGERGAAKPEEIKWRDEAPEGKL -DLLVTLDFRMCTTALYSDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWEIFKGIARTVSQLAPGVLGIE-KDLVLVPTLHDTPNEIAMPY----GVTDWKKG -ECDLIPGKTAPSMVVVERDY--PNLYKKFTSIGPLLDTQGNGGKGMNWDTTHEIEFL--- ------GKLNHEVLEAGVSHGRPQLETAIDCAEAIMHLAPETNGHVAVKAWASLETF---- ------TGREHQHLAVGKE----H-EAIRFR-DIQAQPRKIISSPIWSGLEDENVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHEWMRDFGEGFMQYRPPVDTKTIK--P--IIG- -------------------------KKPNGNREIVLNW-------------------ITPH -QKWGIHSTYSDNLIMQTLSR---------------GGPIVWLSEDDAKSAGIEDNDWI-- ----------------ELFNVNGAIAARAVVSQRMMNGIAMMYHAQE-------------- ---RILNTP-GSEITGTRGGIHNSVT---RVVVKPTHMIGGYAQ---------LAYGFNYY -GTV-GTNRDELVVVRKMN-------KVDW---LDGEPVPATKEAAR-------------- ----- ->NarG_Escherichia_coli_NP_415742 -----------------------------------------------SK------------ ---------------FLDRFRY--FKQKGE--TFA-DGHGQLLNTNR------DW-EDGYR -QRWQH------DKIVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRLKYPMMRKRLMK---------MWREAKALH-SDPVEA -WASIIEDADKAKSFKQARGRGGFVRSSWQEVNELIAASNVYTIKNY----GPDRV-AGFS -PIPAMSMVS------YASGARYLSL----------------------------------- ----IGGTCLSFYDWYCDLPPASPQTWGEQTDVPESADWYNSSYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAVTPDYAEIAKLCDLWLAPKQG-TDAAMALAMGHVMLREFHL----D -NPSQYFTDYVRRYTDMPMLVMLE-----ERDGYYAAGRMLR---------AADLVDA-LG -QENNPEWKTVAFN-TNGEMVAPNGSIGFRW---------GEKGKWNLEQRD--GKT---- --------GEETELQLSLLGS------Q----------DEIAEVGF---PYFGGDG----- -----------------TEHFNKVELENVLLHKLPVKRLQLA-DGSTALVTTVYDL----- -------TLAN-YGLERGL--------NDVNCATSYDDVKAYTPAWAEQITGVSRSQIIRI -AREF------ADNADKTHGRSMIIVGAGLNHWYHLD-MNYRGLINMLIFCGCVGQSGG-G ---WAHYVGQEKLRPQT---GWQPLAFALDWQRPARHMNSTSYFYNHSSQWRYETVTAEEL -------LSPMADKSRYTGHLIDFNVRAERMGWLPS-----APQLG-TNPLTIAGEAEKAG -MNPV-----DYTVKSL-----KE---------------GSIRFAAEQPENGK-NHPRNLF -IWRSNLLGS---SGKGHEFMLKYLLGT-EHGIQGKDLG-QQGGVKPEEVDWQDNGLEGKL -DLVVTLDFRLSSTCLYSDIILPTATW--YEKDDMNTSDMH-PFIHP----L-SAAVDPAW -EAKSDWEIYKAIAKKFSEVCVGHLGKE-TDIVTLPIQHDSAAELAQPL----DVKDWKKG -ECDLIPGKTAPHIMVVERDY--PATYERFTSIGPLMEKIGNGGKGIAWNTQSEMDLL--- -------RKLNYTKAEGPAKGQPMLNTAIDAAEMILTLAPETNGQVAVKAWAALSEF---- ------TGRDHTHLALNKE----D-EKIRFR-DIQAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHELIPWRTLS------GRQQLYQDHQWMRDFGESLLVYRPPIDTRS----VKEVIG- -------------------------QKSNGNQEKALNF-------------------LTPH -QKWGIHSTYSDNLLMLTLGR---------------GGPVVWLSEADAKDLGIADNDWI-- ----------------EVFNSNGALTARAVVSQRVPAGMTMMYHAQE-------------- ---RIVNLP-GSEITQQRGGIHNSVT---RITPKPTHMIGGYAH---------LAYGFNYY -GTV-GSNRDEFVVVRKMK-------NIDW---LDGE---------GNDQVQESVK----- ----- ->NarG_Halomonas_maura_gb_AAT47523 ------------------------------------------------------------- ----MSH--------FIDRLNF--FRKARE--PFA-NDHGEVRDESR------GW-EDGYR -QRWQH------DKVVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRLKHPLVRKPLLK---------LWREALEEK-GDPVDA -WASIVEDPAKTKQYKRARGMGGFVRADWNELNELIAASNVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNSGYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVSVTPDYAEVSKLTDEWLSAKQG-TDAALAMAMGHVILKEFHL----D -RPSAYFTDYVRRYTDMPCLVELEA----REDGSYVPGKQLR---------ASDFEAS-LG -QDNNPEWKTVAWDETRDQLVVPRGSIGFRW---------GEEGKWNLEPRD--------- --------AEGAEIKTRLSLA------E--------AHDDVARVAF---PYFGGIA----- -------------HEHFDHVKSGGASDELLFHSLPAKRLTLA-DGREILAVTVFDL----- -------MCAN-YGIDRGF-RSQEGKEGEDDGATAYDQVKPYTPAWQEKITGVPAEQCLRI -AREF------ADNADKTHGRSMIIVGAGMNHWYHMD-MNYRGLINMLVMCGCIGQSGG-G ---WSHYVGQEKLRPQT---GWLPLAFGLDWQRPPRHMNSTSFFYNHSSQWRYXKLEIKEI -------LSPLAKPADYSGSLIDFNVRSERMGWLPS-----APQLA-TNPLSLAGKAAEAG -QSTA-----DYVVDQL-----KA---------------GGLRFAAEDPDDPQ-NFPRNMF -IWRSNLLGS---SGKGHEYLLKYLLGT-RHGIQGKDLG-EDGGQKPEEVVWHEAAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-TAATDPAW -ESRSDWDIYKGIARAFSKACVGHLGEE-TDLVTLPLQHDSPAELAQPE-----VKDWKRG -ECEPIPGKTMPALVEVKRDY--PATYERFTSVGPLLDSLGNGGKGIGWKTEKEVELL--- -------GKLNYVKTEGPAKGRPRIESAIDAAEVILTLAPETNGQVSVKAWEALSKI---- ------TGRDHRHLAEPKE----E-EKIRFR-DVVAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHELIPWRTVS------GRQQFYQDHAWMRAFGESLLVYRPPIDTKAAV--SL----- ----------ADDKG-------------NGNPEIALNW-------------------ITPH -QKWGIHSTYSDNLLMQTLSR---------------GGPIVWLSKDDARSIGVEDNDWI-- ----------------ELYNANGAIAARAVVSQRVKNGMAMMYHAQE-------------- ---RILNMP-GSEVTGTRGGIHNSVT---RVCPKPTHMIGGYAQ---------LAYSFNYY -GTV-GSNRDEFVIVRKMK-------KIDW---LDGE---------GNDYEQEAVK----- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0001905_7 rank: C; this:HZT40_10960 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLTF--FKQRKT--PFA-QGHGAVTHEKR------DW-EDGYR -QRWQH------DKIVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASFSWYIYSANRLKYPLIRKPLME---------LWRSAKARH-TDPVVA -WESIVENPLSTNDYKTKRGLGGFIRSSWEEVNELIAAANVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGTCMSFYDWYCDLPPASPMIWGEQTDVPESADWYNSSYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAITPDYAEVAKHADQWLNPKQG-TDAALALAFGHVILKEFHL----D -KPSTYFTDYVRRYTDWPNLVLLEK----RDDGSYQAGRFAR---------ASDFVEG-LG -ESNNPDWKTVAIDEATGEIIAPNGSIGYRW---------GENSKWNIQQKHG-------- --------TDQQEVTLALSLI---------------------------------------- ------------------------------------------------------------- ----------------------------------------------------KQHDQIVEL -CLPY--------------------FGGVPSDYFKGN------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------VLKDVL----- ----------------------------RYQLPARQVTLAD-------------------- ------------------------------------------------------------- ----------------GTTGL---------------------------------------- --------------------------------LVTVYDLNMAN------------------ -----------------------Y------------------------------------- --------------------GISRGLGADDSAQDFNDA---------TAPYT--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------------PAWQEAI------------------------- ------------------------------------------------------------- ----- ->king_2019_sw_WHONDRS-S19S_0016_B_bin.5_k121_1281127_1 rank: A; gpb:HDN1F_13240 narG; Nitrate reductase, alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLQF--FNKVKS--TFA-DGHGAVVNEDR------GW-ENAYR -SRWQY------DNIVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCQRGASYSWYLYSANRLKYPMMRKPLLE---------LWRE--ARKSLSPVDA -WESIVENPVKSKAYKTKRGLGGFIRVDWEEANELVAAANIYTAKKY----GPDRI-NGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGTCLSFYDWYCDLPPSSPQTWGEQTDVPESADWYNSTFLMLWGSNVPQTRTPDAH -FYTEVRYKGAKSVVITPDYSEAAKFADLWLAPKQG-TDAALAMAFGHVVLKELHL----D -NPSEYFTEYCRKTTDMPHLVMLKT-----RGNAFVADRFLR---------ASDLSDN-LQ -QSNNPEWKTLVINENTNEMVVPNGSIGFRW---------GEDGKWNIQATDS-------- --------ADGSDIKARLSLI------E-----------NADQVVSVEFPYFGNLN----- -----------------HPHFTHTEHAEILERNVPARRIQLA-DGSDAYVVTVFDL----- -------LVAN-YGIDRGL--------GGENVAKSFDDDQPYTPAWQERITGVKREHVITV -ARQF------AENAHKTHGKSMVILGAGLNHWYHMD-MNYRGIINLLMMCGCIGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWHRPPRHMNGTSFFYNHTSQWRHEKLDVREI -------LSPLADKTAWSGSLLDYNVRAERMGWLPS-----APQLN-VNPLELTKAAAAAG -QSPV-----DYAVENL-----KS---------------GKLAFACEDPDNPV-NFPRNLF -VWRSNLLGS---SGKGHEYFLKYLLGTTHGVQG--KDLGEMGAPKPEEVVWHEQGAEGKL -DLLVTLDFRMSTTCMYSDVVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -ESRSDWDIYKGIARKFSELSVGHLGVE-KDLVLVPTLHDTPSELGQAV----GVKDWKKG -ECEPIPNKTLPNMVVVERDY--PNTYKKFTALGPLLDKLGNGGKGISWNTQSEVEQL--- ------RDLNYRVTEEGVSKGLPRIESDIDACEVVLMLAPETNGQVAMKAWAALSKI---- ------TGRDHTHLALPRE----D-DKIRYR-DVQAQPRKIISSPTWSGLESEHVSYNAGY -TNVHEMIPWRTLT------GRQQFYQDHLWMLGFGESLCVYKPPIDTKTIA--P--LLN- -------------------------QRSNGNGEVVLNF-------------------ITPH -QKWGIHSTYTDNLLMLTLSR---------------GGPCVWMSETDAKKVGIEDNDWI-- ----------------EAFNLNGALVARAVVSQRVPEGMVMMYHAQE-------------- ---KIVNVP-ASEITKTRGGIHNSVT---RTCPKPTHMIGAYAQ---------QSYGFNYY -GTV-GSNRDEFVIVRKLS-------KVDW---LDTPVAQA-------------------- ----- ->NarG_Pseudomonas_fluorescens_gb_AEV63780 ------------------------------------------------------------- ----MSH--------LLDQLRF--FNRKQG--EFS-DGHGETRKESR------DW-ENVYR -SRWQY------DKIVRSTHG-VNCTGSCSWKIYVKNGLITWETQQTDYPRTR-----NDL -PNHEPRGCPRGASYSWYIYSANRLKYPKIRKPLLK---------LWRE--ARQTLPPVEA -WASIVEDKAKADSYKSKRGMGGFIRSNWEEVNEIIAAANVYTVKEH----GPDRV-VGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPASPMVWGEQTDVPESADWYNSNYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAITPDYSEVAKLTDLWLNPKQG-TDAALAQAFNHVIFKEFHL----D -KPSAYFTEYAKRYTDLPVLVMLKPMLGAAPGAGYQPDRFLR---------ASDLTDN-LG -QDNNPEWKTIALD-AAGELVSPQGSIGYRW---------GEKGKWNILPREG-------- --------GEGREIDLKLSLI-------------------GGDVAEVAFPYFAGEA----- -----------------QEYFQHVAGDAVQFRRVPVHSVVLA-DGSVAKVATVFDL----- -------SAAN-LAIDRGL-------GGANVAKDYNDASVPGTPAWQEQITGVSREKAIQI -AREF------ADNADKTRGRSMIIVGAAMNHWYHMD-MNYRGLINMLMLCGCVGQTGG-G ---WAHYVGQEKLRPQC---GWLPLAFGLDWNRPPRQMNGTSFFYGHSSQWRHEKMSMHDV -------LSPLADKSQFPEHALDYNIRAERAGWLPS-----APQLN-TNPLHICRDAAAAG -MEPK-----DYVVKSL-----QD---------------GSLRFACEQPDSPV-NFPRNMF -IWRSNLLGS---SGKGHEYMLKYLLGTKNGVMN--EDIGHSTECKPTEAEWVDEGAIGKL -DLVTTLDFRMSSTCVYSDIVLPTATW--YEKDDMNTSDMH-PFIHP----L-SAAIDPAW -ESRSDWEIYKGIAKAFSAMSVGHLGVE-KDLVTVPLMHDSVGELAQPF----GGTDWKSA -GVAPVPGKNAPNLQVVERDY--PNIYKQFTSLGPMLEKLGNGGKGINWNTDTEVKFL--- ------GELNHKEVEAGISQGRPKIDSAIDAAEVILSLAPETNGHVAVKAWAALSEF---- ------TGIDHSHLAISKE----H-EAIRFR-DIQAQPRKIISSPTWSGLEDDHVSYNAGY -TNVHESIPWRTIT------GRQQFYQDHPWMQAFGEQLMSYRPPVNTRTIA----GVKG- -------------------------KRSNGETEIVLNW-------------------ITPH -QKWGIHSTYSDNLLMLTLSR---------------GGPIVWLSEIDAKRAGIEDNDWI-- ----------------ECFNVNGALTARAVVSQRVKEGMVMMYHAQE-------------- ---RIVNVP-GSETTKTRGGHHNSVT---RVVLKPTHMIGGYAQ---------QAYGFNYY -GTV-GCNRDEFVVVRKMV-------KVDW---LDGSSGDDLPRPLPTDIEEN-------- ----- ->NarG_Pseudomonas_stutzeri_gb_AAZ43099 ------------------------------------------------------------- ----MSH--------LLDQLRF--FNRKQG--EFA-DGHGETRIESR------DW-ENVYR -SRWQY------DKIVRSTHG-VNCTGSCSWKIYVKNGLITWETQQTDYPRTR-----NDL -PNHEPRGCPRGASYSWYIYSANRLKYPKVRKPLLK---------LWREARRN--MTPVDA -WASIVEDKAKAESYKSKRGMGGFIRSSWDEVNEIIAAANVYTVKQY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPASPQIWGEQTDVPESADWYNSNYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAITPDYAEVAKLTDLWLNPKQG-TDAALAQAFAHVIFKEFHL----E -KPSEYFRDYAKRYTDLPVLVRLN-----EKDGSYIADRFLR---------ASDLADN-LG -QENNPEWKTIAVDGSTGELVSPLGSIGYRW---------GEKGKWNIEARE--G------ --------KDGRDVDLSLTQI------E---------GGETAEVAF---PYFGGIL----- -----------------HEHFQHAEGESIQLRRVPVRTITLA-DGSTTKVATVFDL----- -------MAAN-LGIDRGL-------GGGNVASSYDDASVPGTPAWQEVITGVSREKAIQI -AREF------ADNADKTHGRSMIIVGAAMNHWYHMD-MNYRGLINMLMLCGCVGQTGG-G ---WAHYVGQEKLRPQC---GWLPLAFGLDWSRPPRQMNGTSFFYNHSSQWRHEKMSIHEV -------LSPLADKSQFPEHMLDYNIRAERAGWLPS-----APQLN-RNPLQICRDAEAAG -MSPV-----DYVTQSL-----KD---------------GSLKFACEQPDNPD-NFPRNMF -VWRSNLLGS---SGKGHEYMLKYLLGTKNGVMN-EDLGKRADGFKPTEAEWQDEGAIGKL -DLVTTLDFRMSSTCVYSDIVLPTATW--YEKDDMNTSDMH-PFIHP----L-SAAIDPAW -EAKSDWEIYKGIAKAFSKMAEGQLGVE-KDLVTVPLLHDSPGELAQPF----GGTDWKTA -GVDPQPGKNCPNMAVVERDY--PATYKKFTSLGPLLDKLGNGGKGINWNTQDEVDFL--- ------GELNYKVRDEGVSQGRPQIESAIDAAEVILSLAPETNGHVAVKAWAALSEF---- ------TGRDHSHLALPKE----H-EAIRFR-DIQAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHEYIPWRTIT------GRQQFFQDHPWMQAFGEQLMSYRPPINTR------------ -TIDYVK-------GKKSNGNP----------EIVLNW-------------------ITPH -QKWGIHSTYSDNLIMLTLSR---------------GGPIVWMSEVDAKKAGIEDNDWI-- ----------------ECFNANGALTARAVVSQRVMEGMVMMYHAQE-------------- ---RIVNVP-GAESTKTRGGHHNSVT---RVVLKPTHMIGGYAQ---------QAYGFNYY -GTV-GCNRDEFVVVRKMA-------KVDW---LDGPNGNDLPQPLPQDI----------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_1186915_16 rank: A; ocm:CBP12_03810 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------ETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYIYSANRVKYPKVRKALLK---------LWRE--ARKNLKPVEA -WASIVEDPVKAQSYKSKRGLGGFVRSSWDEVQELIAAANVYTTKTY----GPDRV-VGFS -PIPAMSMIS------YASGARYLSL----------------------------------- ----MGGACLSFYDWYCDLPPSSPMVWGEQTDVPESADWYNSNYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAITPDYSEVAKLTDLWLNPKQG-TDAALAQAFNHVIFKEFHL----E -KPSEYFTDYVRRTTDFPMLVLLD-----EHGEGYKTGRFLR---------ASDLTGQ-LG -QDNNPEWKTIALDELSGELVSPLGAIGYRW---------GEKGKWNIEAREG-------- --------SKGADTKLKLSLI------D------------EGQVAEVAFPYFGGDL----- -----------------HDHFQHVEGDNLQYRRIPVREVQLA-DGRSAKVATVFDI----- --------TAGGLAIDRGL-------GGKNVASSYDDASIPGTPAWQEQITGVTREKAIQI -AREF------ADNADKTKGRSMIIVGAAMNHWYHMD-MNYRGLINMLMMCGCVGQTGG-G ---WAHYVGQEKLRPQT---GWTPVAFGLDWHRPPRHMNGTSFFYNHSSQWRYEKMNMHDI -------LSPTANKAEFPEHALDYNIRAERAGWLPS-----APQLN-RNPLQICRDAKAAG -LSPK-----DYAVKAL-----QE---------------GSLRFSCEQPDNPV-NFPRNMF -VWRSNLLGS---SGKGHEYMLKHLLGAEKHGVI---GDETAAGFTPKDVDFSQEGARGKL -DLVTTLDFRMSSTCVYSDIVLPTATW--YEKDDMNTSDMH-PFIHP----L-SAAIDPAW -EARSDWEIFKGIAKKFSELSVGHLGVE-QDLVTIPMQHDSVGELAQPF----GGLDWKTT -GEPLVPGKNAPNMVVVERDY--PNTYKKFTSLGPLLNTQGNGGKGISWNTDDEVEFL--- ------GDLNHRVLDEGVSEGRPQMLSAIDAAECVLSLAPETNGHVAVKAWAALSEF---- ------TGRDHSHLAVGKE----H-ESIRFR-DIQAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHELIPWRTIT------GRQQFYQDHPWMQAFGEQLMSYRPPVSTRSIE----KVQG- -------------------------KMSNGNPEIALNW-------------------ITPH -QKWGIHSTYTDNLLMLTLSR---------------GGPIVWMSEVDAQKVGIEDNDWV-- ----------------ECFNANGALTARAVVSQRVKEGMIMMYHAQE-------------- ---RIVNVP-GAESTKTRGGHHNSVT---RVVLKPTHMIGGYAQ---------QAYGFNYY -GTV-GCNRDEFVVVRKMN-------KVDW--LEGSDTDDLPQPLPQNI------------ ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_2341297_11 rank: C; pbm:CL52_03700 narZ; nitrate reductase; K00370 (db=kegg) ------------------------------------------------------------- ----MSR--------LLDQLRF--FKRKQD--EFA-DGHGETRIENR------EW-ENGYR -ARWQY------DKIVRSTHG-VNCTGSCSWKIYVKNGLITWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYIYSANRLKYPKVRKPLLK---------LWRE------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0000931_1 rank: A; reu:Reut_B5002 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLRF--LSRTKE--TFS-DGHGAVVDEDR------SW-ENAYR -GRWQH------DKIVRSTHG-VNCTGSCSWKVYVKNGLITWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYVYSAQRVKYPLVRGRLME---------MWRE--ARQTMSPTDA -WESISQDPVKAKRYKSVRGQGGFVRASWDDVSEIIAAANAFTIKEF----GPDRV-LGFS -PIPAMSMVS------YAAGARYLSL----------------------------------- ----IGGACLSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSTYLMVWGSNVPQTRTPDAH -FYTEVRYKGTKTVAVSSDFGEMVKFGDIWLAPKQG-TDAALAMAMGHVILKEWHT----S -AQSDYFTRYVKQYTDLPMLVILK----LGKSGQLVPDYFLR---------ASHLSLA--E -QANNPEWKTLLIDCASGELIAPNGSIGFRW-----GESGDKVGRWNLELKDGGSARAIDP -CLS----LIDSHDDIVEVGF----------------------------DYYGGKD----- -------------------------ADDVLLRRVPAKRVKLA-DGSEALVTTVFDL----- -------TMAN-YGVDRGL--------GGGNVAMSYDDDVPYTPAWQERHTGVKRNLVIQV -AREF------AQNAHDTQGKSMVIVGAALNHWYHND-MIYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTPLAFAGDWVRPPRHMNGTSFFYNHTSQWRHEKLALDEI ------LAPTADAGPYSKLALLDLNAKAERLGWLPS-----APQLE-TNPLDIVDAADSKN -MDPV-----KYAVEEI-----KA---------------GRLNFSCDEPENPK-NFPRNLF -VWRSNILGS---SGKGHEYFLKYLLGTQNALFG------DERDGIKPGEVKAGEAVEGKL -DLLTVLDFRMSTTCLYGDIVLPSATW--YEKDDLNTSDMH-PFIHP----L-SEAVQPLW -QSKSDWEIYKTIAKKFSEIAGPYLGTR-KDLVLTPLLHDTPGELGQPF----EPKDWKHG -ECEPIPGKTMPQMTVVERNY--GDVYKKFTSIGPLLEKSGNGGKGIGWNTEHEVKEL--- ------AALNKLVTEPGVSQGRPKLETAIDAAEMILTLAPETNGHVAVKAWDALGKI---- ------TGRDHKHLAEGRD----H-DKIRFR-DVQAQPRKIISSPTWSGLESEEVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHRWMLDFGEGLCIYKPAINTRTIE--P--MLG- -------------------------KHANGNAELVLNW-------------------ITPH -QKWGIHSTYTDNLRMLTLSR---------------GGPHVWVSEIE-------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0004490_1 rank: C; cuh:BJN34_33750 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------K--------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------HAN------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------------GNEELVLN-------------- ------------------------------------------------------------- ---------------------------------------------------W--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------------------------------ITPH -QKWGIHSTYTDNLRMLTLSR---------------GGPHVWVSEIEAKQAGIRDNDWV-- ----------------EVFNVNGTLTARVVVSQRVPVGMCLMYHAQE-------------- ---KIVNVP-GAETSGMRGGIHNSVT---RTVTKPTHMIGGYAQ---------LAYGFNYY -GTV-GSNRDEYVIVRKMK-------KVDW---LEGALKEEGEQA---------------- ----- ->littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_6 rank: A; aql:BXU06_02425 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- -------------------------MAACR------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------DWYCDLPPASPQIWGEQTDVAESADWYNSNYLMVWGSNIPMTRTPDAH -FYTEVRYKGTKTVAVSSDFGEMAKFGDIWLAPKQG-TDAALAMAMGHVIFKEFHL----D -RPSDYFTGYIRQYTDMPMLVMLKQ----DAAGRYLPDYFLR---------ASHLAGN-AD -QAHNPEWKTLVLDETSGNLAVPNGSAGFRW---------DQSGKWNLEEKA--G------ --------INSQPVKAQLSLI------A--------QSDEVVEVGF---PYFGAEH----- --------------------------DELITRRVPVRHIVLA-DGSTARVATVFDL----- -------MAAN-YGIDRGL--------GGGNVACSYLDDVPYTPAWQHKHTGVKPEMVIQV -AREF------AQNADQTHGRSMVIVGAALNHWYHMD-MTYRGIINMLMLCGCIGQSGG-G ---WCHYVGQEKLRPQT---GWAPLAFAGDWNRPARQMNGTSFFYAHTSQWRHEKLGVNEI -------LSPTADGKMANMALIDYNAKAERMGWLPS-----APQLT-TNPLDVTRHAAAAG -QDPI-----TYAVEQL-----KS---------------GQLDMACNDPDNPK-NFPRNLF -VWRSNILGS---SGKGHEYFLKYLLGTQNAVMN-----SEEGCVKPSEITVRPAA-EGKL -DLLVVLDFRMSTTCLYGDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-SEAVQPLW -QAKSDWEIYKGFAKAISEVGGEYLGVQ-QDLVLTPLMHDTPEELGQPF----DPRDWKKG -ECEPIPGKTMPKMTVVERDY--RKIHDKFTSIGPLLEKVGNGGKGIGWQTGHEVDVL--- -------RGLNKTVASGVAAGQPRLDTAIDAAEMILTLAPETNGHVAVKAWAALSKI---- ------TGRDHTHLALPRE----H-DSIRFR-DVQAQPRKIISSPTWSGLESEEVSYNAGY -TNVHEYIPWRTLT------GRQQFYQDHLWMRAFGEGLCLYKPHVDLK--T--TAAILG- -------------------------KKPNGHHEIVLNW-------------------ITPH -QKWGIHSTYSDNLRMLTLSR---------------GGPHVWVSEIDAKKAGIVDNDWI-- ----------------EVFNVNGTLTARAVVSQRVPEGMSLMYHAQE-------------- ---KIINVP-GAETSGKRGGIHNSVT---RTVVKPTHMIGGYVQ---------LAWGFNYY -GTV-GSNRDEFVIVRKMK-------NVDW---LDQPLSEHA------------------- ----- ->littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_7 rank: C; aql:BXU06_02425 nitrate reductase subunit alpha; K00370 (db=kegg) -MEYARLVTHLAESENSRACFFLAPLLSNYPTLPPLPPPRSPSDQWAVCLRLLTIGGIGTG -LSGPANPLEARMSHFLDRLNF--LGKVKS--TFS-DGHGAVVKEDR------KW-EDGYR -QRWQH------DKIVRSTHG-VNCTGSCSWKVYVKNGLITWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYVYSAQRVKYPMVRGVLMQ---------HWRE--LRKKLGPIEA -WQRISQTPEIATQYKTQRGQGGFVRASWDEVNEIIAASNAFTIKNY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------I---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------G ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----GVPRLVL------------------------------------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.15_k121_1272084_2 rank: A; chrm:FYK34_01610 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLKF--MSKVKA--TFS-NGHGAVVKEDR------QW-EDAYR -QRWQH------DKIVRSTHG-VNCTGSCSWKVYVKNGLITWETQQTDYPRTR-----ADL -PNHEPRGCPRGASYSWYVYSAQRVKYPMVRGKLMQ---------MWREARKS--MGAIDA -WESISQNPEKAKEYKSRRGQGGFVRASWDEVNEMVAAANAYTIKNY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVPLSFYDWYCDLPPASPQIWGEQTDVAESADWYNSTYLMVWGSNVPMTRTPDAH -FYTEVRYKGTKTVAVSSDFGEMAKFGDIWLAPKQG-TDAALAMAMGHVIFKEFHL----D -KQSSYFTDYIRRLTDMPMLVRLK-----EEGGRYLPEYFLR---------ASHLEGG-LG -EDNNPDWKTLLIDENTGDIVAPNGSIGFRW-----GQPEGKTGKWNLEHRDGAT------ --------AREIQGQLTLLGQ------Q----------DEVVGVGF---PYFGAEH----- --------------------------DELLTRNVPAKRITLA-DGSTALVATVFDL----- --------MAANYGIDRGL--------GGGNVASSYMDDVPYTPAWQQKHTGVKPEMVIQV -AREF------AQNADQTQGKSMVIVGAALNHWYHMD-MTYRGIINMLMLCGCIGQSGG-G ---WAHYVGQEKLRPQS---GWAPLAFGADWNRPARQMNGTSFFYAHTSQWRHEKLGVNEI -------LCPTADGSMANMSLIDYNAKAERMGWLPS-----APQLS-TNPLDITRQAEAAG -QDPV-----AYTVQGL-----KD---------------GTLDMSCNDPDNPK-NFPRNLF -VWRSNILGS---SGKGHEYFLKYLLGTQNALMS-----DEANCITPTEITVRPAA-EGKL -DLLVVLDFRMSTTCLYGDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-SEAVQPLW -QSKTDWEIYKGFAKAISEVGGDYLGVQ-KDLVLTPLMHDTPQELGQAF----DPRDWKKG -ECEPIPGKTMPAMTVVERDY--KAIYQKFTSIGPLMEKAGNGGKGMAWKTGHEIEKL--- -------RAMNKVVQDGVAKGQPRLDTAIDAAEMILTLAPETNGHVAVKAWESLSKI---- ------TGRDHTHLAIPRE----H-DHITFR-DIQAQPRKIISSPIWSGLESEEVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHQWMRAFGEGLCLYKPPVDLKT----------- -TAAVHR------------------HKPNGNTEILLNF-------------------LTPH -QKWGIHSTYSDNLRMLTLSR---------------GGPHVWISEKDAQEAGIVDNDWI-- ----------------EVFNVNGTLTARAVVSQRIPKGMTLMYHAQE-------------- ---KIVNVP-GAEMSGKRGGIHNSVT---RAVTKPTHMIGGYAQ---------YSYGFNYY -GTV-GANRDEFVVVRKMK-------NVDW---MDQPK----------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_3271_6 rank: C; fpho:SHINM1_007130 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------T -ASHQAMMNSRS-----------------------------------------------NG -NPEIA------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------------LN------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------F------------------------------------- ------------------------------------------------------------- ---------------------------------------------------------ITPH -QKWGIHSTYTDNLIMLTLSR---------------GGPCVWVSEVDATKIGLVDNDWV-- ----------------EAFNANGALCARVIVSQRVPEGMMMMYHAQE-------------- ---KIVNVP-GSEIMNTRGGIHNSVT---RAVVKPTHMIGGYAQ---------LSYGFNYY -GTV-GSNRDEFVILRKMN-------KVDWMDDEASPAGENS------------------- ----- ->nebranchanacostia_2019_sw_WHONDRS-S19S_0081_B_bin.6_k121_1546998_5 rank: A; fpho:SHINM1_007130 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FIDRLKF--LSADKE--HFS-DGHGQTTTENR------AW-EDAYR -KRWQH------DKIVRSTHG-TNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDM -PNHEPRGCARGASYSWYLYSANRVKHPMVRSSLLK---------AWRK--HRQTLSPVAA -WEAVVSDPKTVRRYQSERGKGGFLRTSWDEVNDMVAAANIYTAKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQTWGEQTDVPESADWYNSTYIMMWGSNVPQTRTPDAH -FMAEVRYKGAKVVSVFPDYSEGAKFGDMWLHPKQG-TDAALAMAMGHVILKEFHV----A -GKSEYFDNYCRQYTDMPNLVCL-----VEKDGAYVPDRYVR---------AADLVGA-LG -EANNPDWKTLVIDEASDALTVPVGSIGFRWGQEKDGAPTADKGKWNLKEET--------- --------SDGRQIKPRLSLV------K--------HHDAVVEAAF---PYFGNIA----- -----------------HEHFNSTSHSDVLKRRVPVRKIQTA-QGE----MLVATV----- ----YDLYVAN-YGVDQGL--------GGDNVASSYDDDIPYTPAWQEKITGVPRDQVTQV -AREF------AQNAHDTHGKSMVIIGAAMNHWYHMD-MNYRSIMNMLIMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWNRPPRHMNSTSFFYAHTDQWRYETLRVADL -------LSPLADKGKFSGSLIDFNARSERMGWLPS-----APQLE-RNPLELSREAIAKG -LDPK-----EYVVNQL-----KS---------------GELKFSCEDPDNPK-NFPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTTNGVQG--KDLGHTGEVKPQDVVWHDEAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWEIYKGFAKRFSELS---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------DGYLGVEKDIVAVPIL--HDTAGE- ------------------------------------------------------------- -----IAQPYDTKDWKK-------------------GECEA-IPGKTMPNFVVVERNYSEI -H--------------EKFTSLGPLLDK--------------------------------- -------------------------------------------------------LGNGGK -GIN-------------------------W---NT-------------------------- ----- ->lecontecreek_2019_sw_WHONDRS-S19S_0018_A_bin.2_Ga0451754_0000231_3 rank: A; fpho:SHINM1_007130 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FIDRLKF--LSADKE--HFS-DGHGQTTTENR------SW-EDAYR -KRWQH------DKIVRSTHG-TNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDM -PNHEPRGCARGASYSWYLYSANRVKHPMVRSSLLK---------AWRK--QRQTLSPVAA -WEAVVSDPKTVRRYQSERGKGGFLRTSWDEVNDMVAAANIYTAKKH----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPASPQTWGEQTDVPESADWYNSSYIMMWGSNVPQTRTPDAH -FMAEVRYKGAKVVSVFPDYSEGAKFGDMWLHPKQG-TDAALAMAMGHVILKEFHV----A -GKSEYFDNYCRQYTDMPNLVCM-----VEKDGAYVPDRYVR---------AADLIGA-LG -EANNPDWKTLVIDEESDALTVPVGSIGFRWGQDKDGAPTADKGKWNLKEET--------- --------TDGRKIKPRLSLV------Q--------KHDAVVEAAF---PYFGNIE----- -----------------HEHFNNTSHSDVLKRRVPVRKIQTA-QGE----MLVATV----- ----YDLYVAN-YGVDQGL--------GGDNVAGSFDDDVPYTPAWQEKITGVPRDQVTQV -AREF------AQNAHDTHGKSMVIIGAAMNHWYHMD-MNYRSIMNMLIMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWSRPPRHMNGTSFFYAHTDQWRYETLRVADL -------LSPLADKNKFSGSLIDFNARSERMGWLPS-----APQLE-RNPLDLTREAIAKG -VDPK-----EYVVNQL-----KS---------------GELKFSCDDPDNPK-NFPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTTNGVQG--KDLGQTGDVKPQEVVWRDEAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWEIYKGFAKRYSELSDGYLGVE-KDLVAVPILHDTAGEMAQPY----DAKDWKKG -ECEAIPGKTMPNFVVVERNY--SEIYEKFTSLGPLLDKLGNGGKGINWNTDHEIKLL--- ------GELNYKVRNEGVAHGRPNIDTDIDATEVVLTLAPETNGEVAVKAWAALSEF---- ------TGIDHRHLALTRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESEHVSYNAGY -TNVHELIPWRTLT------GRQQLYQDHEWMRAFGEGFCSYKPPVDLRSHQ--Q--VMN- -------------------------AKPNGNKEIALNF-------------------ITPH -QKWGIHSTYTDNLIMLTLSR---------------GGPIVWLSEVDAQKVGIEDNDWI-- ----------------EAFNSNGALCARAVVSQRVPEGMVMMYHAQE-------------- ---KIVNVP-GSEITQTRGGIHNSVT---RAVLKPTHMIGGYAQ---------LSYGFNYY -GTV-GSNRDEFVVVRKMN-------KVDW---MDGPAQPAMEA----------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_493_9 rank: A; fpho:SHINM1_007130 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FIDRLKF----FVTPTEGFA-DKHGATVDEDR------TW-EDGYR -KRWQH------DKIVRSTHG-TNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDM -PNHEPRGCQRGASYSWYLYSANRVKYPMVRSPLLK---------LWRE--KRKMLAPVDA -WKAITDDHNAVRSYQSQRGLGGFLRTTWDEVNEMIAAANVHTIKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCTSFYDWYCDLPPSSPQMWGEQTDVPESADWYNSTYIMMWGSNVPQTRTPDAH -FMTEVRYRGTKVVSVFPDYAEGSKFGDLWLHPKQG-TDAALALAMGHVIVNEFHV----K -NKSDYFDQYCRQYTDMPNLVKL-----VKQGDYYVPDRLVR---------CSDFTDN-LG -QDNNPDWKTVVIDENTNMLTVPVGSIGFRW----GQKEGEDLGKWNLQEKN--------- --------AAGADIRPRLSLI-----------------GGHDGVVLVASPYFGNQQ----- -----------------HDHFQHTDHANILPHNIAVRKLQSR-DGE----ILVASV----- ----YDLFVAN-YGVDQGL--------GGPNVASSYDDDIPYTPAWQEKITGVKRHLVIQV -AREF------ADNADKTHGKSMVIVGASLNHWYHMD-MNYRSVINMLVMCGCIGQSGG-G ---WAHYVGQEKLRPQI---GWAALAFATDWHRPPRQMNGTSFFYAHTDQWRYETLSVKKI -------LSPLADPKKFSGSLIDFNVRSERMGWLPS-----APQLQ-TNPLQVCRDAQKAG -MSAK-----EYAVAQL-----KS---------------GKLRFSCEDTDHPD-NYPRNMF -IWRSNLLGS---SGKGHEYFLKHLLGTTHGVQG--KDLGQSGGQKPEEVVWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----F-SAAVDPAW -MARSDWEIYKGIAKKFSELTEGHLGVE-QDLVTVPIMHDTPDELGQAF----EPKDWKRG -ECEAVPGKTMPNFVLVERDY--PNTYKKFTALGPLMDKLGNGGKGINWNTQHEVKHL--- ------GELNYLVSEEGVTKGRPKIETDIDATEVILMLAPETNGEVAVKAWDALSKF---- ------TGIDHTHLAKTRE----D-EKIRYR-DIQAQPRKIISAPTWSGIESEHVSYNAGY -TNVHELIPWRTIT------GRQQLYQDHHWMRAFGEALCVYKPPIDTASHQ----AMMN- -------------------------SRSNGNPEIALNF-------------------ITPH -QKWGIHS----------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->logan1_2019_sw_WHONDRS-S19S_0097_B_bin.20_k121_1372227_2 rank: A; aep:AMC99_00129 Respiratory nitrate reductase alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------F-GNLEH -DHFQG----------------------------------------TDHPSVLK----RRV -PVREVQL-KDGKAFVATVFDLFCANYGL-------------------------------- -----------------DRGLGG-----------------EHVARDY-------------- ------------------------------------------------------------- ----------------GAMEPYTPAWA---------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------E--------------------------------- ------------------------------------------------------------- ------------------------------------------------KITGVPADQIITI -AREF------ASNAEVTKGKSMVILGAGLNHWYHMD-MNYRGIINLLVMCGCVGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWNRPPRHMNSTSFFYAHTDQWRYETLGVEEI -------LSPTAPEGDWDASLIDYNARAERMGWLPS-----APQLK-TNPLEVGKAIKASG -KDAK-----DYVAEAL-----QS---------------GALEMSCFDPDDPA-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTAHGVQG--KDLGETGAQKPKEVKWHEEAPKGKL -DLLVTLDFRMSTTCVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-SAAVDPVW -ESRSDWDIYKGIAKKFSEIAPEVLGVE-HDVVLTPIQHDSPNEIAQAY----DVADWGHG -QVEAIPGKTMANVALVERNY--AELYQKFTALGPLMEKLGNGGKGIGWNTDHEVEGL--- ------RKLNGTVAADGPAKGMAQIETAIDAAEVILMLAPETNGEVAVKAWADLGKK---- ------TGLDHTHLALPKE----D-EKIRFR-DIQAQPRKIISSPTWSGIESEHVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHKWMRAFGEGLCVYRPPIDTKAVK--PML---- -------------------------DEAKDAPHVILNF-------------------ITPH -QKWGIHSTYTDNLLMLTLSR---------------GGPIVWMSEVDAAKAGLVDNDWV-- ----------------ETFNSNGALVARVVVSQRMKEGTLFMYHAQE-------------- ---KITNVP-GSPLTGQRGGIHNSVT---RAVLKPTHMIGGYVQ---------LAYGFNYY -GTV-GSNRDEYVIVRKLS-------KVDW---LEGALS-------EGETAA--------- ----- ->lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.6_k121_1211148_1 rank: A; emv:HQR01_12825 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLTF--FRHKKE--QFS-DGHGVTTAEAR------DW-EDSYR -KRWQH------DKIVRSTHG-VNCTGSCSWKIYVKGGIITWETQQTDYPRTR-----PEL -PNHEPRGCPRGASYSWYIYSAQRLKYPLIRKRLIK---------LWRA--ARKDLPPVAA -WASIQADPVKRKSYTAIRGHGGFVRSTWDEVNEIIAAANAYTAKKW----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNSGFLMLWGSNVPQTRTPDAH -FMTEARYRGAKVAVVSPDYAEATKFADLWLNPKQG-TDAALAMAMGHVILREFHL----D -RQVPYFEDYCRRYSDMPMLVRL-----IEQDGRLVPERLLR---------ASDFKGD-LG -EKNHPEWKSVAIDEARDEVVAPTGSAGFRW---------GDKGKWNLEEKD--------- --------GKGAEVKLRMTAI---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------LDKDH---------------------------------------- ------------------------------------------------------------- -----------------------------------DEVVEVA------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_F_bin.6_scaffold_35_30 rank: A; aep:AMC99_00129 Respiratory nitrate reductase alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLTF--FRQKKE--PFS-EGHGVTTAEAR------DW-EDGYR -QRWQH------DKVVRSTHG-VNCTGSCSWKIYVKGGIITWETQQTDYPRTR-----PEL -PNHEPRGCPRGASYSWYIYSAQRLKYPLIRKRLVK---------LWRA--ARKDLPPVAA -WASIQADPVKRKSYTAIRGHGGFVRSTWDEVNEIIAAANAYTAKNY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNSGFLMLWGSNVPQTRTPDAH -FMTEARYRGAKVAVVSPDYAEATKFADLWLNPKQG-TDAALALAMGHVILREFHL----D -RQVPYFEDYCRKYSDMPMLVRL-----VEQDGRLVPERLLR---------ASDFAGG-LG -ETNNPEWKCVAIDETSDEVVAPSGSVGFRW---------GEQGKWNLKEED--------- --------GRGEAVKLRMTAILDKDHDE---------------VVEVAFPYFGNRE----- -----------------HDHFQGTDHPDVLMKRVPVREMQLA-EGRAYVATV--------- ----FDLLCAN-YGLDRGL--------GGQHVARDYADGAPYTPAWAEKITGIPADAIVTT -AREF------AANAEATNGKSMVILGAGVNHWYHMD-MTYRGIINLLVMCGCVGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWNRPPRQMNSTSFFYAHTDQWRYETLGVGEI -------LSPTAPKGDWDASLIDYNVRAERMGWLPS-----APQLK-TNPLEVGRAARASG -LEPK-----DYIAQAL-----KG---------------GDLELSCMDPDDPA-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTAHGVQG--KDLGEMGGQKPREVKWHEEAPQGKL -DLLVTLDFRMSTTCVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-SAAVDPVW -ESKSDWEIYKGIAKTFSEVAPEVLGVE-QDLVLTPIQHDTANEIAQPF----DVADWGHG -EIEAIPGRTMATVALVERDY--PNLYNRFTALGPLMDKLGNGGKGIGWNTAAEVENL--- ------RRLNGVQDAGSPAAGMAKIETAIDAAEVLLMLAPETNGEVAVKAWDALSQF---- ------TGINHRHLALPKE----E-EKIRFR-DIQAQPRKIISSPTWSGLESEHVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHKWMRAFGEALCVYRPPIDTKAVK--PML---- -------------------------DQAEGRPHVVLNF-------------------ITPH -QKWGIHSTYTDNQLMLTLSR---------------GGPIVWMSEVDAAKAGLVDNDWV-- ----------------ETFNTNGALVARVVVSQRMKEGTLFMYHAQE-------------- ---KIVNVP-GSPLTGQRGGIHNSVT---RAILKPTHMIGGYVQ---------QAYGFNYY -GTV-GSNRDEYVIVRKLE-------KVDW------LEGALPEG--ENAA----------- ----- ->lewisrun_2019_sw_WHONDRS-S19S_0014_F_bin.22_scaffold_791_5 rank: A; aep:AMC99_00129 Respiratory nitrate reductase alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLTF--FRQKSE--TFS-DGHGLTTGEDR------HW-EDGYR -KRWQH------DKIVRSTHG-VNCTGSCSWKIYVKGGIITWETQQTDYPRTR-----PEL -PNHEPRGCPRGASYSWYIYSAQRLKYPLIRKRLVK---------LWREARRT--LPPVAA -WASIQADPVKRKSYTAIRGHGGFVRSTWDEVNEIIAAANAYTAKTY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNAGFLMMWGSNVPQTRTPDAH -FMTEARYRGTKVAVVSPDYAEATKFADLWLNPKQG-TDAALALAMGHVILREFHL----D -RQVPYFEDYCRRYSDMPMLVRL-----VEQDGRLVPERLLR---------ASDVKGG-LG -EGNNPEWKCVAIDEASDELVVPSGSAGFRW---------GEKGKWNLEEKD--------- --------GQGREVKLRMTAILDKDHDE---------------VVEVAFPYFGNRE----- -----------------HDHFEGTDHPDVLMKRVPVRQLDLT-EGR----AYVATV----- ----FDLLCAN-YGLDRGL--------GGEHVARDYAAMSPYTPAWGEKITGVPADAIITA -AREF------AANAEATNGKSMVILGAGLNHWYHMD-MNYRGIINLLVMCGCIGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWNRPPRQMNSTSFFYAHTDQWRYETLGVSEI -------LSPTAPKGDWDASLIDYNVRAERMGWLPS-----APQLK-TNPLEVGRAAKASG -MEPK-----DYVAQAL-----KG---------------GDLELSCLDPDDPA-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTAHGVQG--KDLGEMGGQKPQEVKWHDEAPQGKL -DLLVTLDFRMSTTCVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-SAAVDPVW -ESRSDWEIYKGIAKTFSEVAPEVLGVE-QDLVLTPIQHDTANEIAQPF----DVADWGKG -EVEPIPGKTMATVAVVERDY--PNLYKRFTALGPLMDKLGNGGKGIGWNTVTEVDNL--- ------RKLNGTVGDDGPTKGMARIDTAIDAAEVLLMLAPETNGEVAVKAWDALSQF---- ------TGRDHKHLALPKE----E-EKIRFR-DIQAQPRKIISSPTWSGLESEHVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHKWMRAFGEALCVYRPPIDTKAVK--PML---- -------------------------DQAEGRPHVVLNF-------------------ITPH -QKWGIHSTYTDNLLMLTLSR---------------GGPIVWMSEVDAAKAGLVDNDWV-- ----------------ETFNSNGALVARVVVSQRMKEGTLFMYHAQE-------------- ---KIVNVP-GSPLTGQRGGIHNSVT---RAILKPTHMIGGYVQ---------QAYGFNYY -GTV-GSNRDEYVIVRKLE-------KVDW---LEGALS-------EGENAA--------- ----- ->NASQAN2015_010_A_bin.16_Ga0466474_000034_25 rank: A; oca:OCAR_5043 nitrate reductase, alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLLF--FKKKVD--TFS-GTHGVVTNEDR------SW-ESSYR -SRWQH------DKIVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRLKFPMIRGRLVR---------LWRE--ARLSLDPVDA -WASIVEDPLKSAEYKSKRGLGGLVRANWDEVNEIIAAANIYTAKTF----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVSMSFYDWYCDLPPASPQTWGEQTDVPESADWYNAGFLMLWGSNVPQTRTPDAH -FMTEARYKGAKVVVVSPDYSEASKFADLWLHPKQG-TDAALAMAIGHVILKEFHV----E -GQSPYFNGYVRENTDLPFLVMLK-----EQDGYYVQDRFLR---------ASDFSGS-LG -QDNNPDWKTVAYDELNGQIVPPCGSIGFRW---------GESGQWNIEQKT--------- --------SDNQAVKLRLSLI------D-----------IKDEVASVGFPYFGGSE----- -----------------HPHFTHSAHDAIQKRNVPVKKIILA-DGTEVLATTVFDL----- -------LVAN-YGIDRGL--------GGGNVAASYDEDVPYTPAWQEKITGVSRSNVIAV -AREF------AINAEKTKGRSMVILGAGINHWYHMD-MNYRGIMNMLMLCGCVGQSGG-G ---WAHYVGQEKLRPQT---GWLPLAFGLDWKRPPRQMNSTSFFYNHTSQWRYETLKVSEI -------LSPTAKPEDWQGSLIDFNVKSERMGWLPS-----APQLQ-TNPLQVVRDAKAAG -IAPA-----DYVVAGL-----KN---------------GSLKMSCEDPDNPL-NFPRNMF -VWRSNLLGS---SGKGHEYFLKYLLGTQHGIQG---KDLGDDGDKPSEVVWHEKAAEGKL -DLLVTLDFRMSTTCLYSDIILPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -ESRSDWDIYKGIAKKFSELTIGHLGLE-QDIVTVPVLHDTPGELAQPF----EVKDWKKG -ECEPVPGKTMPSLVVVERDY--PNTYKMFTSLGPLLSKIGNGGKGIAWNTETEVKQL--- ------GELNYLVTEEGISKGLPRIASDIDATEVILMLAPETNGHVAVKAWEALSKI---- ------TGRDHTHLAKPRE----D-DKIRFR-DVQAQPRKIISSPTWSGLESEQVCYNACY -TNVHERIPWRTLT------GRQQFYQDHSWMRAFGETLCVYKPPVDTRSIT--P--ILG- -------------------------QKPNGNDELVLNF-------------------LTPH -QKWGIHSTYTDNLLMLTLSR---------------GGPIVWMGEIDAAKVGIKDNDWI-- ----------------EAFNVNGALVARAVVSQRVPEGMCMMYHAQE-------------- ---KIVNMP-GAETTGGRGGIHNSVT---RATLKPTHMIGGYAQ---------LSYGFNYY -GTV-GSNRDEFVIIRKMS-------KVDW---LEEPKPEQA------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0000093_1 rank: A; tun:J9260_09180 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- --------------NMLAMCG---CVGQSG------------------------------- -----------------------------------------------------------GG -WAHYV---------------------------------------------GQEKL----- ------------------------------------------------------------- --------------------------------------------------------RPQTG -WL------------------PLAFALDWSRPPRQM-NSTSFFY----------------- ------------------------------------------------------------- ------------------------------------------------------------- --------SHSNQWRYEKLEL---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------KEILSPL -ANPA------------------RHSGSLIDYNVRSE------------------------ ------------------------------------------------------------- -----------------------------RMGWLPS-----APQLN-TNPLRIAKAAQAAG -MSPA-----EYTVAAL-----KA---------------GKIAFAAEDPDNPQ-NFPRNLF -VWRSNLLGS---SGKGHEYMLKYLLGTQHGVQS--KDLGVMGGAKPEEVKWHDTAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-TAAVDPAW -EARSDWEIYKGIAKAFSKVCEGHLGVE-TDLVTLPLLHDAPAELGQAM----GVKDWKKG -ECELIPGKTAPALVAVERHY--PDTYARFTAIGPLLEKLGNGGKGISWNTETEVAFL--- -------GQLNHQQTTGINEGRPCLNSAIDAAEMILSLAPETNGQVAVKAWQALSKI---- ------TGIDHSHLAIHKE----D-EKIRFR-DVVAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHELIPWRTLT------GRQQFYLDHDWMRDFGESMLVYRPPINTKTIK--P--LLN- -------------------------QRSNGNPELALNW-------------------ITPH -QKWGIHSTYTDNLIMLTLSR---------------GGPIVWMSETDAKTLGIQDNDWI-- ----------------DLFNANGAIAARAVVSQRVMPGMVMMYHAQE-------------- ---KIVNVP-GSVITGHRGGIHNSVT---RVCPKPTHMIGGYAQ---------QAYGFNYY -GTV-GSNRDEFVIVRKMT-------QVEW---LDNE---------GNDYAQEAVQ----- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_1345490_1 rank: C; ops:A8A54_10745 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLN---FLARKNADTFS-DGHGVTTTENR------DW-EDAYR -KRWQH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYMYSANRVKHPLIRSRLLK---------LWRK------------ ------------------------------------------------------------- --------------------ERTIK------------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------------TPIGAWAAIQEN--------- --------PEKRADYMKMRGL---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------G ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_924190_1 rank: A; ops:A8A54_10745 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------FLARKNAGTFS-DGHGVTTTESR------DW-EDAYR -KRWQH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYMYSANRVKHPLVRSRLLK---------LWRK--ERTIKTPIGA -WAAIQENPEKRADYMKMRGLGGFVRATWEEVNEIIAAANAYTVKTY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGVCLSFYDWYCDLPPASPMTWGEQTDVPESADWYNAGFLILWGSNVPQTRTPDAH -FYTEVRYKGAKSVVVSPDYSEAAKFSDLWLHPKQG-TDAALAMAMGHVILREFHL----D -RQADYFEDYCRRYTDMPMLVKLTG----KDGHFIPD-RFVR---------ASDFTGA-LD -ETNNPEWKTVAVDAKTKQFVSPGGSIGYRW---------GEQGKWNLEAKDGKGADVDLA -MSFI---LDGEHDTIANVGF----------------------------PYFGNRE----- -----------------HDYFEGTDHDSVLVRKVPARKVKLA-DGEALVATV--------- ----FDLFVAN-YGLDRGL--------NDPNSAKSYQENLPYTPAWAEKITGVPRDQIIAV -AREF------ASNAEKTNGRSMVILGAGLNHWYHMD-MNYRGIINMLVMCGCVGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWNRPPRHMNGTSFFYAHTDQWRYETLKVDEI -------LSPTAPEGPWDASLIDYNIRAERMGWLPS-----APQLK-TNPLEVSKQAAAAG -KEAK-----DFVAEQL-----KA---------------GALSMSCEDPDDKA-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTKHGVLG--KDLGEEGRQISKEAVWHDEAPEGKL -DLLVTLDFRMSTTCVYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SSAADPAW -DARSDWEIFKGIARKFSEVAPEVLGVE-KDVVLVPTLHDTAGELAQPI----DVKDWKKG -EIEPIPGRTMPTVAVVERDY--PNLYKKFTSVGTLLDTVGNGGKGIAWNTEHEVDLL--- ------ARLNGVVQEEGVTRGRPRIESDIDATEVILSLAPETNGEVAVKAWEALSKF---- ------TGRDHTHLAIPKE----D-EKIRFR-DVVAQPRKIISSPTWSGLESEKVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHLWMRAFGEGFCVYRPPIDTKT----------- -VNPAIR------------------SKADGKPHLVLNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGPVVWISEPDAKRAGIVDNDWV-- ----------------EVYNTNGAIVARAVVSQRMKDGTVFMYHAQE-------------- ---KIVNTP-GSPITGQRGGIHNSVT---RVITKPTHMIGGYAH---------QSYGFNYY -GTV-GANRDEFVVVRKLE-------TVDW---LEGPHTESVAY--NKEAAE--------- ----- ->lecontecreek_2019_sw_WHONDRS-S19S_0018_F_bin.2_scaffold_1_206 rank: A; bprc:D521_0425 Respiratory nitrate reductase, alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLKF--LSADKE--EFS-DGHGVTVGEDR------TW-EDAYR -SRWQH------DKIVRSTHG-TNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYMYSANRVKYPMIRGRLLK---------QWREAKSVA-KSPVDA -WANLVENTAKRKEWMELRGKGGFVRSSWDEVNEIIAAANVYTIKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADIWMHPKQG-TDAAIAMAMGHVILKEFYF----N -KRTEYFDDYVRRYTDMPNLVMLEEKVLDDGRKVLVPGRYAR---------SSDFDGK-LG -QTNGADWKTVAFD-TAGKPVVPNGSIGFRW----GPEGRKDQGKWNLESKE--A------ --------NYGNDVKLKLSLMEDQSIHD------------VVPVGF---PYFGGID----- -----------------TPYFDANKQSDVLVQNIPAKKIILT-ENGVEKEVFVATV----- ----FDLLAGN-YGIDRGL---------GGECAKSYDDNVPYTPAWQESITGVKREQVIAV -ARQF------AENAEKTKGKSMVIIGAAMNHWYHCD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTPLAFALDWIRPPRQQNSTSFFYAHTDQWRYEKLGMEEV -------LSPLANKEEYTGSMIDFNVRAERMGWLPS-----APQLK-TNPLEVVKEALAAG -KDPK-----KYVVDGL-----KS---------------GTLQMSCEDPDHPS-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGADEARPSEVEWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -EARSDWDIYKGFAKKFSEVCVGHLGVE-KEIVMTPLMHDTPAELAQAF----DVQEWKKG -ECDLIPGKTAPQIAVVERDY--PNTYNRFTALGPLMDKVGNGGKGIAWDTKVEVEQL--- -------RELNGRVEHGEMKGMAKISTDIDAAEVVLMLAPETNGHVAVKAWDALSKI---- ------TGLEHAHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNACY -TNVHEYIPWRTLT------GRQQFYQDHKWMRAFGEGFVSYRPPVDLKTII--------- -----------EVKGIKPNGNK----------EIVLNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGPVVWLSEDDAVKAGIVDNDWV-- ----------------ELYNANGAIAARAVVSQRVNPGMVMMYHAQE-------------- ---KIINTP-GSEITGMRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVTVRKMR-------NIDW---LDTENANSVQA----------------- ----- ->whiteclaycreek2_2019_sw_WHONDRS-S19S_0038_B_bin.50_k121_1710496_1 rank: A; pde:Pden_4236 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLNF--LKSTRK-DTFA-DGHGQTTIENR------DW-EDTYR -SRWRH------DKIVRSTHG-VNCTGSCSWKIYVKNGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYLYSANRVKTPLVRGRLMR---------RWRDLRRT--LGPIEA -WTAIQSDPAARADYVKARGRGGFVRASWDEVTEIVAAANAYTAKTW----GPDRV-FGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNAGFLILWGSNVPQTRTPDAH -FYTEARYRGTKSAVVSPDYSEAAKFGDIWLNAKQG-TDAALAIAMGHVILREFHL----D -RQVDYFEDYTRRYSDFPMLVKLEP-----KGDRFVPGRMLR---------AADIDGA-LG -ETNNPDWKTVAIDDASGRLVAPNGSIGHRW---------GEQGTWNLEEKA--------- ---------GAESVRLRTTLI------------LDGQNDGTAGVDF---PYFGGSA----- -----------------TNGWQACDTPDVLTRAIPVRKVALK-DGE----AMVATV----- ----FDLLCAN-YGLDRGL--------GGDWVARDYGSDMPGTPAWAERITGVPADRIIQV -AREF------AANAEKTGGKSMIIIGAAMNHWYHMD-MNYRGVINMLVMCGCVGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWGRPPRHMNSTSAWYAHTDQWRYETVRSDEI ------LSPTAPAGDWSSLSLIDYNIRAERMGWLPS-----APQLR-TNPLQVAAAAKAEG -TEVR-----DYVAREL-----KA---------------GRLEMSCEDPDAPE-NWPRNLF -VWRSNLLGS---SGKGHEYFLKHLLGTDHGVLG--KDLGEEGRRKPVEARWHDKAPEGKL -DLLTCIDFRMSTTAVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-QAAVDPAY -ESKTDWEIFKAIAAKLSEIVPGYLGVE-TDVVQLPLQHDSPGEVAQPR-----VADWKQG -QCDLIPGKTAPAFIAVERDY--PNLYRRFTALGPLMEKAGNGGKGIAWDTKHEVAHL--- ------RALNGTVTDEGPTKGMARIDTAIDAAEVILMLAPETNGEVAVKAWEALSKA---- ------TGREHKHLALPKE----D-EKNRFR-DIAAQPRKIISSPTWSGIESESVCYNAGW -TNVHELIPWRTLT------GRQQLYQDHEWMLAFGEFFLAWRPPVDLKTIT--APATGA- -----------------LGANE---------KHVVLNF-------------------ITPH -QKWGIHSTYSDNLLMLTL------------------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.46_k121_495423_17 rank: A; acis:CBP35_16735 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLSY--FSQPRE--TFS-QGHGQTNGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLK---------HWRA-ALLLAKSPVDA -WANIVENESAKREWQKQRGLGGFVRSTWDEVNQMIAAANVYTIKKH----GPDRI-IGFS -PIPAMSMIS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSSFIIAWGSNVPQTRTPDAH -FLTEVRYKGTKVVSITPDYSEVAKLGDLWMHPKQG-TDAAVAMAMGHVILKEFYFKDGGK -GRSTYFDDYARRYTDLPLLVVLKEKTLPDGRTVMVPDRYVR---------ASDFPGQ-LD -QSNNPDWKTVGYD-ELGQVTLPNGSIGFRW----GADGRADEGLWNLENKE--A------ --------RTGNTVKLKLSVI------E--------DGEQAYDVADVAFPYFGGVQ----- ----------------TPNFTANEQGGDVMVRRVPVSHLELA-GHEAQGRVMVATV----- ----FDLLAGN-YGIDRGL--------PGEEPGGSYDADRPYTPAWQESITGVPREQIIAV -ARQF------ADNADKTHGKSMVIIGAAMNHWYHCD-MNYRGIMNMLMLCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWIRPPRQMNSTSFFYAHTDQWRYEKLGMEEI -------LSPLADKKSYSGSMIDYNVRAERMGWLPS-----APQLK-TSPLQVAKDAAAKG -MDAK-----DYVVQSL-----KD---------------GSLQMSCEDPDHPD-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTTHGVQG---KDLGRDEAKPEEVQWHANAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QAKSDWEIYKGFAKAVSEVSVGHLGVE-KDVVLTPIMHDTAGEMAQPY----GVRDWKKG -DCELIPGKTAPQVTVVERDY--PNLYKRFTALGPLMDKAGNGGKGIGWNTQTEVGQL--- ------GDLNGRVKEEGVTQGMPRIVSDIDATEVVLMLAPETNGHVACKAWEALGKQ---- ------TGRDHVHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYQDHPWMRDFGEGFVSYRPPVHLKALH----EVEG- -------------------------KKPNGNREIALNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGSVVWLSEDDAASAGIVDNDWV-- ----------------ELFNANGAIAARAVVSQRVNPGMVMMYHSQE-------------- ---KIINTP-GSEITGTRGGIHNSVT---RIVLKPTHMIGGYAQ---------YSYGFNYY -GTI-GTNRDEFVLVRKMD-------RVDWLDDEVSDTGAHA------------------- ----- ->lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.30_k121_510322_1 rank: A; hyb:Q5W_04195 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------QG------------------------------------------- ------------------------------------------------------------- -------------------------------------TDAALAMAMGHVVLKEFYFPAN-G -QRSSYFDDYARRYTDLPMLVMLKEQTLPDGSTTLVPDRYLR---------ASDFNGK-LG -QANNPDWKTVAFD-TTGKAVLPNGSIGFRW----GDQGREDAGKWNLESKE--A------ --------RDNGDVKLKLSVL------E-----DGAQDHQVVDVGF---PYFGGQQ----- ----------------TPNFPANAAVGDVNQAKVPAVRLRLG-KAGEERYALVATV----- ----FDLQVAQ-YGIDRGL----------GSGAKNYDDNAPYTPAWQETITGVPRQQVITV -ARQF------ADNADKTHGKSMVIIGAAMNHWYHAD-MNYRGVINLLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWLRPPRQQNSTSFFYAHTDQWRYEKLDVSEI -------VSPLADKAKFGGSMIDYNVRAERMGWLPS-----APQLK-TNPMQVVKDATAAG -MDPK-----DYVVQAL-----RD---------------GSLEMSCEDPDAPQ-NWPRNMF -VWRSNLLGS---SGKGHEYFCKHLLGTENGVQG---KDLGADEAKPTEVKWHKDAPQGKL -DLLVTLDFRMSTTCLYSDIVLPTASW--YEKNDLNTSDMH-PFIHP----L-SAAVDPVW -QSKSDWEIYKGFAKRFSEVCVGHLGVE-KEVVLTPLMHDTAAELAQPF----EVKEWKKG -ECELVPGKTAPQIAVVERDY--PNLYKRFTALGPLMNKLGNGGKGIGWKTEIEVEQL--- ------GQLNGVTREEGVTQGMPRIVSDIDACEVILQLAPETNGHVAVKAWDALGKQ---- ------TGRDHTHLALYRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHPWMVAFGEGFSSYRPPVDLK--T--TDVVQG- -------------------------LRPNGHKEIVLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGTVIWLSEDDAKSAGIQDNDWI-- ----------------ELFNVNGAVAGRAVVSQRVKNGMVMMYHSQE-------------- ---KIINTP-GSEITGVRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMQ-------KVDW---LDTP---------RDDHLVKAVQSQGEN -P--- ->yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_2728883_1 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------LYSANRVKYPLVRGRLLE---------RWRT-ALKTARTPVDA -WATIVENPDARRDYQKVRGMGGFVRSSWDEVNQLIAAANVYTIKKH----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQIWGEQTDVPESADWYNSTYIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAVTPDYSEVAKLADLWLHPKQG-TDAALAMAMGHVALNEFYF----K -QRSPYFDDYARRYTDLPLLVMLKEHILPDGSKTLVPDRYLR---------ASDFNGK-LG -QDNNPEWKTVAFD-AGGRAVLPNGSIGFRW----GAEGRSDAGKWNLENKE--A------ --------RHGAEVKLKLSVI------E--------DGTQAHEVVGVGLPYFGGVS----- ----------------TPHFTANAQQGEVNFVKVPAVRLRLG-KEGEQREALVATV----- ----FDLQVAQ-YGIDRGL----------GSGAKSYDDNAAYTPAWAESITGVPGDQIITV -ARQF------ADNAHKTRGKSMVIIGAAMNHWYHAD-MNYRGVINLLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWIRPPRQMNSTSFFYAHTDQWRYEKLGMEEI -------VSPLADKKLYGGSMIDYNVRAERMGWLPS-----APQLK-TNPLQVVKDATAAG -LDAK-----DYVVRGL-----RD---------------GTLQMSCEDPDAPQ-NWPRNMF -VWRSNLLGS---SGKGHEYFCKHLLGTESGVQG---KDLGKDDARPAEVAWHEHAPEGKL -DLLVTLDFRMSTTCLYSDVVLPTASW--YEKNDLNTSDMH-PFIHP----L-SAAVDPVW -QSRSDWEIYKGFAKAFSEVCIGHLGVE-KEVVLTPIMHDTAGEIAQPF----DVKEWKKG -QCELIPGKTAPQVTVVERDY--PNVFKRFTALGPLMDKLGNGGKGIGWKTGTEVEQL--- ------GQLNGTTQADGPTKGMPQIVTDIDACEVILQLAPETNGHVAVKAWQALGKQ---- ------TGRDHTHLALYRE----D-EKIRYR-DVQAQPRKIISSPTWSGIESETVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHPWMIAFGESMSSYRPPVDLKT----TSGIHN- -------------------------IKGNGNPEILLNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGPVVWLSEDDARLAGVQDNDWV-- ----------------EVFNINGAIAARAVVSQRVNPGMLMMYHAQE-------------- ---KIINTP-GSQITGVRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMS-------KVDW---LDTPR--------DDHLAAAYQAQGENP ----- ->yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_3072591_1 rank: C; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FTLPRE--RSA-DGHGVVTGEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLE------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------------------RWRAALTTARTPVDA -WAT--------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------IVENP------------ ------------------------------------------------------------- ------------------------------------------------------------- -DARRDYQKVRGMG----------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------G---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.19_scaffold_731_2 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FKLPQE--TYS-GRHGVATNEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLE---------RWRA-ALKVAKTPVDA -WALIADDESARRDYQQVRGLGGFVRSSWDEVNQLIASANVYTIKKH----GADRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPSSPQIWGEQTDVAESADWYNSSFIIAWGSNIPQTRTPDAH -FFTEARYKGTKTVAVTPDYSEVAKLSDLWLHPKQG-TDAALAMAMGHVILKEFYFKDGGQ -GRSAYFDDYARRYTDLPLLVMLKEHQLADGSTTLVPDRYLR---------ASDFSGQ-FG -QDNNPEWKTLAFD-TSGNPVLPNGSIGFRW---GEQLDEGELAKWNLESKD--A------ --------RNGQDVKLKLSVV------E--------DGAQPHEIAEVAFPYFGGVE----- ----------------TPNFPANAAQGEINRAKVPTVRLDLVGQGGESRQALVATV----- ----FDLQVAQ-YGIDRGF----------GSGAIDYDDNVPYTPAWQESITGVPRDQVITV -ARQF------ADNADKTHGKSMVIIGAAMNHWYHAD-MNYRGVINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWAPLAFALDWIRPSRQMNGTSFFYAHTDQWRYEKLGVEEV -------LSPLADKAAFGGSMIDYNVRAERMGWLPS-----APQLK-THPMQVVKDASAAG -LDAK-----DYVARAL-----KD---------------GSLQMSCEDPDAPQ-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSNGVQG---KDLGADEAKPTEVKWHAKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTASW--YEKNDLNTSDMH-PFIHP----L-SAAVDPVW -QAKSDWEIYKGFAQAFSEVCVGHLGVE-KEVVLTPLMHDTPAELAQPF----GVQDWKKG -ECALIPGKTAPQVTVVERDY--PNTYKRFTALGPLMNKLGNGGKGIAWKTDLEVTQL--- ------GQLNGVTLEEGVTKGMPKIVTDIDACEVILQLAPETNGHVAVKAWEAQSKA---- ------TGRDHVHLALYRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHEYIPWRTLT------GRQQFYQDHPWMIAFGEGFSSYRPPVDLK-----TTGGLS- -------------------------IKSNGNAEIQLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGTVIWLSEEDATKVGIVDNDWI-- ----------------ELFNSNGAIVGRAVVSQRVKPGMTMMYHSQE-------------- ---KIINTP-GSEITGARGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDWLEEPAGAPASGAGH----------------- ----- ->eastforkpoplarcreek_2019_sw_WHONDRS-S19S_0039_B_bin.13_k121_238651_23 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FKLPRE--AFS-GDHGLTTNEDR------TW-EDAYR -NRWAH------DKVVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLE---------RWRA-ALKVAKTPVDA -WALIAEDDAARRDYQQVRGMGGFVRSSWDEVNQLIASANVYTIKKH----GADRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPSSPQIWGEQTDVAESADWYNSNFIIAWGSNVPQTRTPDAH -FLTEARYKGTKTVAVTPDYSEVAKLSDLWLHPKQG-TDAALAMAMGHVVLKEFYFKDGGK -GRSAYFDDYARRYTDLPLLVMLKEHKLPDGSITLVPDRYLR---------ASDFNGK-LG -QGNNPEWKTVAFD-ADGRAVLPNGSIGFRW---GEKLGEGETPKWNLESKE--A------ --------RHGQDVKLKLSVV------E--------EGEQEHEIAEVAFPYFGGVQ----- ----------------TPNFPANSAQGEINRAKVPAVRLRLG-KEGDERYALVATV----- ----FDLQAAQ-YGIDRGF----------GSGAASYDDNAPYTPAWQEAITGVPRDQVVTV -ARQF------ADNADKTQGRSMVIIGAAMNHWYHSD-MNYRGVINLLMMCGCIGKSGG-G ---WAHYVGQEKLRPQT---GWAPLAFALDWIRPSRQMNSTSFFYAHTDQWRYEKLGMEEV -------ISPLADRKIYDGSMIDYNVRAERMGWLPT-----APQLK-TNPMQVVRDAAAAG -LDAR-----DYVAKAL-----KA---------------GTLQMSCEDPDAPQ-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSNGVQG---KDLGAGDAKPSEVKWHASAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTASW--YEKNDLNTSDMH-PFIHP----L-SAAVDPVW -QSRSDWEIYKGFAKAFSEVCVGHLGVE-KDVVLTPLMHDTPAELAQPF----EVKDWKKG -ECELIPGKTAQQITVVERDY--PNTYKRFTALGPLMNKLGNGGKGIAWKTELEVTQL--- ------GQLNGVTLEEGVTQGMPRIVSDIDACEVILQLAPETNGHVAVKAWDALGKV---- ------TGREHKHLALYRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHEYIPWRTLT------GRQQFYQDHPWMIAFGEGFSSYRPPVDLKT----TAEIAG- -------------------------VKPNGNPEIQLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEEDAAKAGIVDNDWV-- ----------------ELFNVNGAISARAVVSQRVKPGMTLMYHAQE-------------- ---KQINTP-GSEITGMRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDW---LDEPAGTAGSGH---------------- ----- ->cobbmillcreek_2019_sw_WHONDRS-S19S_0090_B_bin.15_k121_168873_1 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FSQPKE--TFS-GDHGLTTGEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPMVRSRLLE---------RWRA-AMKTAKTPVDA -WATIVEDDAARRDYQKVRGMGGFVRSSWDEVNQIIAASNVYTIKKH----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWG--------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->NASQAN2011_265_B_bin.52_k121_959771_6 rank: A; pzh:CX676_21060 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------GEQTDVPESADWYNAGFLMLWGSNVPQTRTPDAH -FYTEVRYRGTKSAVVSPDYSEAAKFGDIWLNPQAG-TDAALAMAMGHVILREYHL----D -RQAEYFEDYARKYTDMPMLVRLE-----DRDGHLVPGRMLR---------AEDFDGK-LG -ETNNPDWKTVAYDEATGQIAVPNGSIGFRW---------GEEGKWNLEQRA--------- ---------KGAEANLRLSQILDGHHDE---------------IVGVDFPYFGGVA----- -----------------TGDFVKCDHPEVLTRNIPARRAKLA-DGSQVLAATVFDL----- -------FCAN-YGLDRGL--------GGKWVSKDFNDDSPYTPAWAEKITGVAREKIIAV -AREF------AGNAEKTHGKSMVILGAGLNHWYHMD-MNYRGIINMLVMCGCIGQEGG-G ---WSHYVGQEKLRPQT---GWAPLAFALDWNRPPRQMNSTSCWYAHTDQWRYETLRAGEI -------LSPTAPEGDWHISLIDYNIRAERMGWLPS-----APQLK-TNPLEVAKAAKAA- ----------GKAIPAYVAEQLKS---------------GALQMSCEDPDAPE-NWPRNLF -VWRSNLLGS---SGKGHEYFLKHLLGTDHGVMG--KDLGEEGGVMPKEAVWHDEAPKGKL -DLLVTIDFRMSTTCVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-QAAVDPAY -ESKSDWEIFKSIARKFSEVAPEVLGVE-TDIVQLPLLHDTPGELAQAH-----VRDWKKG -ECDLIPGKTAPNYIAVERDY--PNLYKKFTSVGPLLEKLGNGGKGINWDTKVEVGHL--- ------RDLNGVVQDEGVSKGMAKLDTAINAAEMILMLAPETNGEVAVKAWEELEKP---- ------TGRHHAHLAEGAH----H-TKIRFR-DVAAQPRKIISSPTWSGIESETVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHLWMRAFGEGFVSYRPPVDLKTI---TKAVNN- -------------------------DAAEGNPHVVLNF-------------------ITPH -QKWGIHSTYTDNLLMLTLNR---------------GGPVVWMSEVDAQKARLVDNDWV-- ----------------EAYNINGALTARVVVSQRIKQGTLFMYHAQE-------------- ---KIVNTP-GSEKTGHRGGIHNSVT---RTTLKPTHMIGGYAQ---------LSYGFNYY -GTV-GSNRDEFVIVRKMK-------KVDWLD-TPATHKVEAAE----------------- ----- ->NASQAN2011_265_B_bin.52_k121_465271_4 rank: C; pzh:CX676_21060 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLNFFQSKELEQ---FS-DGWGQTTRENR------DW-EDVYR -NRWRH------DKIVRSTHG-VNCTGSCSWKIYVKSGIVTWETQQTDYPRTR-----AGL -PNHEPRGCARGASYSWYLYSANRVKNPLIRGALMR---------AWRK--MRPTMTPVAA -WAAIQNDPVLRASYTKTRGKGGFVRATWDEATEIIAAANAYTAKTY----GPDRV-FGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPQTWGEQTDVPESADWYNAGFLMLWGSNVPQTRTPDAH -F----------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.45_k121_975195_1 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLSH--FSAPKE--EFA-DGHGVATGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----ADL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLQ---------HWRA-ALLVAKSPVDA -WASIVENPQARAEWQKQRGLGGFVRSTWEEINQLVASANVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAVAMAMGHVILKEFYF----D -KRSAYFDNYVRRYTDMPNLVQLEERTLPDGRKVMVPGRYLR---------ASDFDGK-LG -QSNNPEWKTVALD-QDDKIVLPNGSIGFRW----GAAEREDLGKWNLENKE--A------ --------RGDTQVTLKLSLM------E----GAKDGSAADYEVGDVGFPYFGGID----- -------------TPNFDANKQSAAVGDVLVRKVPVRRVKLG-KAGEERYALVATV----- ----FDLTVAN-YGVARGL--------PGENAALSYDDDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFA--------------------------------- -----------------------------------------------LDWVRPPRQMNSTS -FFY------------------AH------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------TDQWR--------------------------------- ------------------------------------------------------------- -----------------------Y------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------ERLGVDE------ ------------------------------------------------------------- -------------------------------ILSPL------------------------- --------------ADKSK------------------------------------------ ----- ->NASQAN2015_172_B_bin.54_k121_327740_1 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------IWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAIAMAMGHVILKEFYF----D -KRSAYFDDYVRRYTDMPNLVQLEERTLPDGRQVVVPGRYIR---------ASDFNGK-LG -QDNNPDWKTVALD-QNDKIVLPNGSIGFRW----GAEGRSDEGRWNLENKE--A------ --------RGDGDVKLKLSLM------E--------GEDSEYQVGEVAFPYFGGID----- -------------TPNFHANKQVSAVDDVLVRKVPVRRIKLG-KAGEERYALVATV----- ----FDLTVAN-YGVARGL--------DGETAAKDYEEDVPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNSTSFFYAHTDQWRYEKLGVEEI -------LSPLADKSKFGGSLIDYNVRAERMGWLPS-----APQLQ-TNPMQVVKDAQAVG -MDPK-----EYAIKAL-----QD---------------GSLKMSCEDPDNPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGPEDAKPAEVKWHDKAPEGKL -DLLVTLDFRMSTTCMYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSRSDWEIYKGFAKAFSEVCVGHLGVE-KELMLTPLMHDTPAELAQAF----EVNEWQKG -KCELIPGKTAPQITVVERDY--PSTYKRFTALGPLMAKVGNGGKGIGWNTADEVQQL--- ------GELNGHVRTEGVTKGFPKIETDIDACEVVLQLAPETNGHVAVKAWEALGKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHELIPWRTLT------GRQQFYLDHPWMIAFGEGLTSYRPPVDLKT----VDDMID- -------------------------RKPNGNKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKDAGIVDNDWV-- ----------------ELFNTNGAIAARAVVSQRVNPGMVMMYHAQE-------------- ---KIINTP-GSEISGMRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVIVRKMR-------KIDW---LDNEANNQVQV----------------- ----- ->Yukon_2004-1_F_bin.10_scaffold_678_1 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- -------------------------------------NGKLGQDNNP------EW-KTVAL -DQA--------DRVVL-----PNGSIGFRWGAEGRSD--------------------AGK -WNLEDKEARGG--------NEVKLKLSLM------------------------------- ---------------------------------------------------------EGEG -ADYEVGEVA--------------------------------------------------- ----------------------FPYFGGIDT------------------PNFSANKQASA- -------------------------------------VD---------------------D ------------------VLVR--------------------------------------- ------------------------------------------------------KVPVR-- ------------------------------------------------------------- -------------------------------------RIKLG-KAGEERYALVATV----- ----FDLTAAN-YGVGRGL--------PGEDAAASYDDDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNSTSFFYAHTDQWRYERLGVEEI -------LSPLADKTKFGGSMIDYNVRAERMGWLPS-----APQLQ-TNPMQVVKDAQAQG -MDPK-----EYAVKSL-----KD---------------GSLKMSCEDPDHPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGAEEAKPTEVTWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWEIYKGFAKSFSEVCVGHLGVE-KELLLTPLMHDTPAELAQAF----DVQEWSKG -DCDLIPGVTAPQINVVERDY--PNTYKRFTALGPLLEKHGNGGKGIGWNTDDEVHQL--- ------GELNGKVRAAGVTQGMPKIETDIDACEVVLQLAPETNGHVAVKAWEALGKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYLDHPWMLAFGEGMTTYRPPVDLKT----VDEMLN- -------------------------RRPNGNKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKSAGIVDNDWV-- ----------------ELFNSNGAIAARAVVSQRVNRGMVMMYHAQE-------------- ---KTINTP-GSEITGIRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKML-------KVDW---LDDEAPATVQA----------------- ----- ->cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.17_Ga0451756_0000169_17 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLNY--FSNPKE--AFS-GGHGVTTGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLK---------HWRAALAVA-KSPVDA -WTSIVENPNARLEWQEQRGLGGFVRSTWEEVNQIIASANVYTIKQY----GADRI-IGFS -PIPAMSMIS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAIAMAMGHVILKEFYF----D -KRSAYFDDYVRRYTDMPNLVQLEERTLPDGRKVTVPGRYLR---------ASDFNGK-LG -QDNNPEWKTVALD-QADRMVLPNGSIGFRW----GAEGRSDAGKWNLEDKE--A------ --------RGGNEVKLKLSLM------E--------GEGADYEVGEVAFPYFGGID----- -------------TPNFSANKQASAVDDVLVRKVPVRRIKLG-KAGEERYALVATV----- ----FDLTAAN-YGVGRGL--------PGEDAAASYDDDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNSTSFFYAHTDQWRYERLGVEEI -------LSPLADKTKFGGSMIDYNVRAERMGWLPS-----APQLQ-TNPMQVVKDAQAQG -MDPK-----EYAVKSL-----KD---------------GSLKMSCEDPDHPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGAEEAKPTEVIWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWEIYKGFAKSFSEVCVGHLGVE-KELLLTPLMHDTPAELAQAF----DVQEWSKG -DCDLIPGVTAPQINVVERDY--PNTYKRFTALGPLLEKHGNGGKGIGWNTDDEVHQL--- ------GELNGKVRAAGVTQGMPKIETDIDACEVVLQLAPETNGHVAVKAWEALGKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYLDHPWMLAFGEGMTTYRPPVDLKTV----DEMLN- -------------------------RRPNGNKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKSAGIVDNDWV-- ----------------ELFNSNGAIAARAVVSQRVNRGMVMMYHAQE-------------- ---KTINTP-GSEITGIRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKML-------KVDW---LDDEAPATVQV----------------- ----- ->cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.23_Ga0451756_0000618_5 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLNY--FSNPKE--PFS-GGHGVTTGEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----ADL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLK---------HWRA-ALAVAKSPVDA -WASIVQNEDARREWQQQRGLGGFVRSTWDEVNQLIASANVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWGEQTDVPESADWYNSTYIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAIAMAMGHVILKEFYF----D -KRSAYFDDYVRRYTDMPNLVQLEERTLPDGRKVTVPGRYLR---------ASDFNGK-LG -QDNNPEWKTVALD-QNDRVVLPNGSIGFRW----GAEGRSDAGKWNLENKE--A------ --------RGDSEVKLKLSLM------E--------GEGSEYEVGEVAFPYFGGID----- -------------TPNFSANKQASAVDDVLVRHVPVRRIKLG-KAGEERYALVATV----- ----FDLTAAN-YGVARGL--------PGENAATSYDHDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNSTSFFYAHTDQWRYERLGVEEI -------LSPLADKSKFGGSMIDYNVRAERMGWLPS-----APQLQ-TNPMQVVKDAQAQG -MDPK-----DYAVKAL-----KD---------------GSLKMSCEDPDHPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGAEDAKPTEVTWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWEIYKGFAKAFSEVCVGHLGVE-KELMLMPLMHDTPAELAQAF----DVKEWSKG -ECELIPGKTGPQISVVERDY--PNTYKRFTALGPLMEKAGNGGKGIGWNTTDEVHQL--- ------GELNGKVRAEGVTQGMPNISTDIDACEVVLQLAPETNGHVAVKAWEALSKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYLDHPWMQAFGEGMTSYRPPVDLKT----VDEMID- -------------------------RRPNGNKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKNAGIVDNDWV-- ----------------ELFNSNGAIAARAVVSQRVNPGMVMMYHAQE-------------- ---KTINTP-GSEITGIRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMR-------KVDW---LDGEAPATVQA----------------- ----- ->NASQAN2011_028_B_bin.24_k121_53788_5 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLNY--FTNPKE--PFS-GRHGVTTGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----ADL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLQ---------HWRA-ALAVAKSPVDA -WTSIVQNEDARREWQQQRGLGGFVRSTWDEVNQLIASANVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWGEQTDVPESADWYNSNFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAIAMAMGHVILKEFYF----D -KRSAYFDDYVRRYTDMPNLVQLEERNLPDGRKVMVPGRYLR---------ASDFNGK-LG -QDNNPEWKTVALD-QNDRVVLPNGSIGFRW----GAEGRSDAGKWNLENKEA-------- --------RGDNEVKLKLSLM------E--------GEGSDYEVGEVAFPYFGGID----- -------------TPNFSANKQASAVDDVLVRHVPVRRVKLG-KAGEERYALVATV----- ----FDLTAAN-YGVARGL--------PGENAATSYDHDTPYTPAWQEKITGVKQDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTPLAFALDWVRPPRQMNSTSFFYAHTDQWRYERLGVEEI -------LSPLADKSKFGGSMIDYNVRAERMGWLPS-----APQLQ-TNPMKVVKDALAQG -MDPK-----DYAVKSL-----KD---------------GSLKMSCEDPDHPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGIEDAKPTEVHWHDQAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWEIYKGFAKAFSEVCVGHLGVE-KELMLTPLMHDTPAELAQAF----DVKEWKKG -ECELIPGKTAPQISVVERDY--PNTYKRFTALGPLMEKAGNGGKGIGWNTADEVHQL--- ------GELNGKVRAEGVTKGMPNISTDIDACEVVLQLAPETNGHVAVKAWEALSKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYLDHPWMLAFGEGMTSYRPPVDLKT----VDEMID- -------------------------RKPNGHKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKSAGIVDNDWV-- ----------------ELFNSNGAIAARAVVSQRVNPGMVMMYHAQE-------------- ---KTINTP-GSEITGIRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMR-------KIDW------------------------LDGEAPA -TVQA ->NASQAN2015_227_F_bin.21_scaffold_4919_3 rank: C; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLNY--FTNPKE--PFS-GRHGVTTGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----ADL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLQ---------HWRAALAVA-KSPVDA -WTSIVQNEDARREWQQQRGLGGFVRSTWDEVNQLIASANVYTAKQY-------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->Yukon_2004-1_F_bin.10_scaffold_25058_1 rank: C; rfr:Rfer_2792 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLSY--FSQPRE--SFS-GDHGVTTGEDR------TW-EDAYR -TRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPLVRGRLLK---------LWRE--ARLSMQPVDA -WASIAQSDEKRREYQTVRGLGGFVR------------SNVYTIKKH----GPDRI-VGFS -PIPAMSMVS------YGAGSRYLSL----------------------------------- ----IGGVPLSFYDWYCDLPPASPQVWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAVTPDYSEVAKLSDIWMKPKQG-TDAAVAMAMGHVILKEFYF----P -DGGKPRSAY---FDDMPMLVMLKEHQLPNGDTVMVPDRYVR---------ASDFNGK-LG -AANNPDWKTVAFD-ESGKVVLPNGAIGFRW----GPDGRADEGQWNLEAKE--A------ --------RHGTEVKLKLSVM------E--------GDNPSLETAKVGFPYFGGIV----- -------------SEHFPNNATGDAAKDVLVRTVPVQRISLG-KEGDKREALVATV----- ----FDLQVAN-YGVARGL--------PGELAAKDFNDDTPYTPAWQERITGTPREQLITV -ARQF------AENADKTHGKSMVIIGAAMNHWYHAD-MNYRGVINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNGTSFFYAHTDQWRYEKLGMDEV -------LSPLADKKLYGGSMIDYNVRAERMGWLPS-----APQLK-TNPFQVVKDAEAAG -MSPV-----DYTVKSL-----KD---------------GSLAMSCEDPDHPN-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTTHGVQG--------------------------- --------------------------------KDLGADEAK-------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------PTEVVW------------------------------ -----------------------------------------HKEAPEGKLAL--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----VVTLD---------------------------------------------------- -----------------------------F------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4056_4 rank: C; buq:AC233_31260 narZ; nitrate reductase; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --WRSNILGS---SGKGHEYFLKHLLGTSNGVQG---KDLGPQDAKPTEVKWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SAAVDPAW -QSRSDWEIYKGFAKKFSEVCVGHLGVE-QEVVLTPLMHDSPAELGQPM----GVQDWKRG -DCELIPGKTAPQITVVERDY--PNVFKRFTALGPLMNKVGNGGKGIAWNTQVEVTQL--- ------GQLNGLVREEGVTKGMPKIDTDIDACEVVLQLAPETNGHVAVKAWEALSKA---- ------TGRAHKHLALYRE----D-EKIRFR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHAWMLAFGEGFGSYRPPVDMKA----TALMHN- -------------------------QRPNGQPEILLNF-------------------ITPH -QKWGIHSTYTDNVLMLTLSR---------------GGPIVWLSEDDAKSAGIVDNDWV-- ----------------ELFNVNGAIAARAVVSQRVKPGMVMMYHAQE-------------- ---KIINTP-GSEITHVRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMD-------KIDW---LDTPVG-------AERVTRVQAQGENA- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4528_3 rank: C; metr:BSY238_1272 nitrate reductase, alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLSY----FSQPTEPFS-NEHGITTGEDR------TW-ENAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCQRGASYSWYLYSANRVKHPMVRARLLK---------HWRE--ARLHHDPVDA -WASIMANETKRRDYQQVRGLGGFVRSSWDEVNEIIAAANVHTIKKH----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQIWGEQTDVPESADWYNSSYIIAWGSNVPQTRTPDAH -FFTEVRYKGCKTVAVTPDYSEVAKLADLWMHPKQG-TDAALAMAMGHVILKEFYF----D -RRAAYFDDYARRYTDLPMLVMLREQTLDNGRTVLVPDRLLR---------ASDFNGK-LG -QANNPDWKTIAFD-TTGKAVAPNGSIGFRW----GPEGRADAGRWNLEDKD--A------ --------RTGADTKLKLSVL------EDEHGEGAAQAHEIVEVGF---PYFGGVV----- ----------------NPHFTGNDQGGDVRRIHVPAVRLRLG-KAGEERHALVATV----- ----FDLQAGQ-YGIDRGL----------GTGAKNFDDDAPYTPAWQEAITGVPREQVIAV -ARQF------AENAEKTEGRSMVIIGAAMNHWYHAD-MNYRGVINMLMMCGCIGKSGG-G ---WAHYVGQEKLRPQT---GWTALAFA--------------------------------- -----------------------------------------------LDWIRPPRQQNSTS -FFY------------------AH------------------------------------- ---------------------------TDQWRYE--------------------------- -----------------------------------------------------KLGMDEVL -SPLADKAAFKGSAIDFK------------------------------------------- ------------------------------------------------------------- --------------------------------APQLNVNPIQVAKA--------------- -------------------------ARAA-------------------------------- --------------------G---------------------------------------- ------------------------------------------------------------- ------------------------------------------VDPKDYTVQGLKNGS---- --------------------------------------IDLACHDPDAP------------ -----------------------------QNW----------------------------- -------PRNMFV----------------W------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.3_scaffold_11088_2 rank: A; metr:BSY238_1272 nitrate reductase, alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ----------------------S-------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------D ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------MNYRGVINMLMLCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWIRPPRQMNSTSFFYAHTDQWRYEKLGMDEI -------LSPLADKKAYAGSMIDYNVRAERMGWLPS-----APQLK-TNPLKVVRDASAAG -MDPK-----DYTVKGL-----KD---------------GTLKMSCEDPDHPD-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGRDEAKPSEVVWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWDIYKGFAKKFSEVCVGHLGVE-REMVLSPMMHDSPGELAQPL----DVKDWKRG -EVDLIPGKTAPNMVVVERDY--PNVYKRFTALGPLMNKVGNGGKGIAWNTQTEVKQL--- ------GELNGLITEQGVTCGMPRIDSDIDACEVVLQLAPETNGHVAVKAWQALGKQ---- ------TGIDHTHLALYRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHELIPWRTLT------GRQQFYMDHPWMIAFGEGFTSYRPPVDLKTT---------- ----------AGIHGIKSNGNP----------EILLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKRAGIVDNDWV-- ----------------ELFNINGAIAARAVVSQRVNNGMTLMYHAQE-------------- ---KIINTP-GSEITGIRGGIHNSVT---RVVLKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDW---LDTPADASNPA------------GSHA- ----- ->NASQAN2016_164_F_bin.17_scaffold_8891_2 rank: A; rfr:Rfer_2792 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTY--FSQPRE--SFS-GDHGVTTGEDR------TW-ENAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPLVRGRLLK---------LWRE--ARLSQDPVDA -WASIAQSDAKRKEYQSVRGLGGFVRSSWDEVNEMVAAANVYTIKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQIWGEQTDVPESADWYNS----------------DAH -FFTEVRYKGTKTVAVTPDYSEVAKLSDIWMKPKQG-TDAAVAMAMGHVILKEFYFPDGGK -ARSTYFDDYVRRYTDMPMLVMLKEQTLPSGEVVMVPDRYLR---------ASDFNGK-LG -AANNPEWKTVALD-ESGKVVLPQGAIGFRW----GPDGRADEGQWNLQAKE--A------ --------RHGNDVKLKLTVM------E-----GEQASLETAKVGF---PYFGGIE----- -------------SEHFPNNATGAGANNVLVRTVPVQRIALG-KAGDTREALVATV----- ----FDLQVAN-YGVARGL--------PGELAAKDFNDDTPYTPAWQERITGTPREQLITV -ARQF------ADNADKTHGKSMVIIGAAMNHWYHAD-MNYRGVINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFGLDWIRPPRQMNSTSFFYAHTDQWRYEKLGMEEV -------LSPLADKKAFGGSMIDYNVRAERMGWLPS-----APQLK-TNPLQVVRDAQAAG -MEPK-----DYAVKGL-----KE---------------GTLSMSCEDPDHPD-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSNGVQG---KDMGHDEAKPEEVVWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->NASQAN2015_227_B_bin.17_k121_559871_7 rank: A; rfr:Rfer_2792 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTY--FSQPKE--AFS-GEHGVSTGEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPLVRGRLLK---------LWREARLS--MDPVDA -WASIAQDDAKRKEYQSVRGLGGFVRSGWDEVNEMVAAANIYTIKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYC-------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.12_scaffold_10959_2 rank: A; aon:DEH84_18240 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- --------------------AA-------------------------------DW-VRPSR -QQN--------STSFFYAHT---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------DQWRYEKL----------------- --------------GVNEVLSPLADKAKF-------------------------------- ------------------------------------------------------------- ----------------------------------------GGSMI---------------- ---------------------------D--------------------------------- ------------------------------------------------------------- ----YNVRAER-------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------MGWLPS-----APQLQ-TNPLNLVKEAQAKG -MDAK-----DYAVQSL-----KD---------------GSLKMSCEDPDNPA-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTTHGVQG---KDLGPNDAKPQEVQWHNQAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SAAVDPAW -EARSDWEIYKGFAQKFSEVCVGHLGAE-REVVMTPIMHDTAAELAQPF----GVQEWKKG -EIDLIPGKTAPQIAVVERDY--PNTFKRFTSLGPLMNKLGNGGKGIGWNTQDEVHAL--- ------GELNGTVREEGVSQGMPKIVSDIDASEVVLMLAPETNGHVAVKAWEALGKQ---- ------TGRDHTHLALHRE----D-EKIRYR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHELIPWRTLT------GRQQFYMDHPWMIAFGEGFVSYRPPVDLKT----LDDIKG- -------------------------VKPNGNKEIALNF-------------------ITPH -QKWGIHSTYTDNLLMLTLNR---------------GGPVIWLSEDDAKSAGIVDNDWV-- ----------------ELFNTNGAIAARAVVSQRVNNGMVLMYHAQE-------------- ---KIVNTP-GSEITGTRGGIHNSVT---RVVLKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDWLDDESSNQGVHA------------------- ----- ->NASQAN2016_164_F_bin.17_scaffold_1152_1 rank: C; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- -----------------VTCG---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------------MPKI- ------------------------------------------------------------D ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------TDIDAC------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------EVVLQLAPETNGHVAVKAWKALGKQ---- ------TGLDHTHLALYRE----D-EKIRFR-DIQAQPRKIISSPTWSGIESETVSYNA-- --------------------GYTNVHEMIPWRTR--EGFTTYRPPVDLKT----TAGIQN- -------------------------IKPNGNKEIALNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGSVVWLSETDAKSVGIEDNDWI-- ----------------EVFNINGAIAARAVVSQRVNPGMTLMYHSQE-------------- ---KIINTP-GSEITGMRGGIHNSVT---RIVLKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDW--------------------LEEEAQGENA- ----- ->NASQAN2015_227_F_bin.21_scaffold_2406_1 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------VSYNAGYTNVHEMI---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------PWRTL-------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------T------------------------------------- --------------------GRQQFYMDHPWMTAFGENFSSYRPPVDLKT----TAGIQN- -------------------------IKPNGNKEIALNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGSVVWLSEDDAKSAGIEDNDWI-- ----------------EVFNINGAIAARAVVSQRVNPGMTLMYHSQE-------------- ---KIINTP-GSEITGVRGGIHNSVT---RIVLKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMA-------KVDWLDDEGSSTEPTATHN---------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.10_scaffold_7566_1 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FSSPKE--SFS-DGHGVTTGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTRD-----DL -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLQ---------HWRA-ALAVSKSPVDA -WANIVENTAARSEWQKQRGLGGFVRSTWEEVNQLIASANVYTAKKY----GPDRV-MGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSNFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYSEVAKLADLWMHPKQG-TDAAVAMAMGHVILKEFYF----N -KRSAYFDDYVRRYTDMPNLVQLEERTLPDGRKVMVPGHYLR---------ASDFNGK-LG -QDNNPEWKTVAID-ENDKIVLPNGSIGFRW----GAEGRSDMGKWNLESKEA-------- --------RGDAEVKLKLSLM------E--------GATPDYEVGDVGFPYFGGID----- -------------TPNFNANKQGEAVDDVLVRKVPVRRIKLG-KAGEERYALVATV----- ----FDLTVAN-YGVARGL--------AGENAALSYDDDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTKGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNGTSFFYAHTDQWRYEKLGVEEI -------LSPLADKSKFGGSLIDYNVRAERMGWLPS-----APQLE-TNSFQVVKDAQAAG -MDTK-----DYVVKSL-----KD---------------GSLKMSCEDPDNPK-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTTNGVQG---KDLGAEEAKPTEVQWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSRSDWEIYKGFAQAYSEVCVGHLGVE-KEVVLTPLMHDTPSELAQAF----DVKEWKKG -ECDLIPGKTAPTIAVIERDY--PNTFARFTALGPLMEKAGNGGKGIGWDTKVEVQQL--- ------QSLNGKVHTEGVSKGMAKIVTDIDAAEVILQLAPETNGHVAVKAWEALSKI---- ------TGRDHTHLAIHRE----D-EKIRFR-DVQAQPRKIISSPTWSGI----------- ----------------------------ESETVSYNAGYTNVHE----------------- ----------------------------------MIPWRTLT------------------- ------------------------------------GRQHFYL------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_237162_4 rank: C; deu:DBW_2564 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- --------------------------------TLT-------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------GRQHFYLDHDAYIAFGEHLSTYKPSPT-------------- ----------PEAYGDLRKT-----VNDGHAKMLN---------------------CLTPH -GKWHIHSTYGDTLRMLTLSR---------------GNEPCWLSEEDAAELGIKDNDHV-- ----------------EVYNDHGVYVARACVSARIPKGVCIVYHAVERTYNIP-------- ---KSQIRR-GEHGEPRRGGMNNSFT---RVHLKPNLMCGGYGQ---------FTYHFNYW -GPV-GVNRDTHVLVRKMH-------VVEY------------------------------- ----- ->sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_397025_1 rank: C; mox:DAMO_0778 narG; Nitrate reductase, alpha chain; may be more similar to a nitrite oxidoreductase; K00370 (db=kegg) ------------------------------------------------------------- --------------------MG--------------WIQDLFAPEQR------SW-EDFYR -NRWAH------DKVVRTTHG-VNCTGSCSWNVYVKQGVVTWEMQALDYPTID-----RSI -PNYEPRGCQRGISTSWYIYSPLRVKHPYMRGALLD------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------LWQEARRE--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------------------------HP------------------ ----------DDPVAAW-------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------ASIT----------------------------------- ------------------------------------------------------------- ----- ->AFN37208|Nitrolancea_hollandica_Lb ------------------------------------------------------------- ----------------------------------------------R------QW-EEFYR -NRWQH------DNITRSTHG-VNCTGGCSWMVFVKDGIVTWEMQATDYPLLE-----PSL -PPYEPRGCQRGISASWYVYSPIRVKYPYMRGPLMD---------FWREARAQH-SDPIQA -WASIVQDEQKRQRWQRARGKGGFRRATWDECLELVASSLLYTAKKY----GPDRV-VAFA -PIPAYSYLS------FGAGTRFIQL----------------------------------- ----FGGFTLSFYDWYADLPNSFPEVWGDQTDVCESADWYNSKFIVANGANMNMTRTPDVH -FISEARHNGTKFVVIAPDFSQVAKYSDWWLPVKAG-QDQALWMGIDHVILKEFYI----D -RQVPYFIEYQKRYTDGPMLVKVHP----TKGGAYSMGQFLR---------ANRINRY--K -DVENGNWQLLVWDKQSG-PRLPKGCIGYRW-------AKKETGKWNITMED--A------ --------MDNTPLDPLLSFL---GQHD---------------------AVAEVEF----- ---------------------DIFGTGKVSRRAVPIKYLETS-EGKVAVTTA--------- ----FDLLLAQ-FAVGRPG--------LTGDYPKSYDDDMPYTPAWQEPYTGIGRDTVIRF -AREF------AGNAEATQGRSMVITGASLNHWYNNG-LCYRGPITALILCGCCGRNGG-G ---LNHYVGQEKLTLVA---AWSCWALGKDWVPTSRLQQSSSWHYAHSDQWRYEGDFTEYA --------PIPRETRWAKGHAMDLLASAVRMGWMPS-----YPQFN-RNPLDVVKQAEAAG -AKT------DEQIVKWVVEQVKS---------------KQLKFAIEDVDAPE-NWPRTWL -IWRGNALQS---SAKGAEFFLRHYLGTHDNAIA-----EEHAKGRVKDVTFREPAPRGKM -DLLCQLNFRMDTTATYCDVVLPTAFW--YEKNDLNTTDLH-TFIHP----L-GAATPPAW -ESKTDYEIFKAIAKKVSELAPSVFQGPVKDIVMTPLAHDTPDELSQDYQAGMKVLDWGKG -EIEMIPGKTAPHFKVVERDY--ANIYNQWITFGPKARENGIVGNGEHIDIKPFYDELLEN -PIDAQPDVRHMRCRVWGGQRYPGLEFAEEAANLLLHLSPESNGEVSYHAFKEGEHQ---- ------VGLPLADLAEGVR----G-VRMTYF-DLTRQVRRTLISPCWTGMVNDGRAYAAWC -LNVERLIPWRTLS------GRQHHYMDHPYYIDYGEQLMTHKPKLDPRK----TGDIV-- -------------------------RSPVDDESVVLNY-------------------ITPH -GKWHIHSTYYDNHRLLTLSR---------------GIEPCWLNDKDAARIGVKDNDWV-- ----------------EVYNDNGVMVTRAAVSARVQMGTCMIYHAPE-------------- ---RTISIPKSQVRGNRRGGAHNSLT---RIRINPMQMAGGYAQ---------WTYAWNYW -GPIGIMTRDTHVAVR--------------------------------------------- ----- ->AFN37205|Nitrolancea_hollandica_Lb ------------------------------------------------------------- -----------------------------------------------------QW-EEFYR -NRWQH------DNITRSTHG-VNCTGGCSWMVFVKDGIITWEMQATDYPLLE-----PSL -PPYEPRGCQRGISASWYVYSPIRVKYPYMRGPLMD---------FWREARAQH-SDPIQA -WASIVQDEQKRHRWQRARGKGGFRRATWDECLELVASALLYTAKKY----GPDRV-VAFA -PIPAYSYLS------YGAGSRFIQL----------------------------------- ----FGGFNLSFYDWYADLXNSFPEVWGDQTDVCESADWYNSKFIVSNAANMNMTRTPDVH -FISEARHNGTKFVVLAPDFSQVAKYSDWWIPVKAG-QDQALWMGADHVILKEFYI----D -RQVPYFIEYQKRYTDGPMLVKVHP----TKGGAYSMGQFLR---------ANRINRY--K -DVENGNWQLLVWDKQSG-PRLPKGCIGYRW-------AKKETGKWNITMED--A------ --------MDNTPLDPLLSFL---GQHD---------------------AVAEVEF----- ---------------------DIFGTGKVSRRAVPIKYLETS-EGK----VAVTTA----- ----FDLLLAQ-FAVGRPG--------LTGDYPKSYDDDMPYTPAWQEAYTGIGRDTVIRF -AREF------AGNAEATQGRSMVITGASLNHWYNNG-LCYRGPITALILCGCCGRNGG-G ---LNHYVGQEKLTLVA---AWTCWALGKDWIPPSRLQQTSTWHYANSDQWRYEGDFTDYA --------PIPRETRWAKGHAMDLLASAVRMGWMPS-----YPQFN-RNPFEVVKQAEAAG -AKT------DEQIVKWVVAQLKS---------------KQLRLAIEDVDAPE-NWPRTWL -IWRGNAMQS---SAKGAEFFLRHYLGTHDNAIA-----EEHAKGRVKDVVVREPAPRGKM -DLVCQLNFRMETTATYSDIVLPTAFW--YEKNDLNTTDLH-TFIHP----L-GAATPPAW -ESKTDYEIFKAIAKKVSELAPSVFQGPVKDIVMQPLAHDTPDELSQDYLAEMKVLDWGKG -EVDLIPGKTAPHFKIIERDY--ANLYNQWTSFGPKARENGIVGNGEHIDIKPFYDELLEN -PIDAQPDVRHMRCRVWGGQRYPGLEFAEEAANLLLHLSPESNGEVSYHAFKEGEHQ---- ------VGLPLADLAEGVR----G-VRMTYF-DLTRQVRRTLISPCWTGMVNDGRAYAAWC -LNVERLIPWRTLS------GRQHHYMDHPYYIDYGEQLMTHKPKLD--PRK--TGDIVR- ---------------SPVDDES-----------VVLNY-------------------ITPH -GKWHIHSTYYDNHRMLTLSR---------------GIEPCWLNDKDAARIGVKDNDWV-- ----------------EVYNDNGVMVTRAAVSARVQMGTCMVYHAPERT------------ ----ISIPK-SQVRGNRRGGAHNSLT---RTRINPMQMAGGYAQ---------WTYAFNYW -GPIGIFTRDTHVA----------------------------------------------- ----- ->AFN37207|Nitrolancea_hollandica_Lb ------------------------------------------------------------- ----------------------------------------------R------QW-EEFYR -NRWQH------DNITRSTHG-VNCTGGCSWMVFVKDGIITWEMQATDYPLLE-----PSL -PPYEPRGCQRGISASWYVYSPIRVKYPYMRGPLMD---------FWREARAQH-SDPIQA -WASIVQDEQKRQRWQRARGKGGYRRATWDECLELVASALLYTAKKY----GPDRC-AAFA -PIPAYSYLS------YGAGSRFFQL----------------------------------- ----FGGFNMSFYDWYADLPNSFPEVWGDQTDVCESADWYNSKFIVSNAANLNMTRTADVH -FVSEARHNGTKFVVIAPDFSQVAKYSDWWIPVKAG-QDQALWMGADHVILKEFYI----D -RQVPYFIDYQKRYTDGPMLVKVHQ----TKGGAYSMGQFLR---------ANRINRY--K -DVENGNWQLLVWDKQSGP-RLPKGCVGYRW-------ATKETGKWNISMED--A------ --------MDNTPLDPLLSFL---GQHD---------------------EVAQVEF----- ---------------------DIFGTGKVARRGVPIKYLETS-EGK-VAVTTAFDL----- -------LLAQ-FAVGRPG--------LTGDYPKSYDDDMPYTPAWQEAYTGIGRDTVIRF -AREF------AGNAEATQGRSMVITGASLNHWYNNG-LCYRGPIEAPILTGCCGRNGG-G ---LNHYVGQEKLTLVA---AWTTWALGRDWIPPSRLQQSPVWHYAHSDQWRYEGDFTDYA --------PIPRETRWAKGHAIDLLASAVRMGWMPF-----YPQFN-RNPLEIVKQAEAAG -AKS------DEQIVKWVVGQLKS---------------GNLRYAIEDIDAPE-NWPRTWV -IWRGNAMQS---SAKGAEFFLRHYLGTHDNAVA-----EEHAKGRVKDVVLRDPAPRGKM -DLVCDINFRMETTALYSDMVLPTAMW--YEKNDLNTTDLH-SFIHP----L-GAAVPPVW -EAKTDYEIFKAIAKKVSELAPSVFPQPVKDIISNPLIHDTPDELAQDYLSEMKVLDWGKG -EIDLIPGKTGPHLKIVERDY--VNLYNRWISFGPKARENGISGNGVHIDIKPFYDELLEN -PLDAQPDVRHMRCIEWGGGRYPRLEFAEEAANLLLHLSPETNGEVCYHAFKEEEKQ---- ------IGMPLADLAESIR----G-VRMNYF-DLTRQVRRTMISPCWTGMINDGRAYAAWC -LNVERLVPWRTLS------GRQHHYMDHPYYIDYGEQLMTHKPKLDPRKTG--DIVRSP- ----------VDDES------------------VVLNY-------------------ITPH -GKWHIHSTYYENHRMLTLSR---------------GIEPCWINDKDAARIGIKDNDWV-- ----------------EVYNDNGVMVTRAAVSARVQMGTCMIYHAPERT------------ ----ISIPK-SQVRGNRRGGAHNSLT---RTRINPMQMAGGYAQ---------WTYMFNYW -GPIGIFTRDTHVAVR--------------------------------------------- ----- ->AFN37206|Nitrolancea_hollandica_Lb ------------------------------------------------------------- ----------------------------------------------R------QW-EEFYR -NRWQH------DNITRSTHG-VNCTGGCSWMVFVKDGIITWEMQATDYPLLE-----PSL -PPYEPRGCQRGISASWYVYSPIRVKYPYMRGPLMD---------FWREARAQH-SDPIQA -WASIVQDEQKRQRWQRARGKGGYRRATWDECLELVASALLYTAKKY----GPDRV-TAFA -PIPAYSYVS------FGAGARFIQL----------------------------------- ----FGGFHLSFYDWYADLPNSFPEVWGDQTDVCESADWYNSKFIVSNAANLNMTRTADVH -FVSEARHNGTKFVVLAPDFSQVAKYSDWWIPVKAG-QDQALWMGADHVILKEFYI----D -RQVPYFIEYQKRYTDGPMLVKVHQ----TKGGAYSMGQFLR---------ANRINRY--K -DVENGNWQLLVWDKQSGP-RLPKGCIGYRW-------AKKETGKWNITMED--A------ --------MDNTPLDPLLSFL---GQHD---------------------AVAEVEF----- ---------------------DIFGTGKVSRRAVPIKYLETS-EGK----VAVTTA----- ----FDLLLAQ-FAVGRPG--------LTGDYPKSYDDDMPYTPAWQEGYTGIGRDTVIRF -AREF------AGNAEATQGRSMVITGASLNHWYNNG-LCYRGPITALILCGCCGRNGG-G ---LNHYVGQEKLSLVS---AWQSWALAKDWFPPSRVQQSSTWHYAHSDQWRYEGDFTDYA --------PIPRETRWAKGHAMDLLASAVRMGWMPM-----YPQFN-RNPLELVKQAEAAG -AKS------DEQVVEWVVGQLKS---------------GNLRYAIEDVDAPE-NWPRVWL -IWRGNAFQS---SAKGAEYFLRHYSGTHDNAVA-----EEHAKGRVKDVVFREPAPRGKF -DLLCDLNFRMDTTALYSDIVLPTAMW--YEKNDLNTTDLH-TFIHP----L-GAAVPPVW -EAKSDYEIFKSLAKKVSELAPSVFPQPVKDIVSNPLAHDTPDELSQDYLAEMKVLDWGKG -EIEMIPGKTAPHFKIVERDY--VNFYNRWISYGRKARENGIVGNGVHIDIKPFYDELLEN -PLDAQPDVRHMRCIEWGGQRYPRLEFAEEACNLIMFLAPESNGEVCYHAFKEEEKQ---- ------LGLPLADLAEAVR----G-VRMNFF-DLTRQVRRTLISPCWTGMVNDGRAYSAWC -LNVERLIPWRTLS------GRQHHYMDHPYYIDYGEQLMTHKPKLD--PRK--TGDIVR- ---------------SPVDDES-----------VVLNY-------------------ITPH -GKWHIHSTYYDNHRMLTLSR---------------GIEPCWLNDKDAARIGIKDNDWV-- ----------------EVYNDNGVMVTRAAVSARVQMGTCMIYHAPERT------------ ----ISIPK-SQVRGNRRGGAHNSLT---RTRINPMQMAGGYAQ---------WTYMWNYW -GPIGILTRDTHVAVR--------------------------------------------- ----- ->WP_005004540|Nitrococcus_mobilis ------------------------------------------------------------- --------------------MG--------------WIQDLINPKTR------RW-EEFYR -NRWQH------DNIFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLGRGEGGRGI -PPYEPRGCQRGISASWYVYSPIRVKYPYGKGVLLD---------FWREARSSH-NNPVEA -WSSIVTDENKRKRWQKARGKGGYRRTTWDELLELIASACLYTAQKY----GPDRV-MGFS -PIPAMSMLS------YAAGSRFLQL----------------------------------- ----FGGVNMSFYDWYADLPNSFPEIWGDQTDVCESADWYNSKFIVSMASNLNMTRTPDVH -FISEARHEGAKFVVLAPDFSQVSKYADWWIPVKKG-EDLGLWMAAGHVIYTEFYV----K -RQVPYFIDYVTRYTDMPFLVKLE-----KDGDGYRPGRYLT---------SEEVKKY--K -KQENAAWKQLVFDRKSNEARCPKGQIGHRH---------GKHGQWNLKMEDG-------- --------LDNSPIEPVLSFL--GESDD---------------------VAMVQFY----- ----------------------EFASQTVYKRGVPAKKIDTG-SGSVLVATV--------- ----YDLNMGQ-YAVNRGL---------PGDYPESYDDLKPYTPAWQEQFSGIGRQTVIRF -AREF------AGTAEKTKGRSMVIVGASANHWYHNN-HIYRAAINCLIACGCCGRNGG-G ---MNHYVGQEKLAIVA---PWNALALAGDWGIKPRLQQSPVWHYVNSDSWRYEGSFEEYA --------PSPPNAKWAKGHSVDLVAKSVRMGWMPH-----YPQFN-RSPLEVAREAEKAG -AKD------DKGMADYVVQALKK---------------KNLSFSVDDPDAPE-NWPRVWF -IWRGNAMQS---SAKGAEFFLRHYLGTHDNAVA-----EERAKPHVKHVKFREPAPRGKF -DLVVDINFRMDSTALYSDIVLPTAFW--YEKNDLNSTDLH-SFIHP----L-GQAVPPVW -ESKSDWDIFKAFAKKISEMAPSVFSEPFKDVVAAPLTHDTPDEIAQRD-----VKDWLEG -ECEPIPGKTMPHFRVVERDY--SLLYNKYISLGSAIRENGISGNGCSFPITKQYDELTNQ -PVGGSPDPRHRRAVEWGGKRYPCVEDALDAANVLLYLAPETNGEVAYQAFKSEQEH---- ------CGVPLTDLAEPYR----G-HQVTFY-DLTRQPRRLLCSPVWTGNCGDGRAYSAWT -LQIDRLVPFRTLT------GRQHIYIDHPWYMDFGEHLCTYRPKLDYKKIHDLDNSPID- ------------------------------DKTLILNY-------------------ITPH -GKWNIHSTYKDNHRMLTLSR---------------GMDPVWINDKDAARVGLKDNDWV-- ----------------EVYNDNGVIVTRANVSRRVQSGMCLYYHAVE-------------- ---RTIYIPKSQIRGGRRAGGHNSVT---RTRINPVYLAGGNAQ---------FTYLFNYW -GPTGIMTRDTHVAVRKLE-------KLEW------------------------------- ----- ->Nitrococcus_mobi_EAR23355 ------------------------------------------------------------- --------------------MG--------------WIQDLINPKTR------RW-EEFYR -NRWQH------DNIFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLGRGEGGRGI -PPYEPRGCQRGISASWYVYSPIRVKYPYGKGVLLD---------FWREARSSH-NNPVEA -WSSIVTDENKRKRWQKARGKGGYRRTTWDELLELIASACLYTAQKY----GPDRV-MGFS -PIPAMSMLS------YAAGSRFLQL----------------------------------- ----FGGVNMSFYDWYADLPNSFPEIWGDQTDVCESADWYNSKFIVSMASNLNMTRTPDVH -FISEARHEGAKFVVLAPDFSQVSKYADWWIPVKKG-EDLGLWMAAGHVIYTEFYV----K -RQVPYFIDYVTRYTDMPFLVKLE-----KDGDGYRPGRYLT---------SEEVKKY--K -KQENAAWKQLVFDRKSNEARCPKGQIGHRH---------GKHGQWNLKMED--G------ --------LDNSPIEPVLSFL--GESDD---------------------VAMVQFY----- ----------------------EFASQTVYKRGVPAKKIDTG-SGS----VLVATV----- ----YDLNMGQ-YAVNRGL---------PGDYPESYDDLKPYTPAWQEQFSGIGRQTVIRF -AREF------AGTAEKTKGRSMVIVGASANHWYHNN-HIYRAAINCLIACGCCGRNGG-G ---MNHYVGQEKLAIVA---PWNALALAGDWGIKPRLQQSPVWHYVNSDSWRYEGSFEEYA --------PSPPNAKWAKGHSVDLVAKSVRMGWMPH-----YPQFN-RSPLEVAREAEKAG -AKD------DKGMADYVVQALKK---------------KNLSFSVDDPDAPE-NWPRVWF -IWRGNAMQS---SAKGAEFFLRHYLGTHDNAVA-----EERAKPHVKHVKFREPAPRGKF -DLVVDINFRMDSTALYSDIVLPTAFW--YEKNDLNSTDLH-SFIHP----L-GQAVPPVW -ESKSDWDIFKAFAKKISEMAPSVFSEPFKDVVAAPLTHDTPDEIAQRD-----VKDWLEG -ECEPIPGKTMPHFRVVERDY--SLLYNKYISLGSAIRENGISGNGCSFPITKQYDELTNQ -PVGGSPDPRHRRAVEWGGKRYPCVEDALDAANVLLYLAPETNGEVAYQAFKSEQEH---- ------CGVPLTDLAEPYR----G-HQVTFY-DLTRQPRRLLCSPVWTGNCGDGRAYSAWT -LQIDRLVPFRTLT------GRQHIYIDHPWYMDFGEHLCTYRPKLDYKKIH--DLD---- -------------------------NSPIDDKTLILNY-------------------ITPH -GKWNIHSTYKDNHRMLTLSR---------------GMDPVWINDKDAARVGLKDNDWV-- ----------------EVYNDNGVIVTRANVSRRVQSGMCLYYHAVERT------------ ----IYIPK-SQIRGGRRAGGHNSVT---RTRINPVYLAGGNAQ---------FTYLFNYW -GPTGIMTRDTHVAVRKLE-------KLEW------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_1443778_1 rank: C; mox:DAMO_0778 narG; Nitrate reductase, alpha chain; may be more similar to a nitrite oxidoreductase; K00370 (db=kegg) ------------------------------------------------------------- ---------------------------------MS-WIEDIISPNTR------KW-EEFYR -NRWQY------DKVVRSTHG-VNCTGGCSWAIHVKDGIVVWEMQQLDYPQFN-----KDV -PPYEPRGCQRGISYSWYLYSPIRVKYPIIRGALID---------LFRE------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------E ------------------------------------------------------------- ------------------------------------------------------------- --------KKKCG------------------------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------G ------------------------------------------------------------- -----------------------------------------DPVLA--------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------------------------W--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------------ANLQADDTK------------ ---------------------------RKRYQRA--------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->Nitrobacter_winogradskyi_gb_ABA05326 ------------------------------------------------------------- ---------------------------------MS-WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRVKYPYIRGPLAD---------LWHEAKASY-PDPVQA -WASLVEDEEKRNRIQKARGKGGFRRAKWEELIELIAASCLYTARKH----GPDRV-MGFS -PIPAMSMLS------FAAGTRFLSL----------------------------------- ----FGGGLMSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMASNMNMTRTPDVH -FISEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYI----D -RQVPYFIDYVKRYTDLPFLVELEP-----NGNTYKTGRLLR---------SNRVARY--K -DVENGEWKMLVLDTATGEPRAFKGQVGDRW--------GSTHGKWNLSAED--T------ --------LDNSPIDPVLSFI------D--------QSDGVVQVGFD--DFVNGSV----- -----------------------------VSRGVPVKRIATD-KGE----VLVTTG----- ----FDIMMSQ-FGHSRGL--------EGSFATSYDDEDAPYTPAWQERHTGIGRETAIRF -AREF------ATNAELTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWSTVAMALDWNKPPRVVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPRWAKGHAIDLEAKSVRCGWMPF-----TPNFH-RNPIEVVAEAERAG -AKS------TADIATYVADQVAS---------------KKLDLAINDPDAEE-NWPRVWF -IWRANAIQS---SAKGHEFFLRHYLGAHDNVIA-----EERAKGKTTTVKYRDTAPQGKY -DLVVDINFRMNTTGLYSDIILPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWEIFKLIAKKVSELSPLAFSKPVRDIVLQPLMHDTPDELAQPE-----ILDWAEG -ECKLVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGISAVGVNIPIKKQYDQMLEN -PIMPMPDSRHMRCVEWGGKRYPSLEDVLDACNVVLLCAPVANGEVSYQGFVNEEQH---- ------VGLPLADIAEPTR----G-VSSTFY-DLTRQPRRILTSPCWTGLVNDGRAYSAWC -MNIERLVPWRTLT------GRQSLYLDHQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- --------------------------SRVDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRLLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RIRINPLFLAGGYAQ---------FTYGWNYW -GPTGIFTRDTHVVVRKME-------KVEW------------------------------- ----- ->WP_011314088|Nitrobacter_winogradskyi ------------------------------------------------------------- ---------------------------------MS-WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRVKYPYVRGPLYD---------LWKEAKASH-PDPVQA -WASLVGDEQKRSRIQKARGKGGFRRAKWEELVELIAAAALYTARKY----GPDRV-MGFS -PIPAMSMLS------YAAGSRFLQL----------------------------------- ----FGGVNMSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMAANMNMTRTPDVH -FISEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYI----D -RQVPYFIDYVKRYTDLPFLVELEP-----NGNTYKTGRLLR---------SNRVARY--K -DVENGEWKMLVLDTATGEPRAFKGQVGDRW--------GSTHGKWNLSAED--T------ --------LDNSPIDPVLSFI------D--------QSDGVVQVGFD--DFVNGSV----- -----------------------------VSRGVPVKRIATD-KGE----VLVTTG----- ----FDIMMSQ-FGHSRGL--------EGSFATSYDDEDAPYTPAWQERHTGIGRETAIRF -AREF------ATNAELTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWNTIAMALDWTKPPRVVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPRWAKGHAIDLEAKSVRCGWMPF-----TPHFN-RNPIELAAEAERAG -AKS------TADIVTHVVDQVAS---------------KKVNFAIDDPDAEE-SWPRMWF -IWRGNAIQS---SAKGHEFFLRHYLGAHDNSIA-----EDRAKGKTQRVKYRDTAPRGKY -DLVVDLNFRMNTTSLYSDIVLPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWEIFKLISKKVSELSPLAFSKPVRDVVVQPLMHDTPDELAQPE-----ILDWAEG -ECKPVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGVSAVGVNIPIKKQYDQMLDN -PIMPMPDARHMRCVEWGGKRYPSLEDVLDACNTLLMCAPEANGEVCYQGFHNEEHH---- ------VGLPLVDIAEPTR----G-VSSTFY-DLTRQPRRILTSPCWTGLTNDGRAYSAWC -MNVERLVPWRTLT------GRQSLYLDHQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- --------------------------SRVDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRMLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RTRINPLFLAGGYAQ---------FTYGFNYW -GPTGIFTRDTHVVVRKME-------KLEW------------------------------- ----- ->Nitrobacter_sp_Nb_311A_ZP_01048070 ------------------------------------------------------------- ---------------------------------MS-WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRVKYPYIRGPLYD---------LWREAKASH-PDPVQA -WASLVGDEQKRLRMQKARGKGGFRRAKWEELVELIAAAALYTARKW----GPDRV-MGFS -PIPAMSMLS------YAAGSRFLQL----------------------------------- ----FGGVNMSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMAANMNMTRTPDVH -FIAEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYI----D -RQVPYFIDYVKRYTDLPFLVELEP-----NGNTYKTGRLLR---------AKRVARY--Q -DVENGDWKMLVLDSKTGEPRAFKGQVGDRW--------GSTHGKWNLSAED----TLDNS -PIDPVLSFIDQSDGVVQVGF------D---------------------DFVNGSV----- -----------------------------VSRGVPVKRIATD-KGEVLVTTG--------- ----FDIMMSQ-FGHSRGL--------EGSFATSYDDENAPYTPAWQERHTGIGRETAIRF -AREF------ATNAELTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWNTIAMALDWTKPPRVVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPRWAKGHAIDLQAKAVRSGWMPF-----TPHFN-RNPIELAAEAERAG -AKS------TDDIVTHVVDQVAS---------------KKVNFAIDDPDAEE-SWPRMWF -IWRGNAIQS---SAKGHEFFLRHYLGAHDNSIA-----EDRAKGKTQRVKYRDTAPRGKY -DLVVDLNFRMNTTSLYSDIVLPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWEIFKLIAKKVSELSPLAFSKPVRDVVVQPLMHDTPDELAQPE-----ILDWAEG -ECKPVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGVSAVGVQIPIKKQYDQMLDN -PIMPMPDPRHMRCVEWGGKRYPSLEDVLDACNTLLMCAPEANGEVCYQGFHNEEHH---- ------VGLPLVDIAEPTR----G-VSSTFY-DLTRQPRRILTSPCWTGMTNDGRAYSAWC -MNVERLVPWRTLT------GRQTLYIDSQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- --------------------------SRVDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRMLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RTRINPLFLAGGYAQ---------FTYGFNYW -GPTGIFTRDTHVVVRKME-------KLEW------------------------------- ----- ->A_Nitrobacter_hamburgensis_YP_578638 ------------------------------------------------------------- --------------------MS--------------WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRVKYPYIRGPLLD---------MWREAKASS-ADPVQA -WGALIGDEQKRSRIQKARGKGGFRRAKWEELVELIAAASLHTARKH----GPDRI-MGFS -PIPAMSMLS------FAAGTRFLSL----------------------------------- ----MGGSLMSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMASNMNMTRTPDVH -FISEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYV----D -RQVPYFVDYIKRYTDLPFLVELES-----NGNTYKTGRLLR---------SNRVPRY--K -DVENGDWKMLLLDANSGELRAPKGQVGDRW--------GSVHGKWNLSGED----TLDNS -PLDPVLSFIDRSDDVVQVGF------D---------------------DFANGRI----- -----------------------------VSRGVPVKRVATD-KGEILCATG--------- ----FDIMMSQ-FGISRGL--------EGAFATSYDDEDAPYTPAWQERHTGIGRETAIRF -AREF------ATNAELTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWATVALALDWAKPPRLVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPKWAKGHAIDLEAKAVHNGWMPF-----TPHFN-RNPIEVAAEAERSG -AKN------VQDIETYVVDQVVS---------------KKLQMAIDDPDAAE-NWPRMWF -IWRGNAIQS---SAKGHEFFLRHYLGAHDNAIA-----EDRAKGKAQVVKYHETAPRGKY -DLVIDLNFRMNTTSLYSDIVLPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWEIFKLIGKKVSELAPLAFSKPVRDVVLQPLMHDTPDELAQPE-----ILDWSLG -ECKAVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGISAVGVQIPIKKQYDQMLDN -PIMPMPDPRHMRCVEWGGKRYPSLEDVLDACNTVLLCAPEANGEVCYQAFHNEEHH---- ------VGLPLVDLAEPNR----N-VAATFY-DLTRQPRRIITSPCWTGMVNDGRAYSAWC -MNVERLVPWRTLT------GRQSLYLDHQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- -----SR---------------------VDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRMLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RTRINPLFLAGGYAQ---------FTYGWNYW -GPTGILTRDTHVVVRKME-------KLEW------------------------------- ----- ->B_Nitrobacter_hamburgensis_YP_578186 ---------------------------------------------------------MTTG -LAAGQR--------TEETQMS--------------WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRIKYPYVRGPLLD---------MWREAKASS-ADPVQA -WGALVGDEQKRARMQKARGKGGYRRAKWEELVELIAAASLHTARKH----GPDRI-MGFS -PIPAMSMLS------FAAGTRFLSL----------------------------------- ----MGGSLLSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMASNLNMTRTPDVH -FIAEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYV----D -RQVPYFIDYVKRYTDLPFLVELEP-----NGTTYKTGRLLR---------ARHVPRY--K -DVENGDWKMLLLDANSGELRAPKGQVGDRW--------GSVHGKWNLSGED----TLDNS -PLDPVLSFIDRSDDVVQVGF------D---------------------DFANGRI----- -----------------------------VSRGVPVRRIATD-KGEILCATG--------- ----FDIMMSQ-FGISRGL--------EGAFATSYDDEDAPYTPAWQERHTGIGRETAIRF -AREF------ATTAEYTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWASIALALDWSKPPRVVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPRWAKGHAIDLEAKAVRSGWMPF-----TPHFN-RNPIEVAAEAERAG -AKS------TEDIATHVIDQVAS---------------KKLNLAIEDPDAAE-NWPRLWF -IWRGNAIQS---SAKGHEFFLRHYLGTHDNAIA-----EDRAKGKTHTVKYHDTAPRGKY -DLVVDLNFRMDTSSLYSDIVLPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWDIFKLIAKKVSELAPLAFSKPVRDVVLQPLMHDTPDELAQPE-----ILDWAEG -ECKPVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGVSAVGVNVPIKKQYDQMLDN -PIMPMPDPRHMRCVEWGGKRYPSLEDVLDGCNTVLLCAPEANGEVCYQAFHNEEHH---- ------VGLPLVDLAEPTR----N-VATTFY-DLTRQPRRLLTSPCWTGMMNDGRAYSAWC -MNVERLVPWRTLT------GRQTLYIDHQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- --------------------------SRVDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRMLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RTRINPLFLAGGYAQ---------FTYGWNYW -GPTGILTRDTHVVVRKME-------KLEW------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0000472_14 rank: A; doe:DENOEST_1434 s25dA; putative steroid C25 dehydrogenase-like alpha-subunit; K24713 (db=kegg) --------------------------------------MGQRSTWGVVSESRRRFLVKAGL -ASAAGA--------AINLNLFGCGRSHAPLQHFKGTTAGHFDLGPRTTPKLGNW-QDLYR -QRWTW------DKVVKGSHGWANCRSACEWDLYVKDGIVVREEQSATYEASE-----PGV -PDFNPRGCQKGACYTEVMYGPSRTTVPLKRVG---------------------------- -----------------PRGSGQWEKISWEQAIKEIAQKTVDAVTEF----GTDTVFQDLG -PNFDFGPST--------AGRFKFMYQAGSLFADM-------------------------- ---------WGEI---GDLNFGATMALGAAQIGGSSDEWFLSDFIVVWMMNPSVTQIPDAH -FLYEARYNGTELVVIDPQYSATAIHADQWLPIETG-TDAALGLAVARHLFEVNAI----D -------LPFVREQTDLPLLVRLDTGRFLRETDLNSG------------------GNA--- ----------------------------------------DQLYLWHPQKNAPVFAPGC-- --------TGNTTRKLTLDFE----------------------------APIDGQW----- -------------------------------------TIKLH-DGKEVAIAPVGAL----- ----LKEHLEP-WTFEHTA-----------------------------SVTHLHVDQVKKF -AEGW-----------AKCQRPMVLSSWGSNRFVHSD-LMNRSKILCLMLKGALGKKGT-G ----YQATGIVDMEGFNNAMQMDHEGVR--------------------------------- -------------------------------GRLGALLGIMPPADLFQAVLDIVMQRKTEG -DVAL-----ETEMNYL-----KHHLCSSDVMESNFKAPGYRAAVVKEHEGMLPRSLESYY -QEARQKDWS---QGLPRKAPVKVYFSGGANILRRSNMP-----------QYYKTFIWDEM -QCIVDINPKYSFTGTQSDYILPAAGW--YEKAGIKYTMSYVPYLH-----YCDVAVPPLG -ESKGEWEIFWLLTREMERYA---------------------------------------- ---KEKNLPVLDGCGRGSNDF--KTLHQRYSNQGELGQ----------------------- --------------------------------HDDEKVMKEILHGDATEGMTIEGLKQTGI -AKFTSAGKPVAADAINNP----D-WKGEGV-MTTLTRFTVHKEPWPTYS----------- --------------------GRITSFIDHPWFIEMREQFPIHKDSPKAGG----------- ---------------------------------------------------DYPFQFVSCH -ARWSIHSTWRDTPMMLRLQR---------------GEPLVYINPIDAERVGVKDFEYV-- ----------------EIFNNYGSVRMRVKVAAMVRPGVAYYYHAWE-------------- ---------------PHQFPNHQSFKWLIPGLVNPLYMAGGYGQ---------INHAMNRY -QPG-SAVQDTRIGIR------------PW---HGQATGAHPVKRPEAAATSK-------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001772_1 rank: C; doe:DENOEST_1434 s25dA; putative steroid C25 dehydrogenase-like alpha-subunit; K24713 (db=kegg) --------------------------------------MGNLIKTGIASASRRKFLVMAGA -ASAAGA---------ALSLFGCGRAPLQH--FKGTTASGRFDLGPRTAPKLGNW-QDLYR -QRWTW------DKVAKGSHGWANCRSACEWDLYVKDGVVVREEQSATYEASE-----PGI -PDFNPRGCQKGACYTEVMYGPSRTTVPLKRVG---------------------------- -----------------SRGSGKWEKISWEQAMKEIAQKTVDAAEKW----GTDTIYQDLG -PNFDFGAST--------AGRFKFQF----------------------------------- ---MAGGVFADNWAEIGDLNVGASITTGAAHLGGSSDEWFLSDFIIVWMMNPSVTQIPDAH -FLYEARYNGTELVVIDPQYSATAIHADQWLPLESG-TDAALGLAVARHLLETGAI----D -------LPYIREQTDLPLLARLDTGRFLRESEMVNG------------------GNA--- ----------------------------------------DQLYMWHPQKNAPVPAPGC-- --------LNNTTRNLKLDFE----------------------------PPIDGQW----- -------------------------------------KVKLA-DGKEVGVVPVGAM----- ----LKEHLDS-WTFEHAA-----------------------------KVTHLHIDQIKKF -AEGW-----------AKAQRPMVLSSWGSNRYVHSD-LMNRTKLLLLMLKGAMGKKGA-G ----------YQATGWV-------------------------------------------- ----------------------------------------------DLDGFGNAMQMEKSG -MT------------------------------------GRLAVMLNAM------------ ---------P--------------------------------------------------- ------------------------------------------P------------------ ------------------------------------------------------------- -----------------------KELFNA-------------------------------- --------------------------------VVDIIKKRKTEGDVALEG----------- ----------------ENN----Y-LRTK-------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------LCTSDVVEVNLKSDGY--- -----------------------RAALNKEQKGLYPHELDEYYKEAHD------------- -----------------------------KGWAP--------------------------- -----GLPRKAPPKIFF-------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_3 rank: A; ag:AFF61325 s25dA; steroid C-25 hydroxylase alpha subunit (EC:1.17.99.10); K24713 (db=kegg) -----------------------------------------------MSISRRHFIVGSAV -AVAGVG------------LYS--LRPKKP--VVYPVGVRAPKVAAR-KVHYNDY-SDIWR -EKWKW------DKVVKGTHTRANCCAACSWDVYVRDGIAWREEQAAIYEPHR-----PDV -PDFNPRGCQKGACYTQLQVSEARVKYPLKCVG---------------------------- -----------------ERGEGKWKRVSWDTALDEIADRLIDIAVRDGTESIIFDDTTNVG -YGPE-----------TAGDVRFAAA----------------------------------- ----IQATRLDSWSGVGDMPNGLIQTWGLYNCEGTSDDWYLSDYIVIWVGNPNYTRIPDAH -FLHEARYRGAKLVVVAPDLNPSTAHADLWINVNAE-TDSALALSCAQVMIAEKLY----K -------KDYVLQQTDFPFLVRKDDQRFLRAADMVKG--------------GAD------- ----------------------------------------NALYLWDEAKHAPVIAPGCEG --------DGDGGRIMALGGI------K---------------------PALSGTF----- -------------------------------------KVTTQ-DGKTVEVQTVFDM----- ----IRAKLDAEYTPEQAA-----------------------------KITGLHPNVIRTF -AREM-----------AAAPKAMIIASYGSCKHYHHD-LNQRSFVLLMNLTGNQGQQGG-G ----------YRISAW-----WAMDGLD--------------------------------- -------------------------------QMADSTVPLKDMLRIIPKAIRGLSPRDYEG -LFTEYSDKEGHTPALLFLY--LH---------------GGYKEMWDKPHLQDPALPRPF- ---ADYVQES---IDKGW-SKVHPPLGREPRAYI---FTGGNPLRRWPSPQIAKQHLWPKF -ELVVSVNFRMSTSSLFSDYVLPVAAY--YEKYGIKYAQTYVPYIIT----S-DKATEPLG -ESKSDWETFGLLSKHVAERARVRGVTMVRGL----------------------------- ----------------KDVLFDLSKAYEVHTHHG--------------------KYDP--- ----------------------------TDPEDPIKLMDAIFANSPSIGCNTGREALDMGA -VPVIGTGRPSLIDQNYSP----YDPKDTYW-PHKDFIDKKIAWPTLT------------- --------------------GRQQFYIDHPWFLEGKEHLPTFKPSIHANSKF--PLRMYG- -----------------------------------------------------------GH -NRWSIHAVWRDVKLLLRLQR---------------GQPACWLNPKEAEKRGIKDGDMV-- ----------------RVFNDHGTCECMVKVSAITAPGEVIIYHAW--------------- ----------EPYQFKKWQGNQEPVE---APW-KALHLAGGYAQ---------LHWRVYYH -GPN-HSPRGAPVEVEKIGYEGG-------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_4 rank: C; ag:AFF61325 s25dA; steroid C-25 hydroxylase alpha subunit (EC:1.17.99.10); K24713 (db=kegg) -----------------------------------------------MQISRRGFIVGSAV -AAAGVG--------LYSLKSK--KAVIKPGITLP-DKTPAKKIKYN------DY-SDIWR -EKWKW------DKVVKGTHTRANCCAACSWDVYVRDGIAWREEQNAIYEPPR-----PGI -PDQNPRGCQKGACYTALQLSESRVKYPLKRAG---------------------------- -----------------NRGEGKWKRISWDEALTEIADKLLDIAVAEGTETICFDDLSNTG -YGPETAGDFR-----FSTGMQVSRL----------------------------------- ----------DGWSGVGDMPLGVIQTWGAFNCEGTSDDWFRSDYIVIWLGNPSYTRIPDAH -FLHEARYRGAKLVVVAPDLNATTVHADMWLNVKPE-TDAALGLACAQIMISENLY----K -------KDYVLEQTDFPFLVRKDNQRFLRVSDVVKG--------------GAD------- ----------------------------------------NAFYLWDEAKNAIAMAPGCEG --------DGDGGRSLKLGAL------K---------------------PALSGTR----- -------------------------------------SVKLA-DGSTVECITVFDM----- ----IKERLDKEHTPEQAA-----------------------------KITGLHPNVIRTF -AREM-----------AAAPSAMIIASYGACKHYHSD-LFQRSFILLMNLTGNQGKPGG-G -MRVAAWWGMDGLDAMA----DSTIPMA--------------------------------- -----------------------------------------DMMKIIPKAVRGLTPRDYES -LYTDYSNREGHTPTMVFLY--VH---------------GGYKELWDKPYLQDPNLPRNI- ---SSYMRES---IDKGW-TKVHPPENKSPKAYI---FTGGNPLRRWPSPQIAREKLWPKF -DLVCSVTFKMSTSTLWADYVLPVAAY--YEKYGIKYAQSYVPYIIS----S-DKATEPLG -ESKSDWETFGLMAKKVAERAKARNITMVRGL----------------------------- ----------------DDKPFDVSKVYDFYTGNG--------------------KYDP--- ----------------------------TDPEDPVRLMDEIFAGSPNVACNSAREALQRGA -VPVTGPGRPSLINQNYSD----YDGKDTYW-PHRDFIEKKVAWPTIT------------- --------------------GRQQFYIDHPWFIEGKEALPTHKAPPLATSKF--PLRMYG- -----------------------------------------------------------GH -NRWSIHSIWRDVKLLLRLQR---------------GQPAAWMNPAELQKRGLKDGDMV-- ----------------RVYNDHATFECNIKSSPATAPGEIIVYHAWEPFQFK--------- -----------------KWQSNQEVT---EAPVKGLHLAGGYTQ---------LHFRVYYG -SMH-HTPRGAAVEVEKAPT----------------------------------------- ----- ->NASQAN2015_111_B_bin.76_k121_226837_116 rank: A; sdf:ACG33_10685 putative steroid C25 dehydrogenase (S25dA4); K24713 (db=kegg) -----------------------------------------------MSVSRRQFLAHSAL -AGAALA-----------------LQHGDA------LADALTR-PYR------RI-EDIWR -KKWTW------DRVAHGTHG-TNCAGTCAFNVYIRNGVVWREEQQAEYERSGT----PDV -PDYGPRGCNKGLRHARYMYGKQRVLYPMKRVG---------------------------- -----------------KRGEGKWQRISWDQATREIAEKFIEVAVKH----GPDSITLGSG -TQLAVKMAS------YSALARFSNI----------------------------------- ----TGVTVPEFYSGVGDLPTGFYMTTGLTYLGDTMAAVFKSKCVLVWMANPAVTRIPDAH -FFWEAKYNGTEVVTISPEFTPTAMHSSKWLNIKPG-TDTALAMAMVHTIIEEKLY----D -------AAYIREQTDLPFLVREDNGEFLRAEDLN----------------LVDMLAV--- ---------------------------RENV-----------FYLWDQKTRRIVRAPGTGA -AEAPVGRRRRKFETIALGNI------E---------------------PALEGRW----- -------------------------------------TVETR-TGK-VTVTTVFAL----- ----LRKRATE-HSPEKMS-----------------------------TETGLNPKAMRTV -AREF----------AKAGQRAMIYAGFSACKWLHGD-ILQRSMVLLCALTGATGHEGG-G ---VQMANGPKSRGITS--FAFAGVGAA--------------------------------- ------------------------SRVVASTLWDYD-----HGKMKQLNEKIYGKKLA--- ----------DEFDSHY-----QH------------------------------SLEEDWF -------PQY---GKNGWKMGIFAGENGANWRAS--------------GNRWRTEAF-EKL -EMIVALVPDAGITMHHADIVLPIAHH--YERADIMLQSRH-PYVQV----L-DTAVKPLG -EAVDDFEALRRVSAAISTIAREKATPAIKDD----------------------------- ----------------VDGRTFRRDLKRT-----------------------LELYTM--- ---------------------------DGAIRDSRDIVQFIINATPGIPKMSFAELAAKGI -VRVDESRDSTVW----------NSDESPFHADIAESVHEKR--PYETLT----------- --------------------GRQQFYIDHEWFLKFDEALPVYHPPLKQQGYP--LQMTMG- ------------------------------------------------------------H -ARHGIHSMWRDDSFLVSLQR---------------GEPDIYVNPDDAAARKVRDGDLI-- ----------------EVFNDAGSFVCMAHLSAGIMPGTLYMYHGWD-------------- -------------PTMFRGRQNFAAVIPTAGLVKPTSVAGDYGH---------LGYRVLAY -APN-QTYRDFTCEFKLYS-------RGKV---TAAKARIA-------------------- ----- ->icacos_2019_sw_WHONDRS-S19S_0094_F_bin.26_scaffold_99_5 rank: A; sdf:ACG33_10685 putative steroid C25 dehydrogenase (S25dA4); K24713 (db=kegg) -----------------------------------------------MSVNRRQFLAHSAL -AGAALA-----------------LQHGDA------LADALTR-PYR------RI-EDVWR -KKWTW------DRVAHGTHG-TNCAGTCAFNVYIRNGVVWREEQQAEYERSGT----PDV -PDYGPRGCNKGLRHARYMYGKQRVLYPMKRVG---------------------------- -----------------KRGEGKWQRISWDQATREIAEKFIEVAVKH----GPDSITLGSG -TQLAVKMAS------YSALARFSNI----------------------------------- ----TGVTVPEFYSGVGDLPTGFYMTTGLTYLGDTMAAVFKSKCVLVWMANPAVTRIPDAH -FFWEAKYNGTEVVTISPEFTPTAMHSSKWLNIKPG-TDTALAMAMVNTIIEEKLY----D -------AAYIREQTDLPFLVREDNGEFLRAEDLN----------------LVDMLAV--- ---------------------------RENV-----------FYLWDQKTRRIVQAPGTGA -AEAPVGRRRRKFETIALGNI------E---------------------PALEGRW----- -------------------------------------NVETR-TGK-VTVTTVFAL----- ----LKKRAAE-HSPEKMS-----------------------------AETGLNPNAMRTV -AREF----------AKAGKRAMIYAGFSACKWLHGD-ILQRAMVLLCALTGATGHEGG-G ---VQMANGPKSRGITS--FAFAGVGAA--------------------------------- ------------------------SRVVASTLWDYD-----HGKMKQLNEKIYGKKLA--- ----------DEFDSHY-----QH------------------------------SLKEDWF -------PQY---GKNGWKMGIFAGENGANWRAS--------------GNRWRTEAF-EKL -EMIVALVPDAGITMHHADIVLPIAHH--YERADIMLQSRH-PYVQV----L-DQAVKPLG -EAVDDFEALRRVSAAISAIAREKGTPAIKDD----------------------------- ----------------VDGRTFRRDLKRT-----------------------LELYTM--- ---------------------------DGAIRDSRDIVQFIINATPGIPKMSFAELAAKGI -VRVDESRGSTVW----------NSDESPFHADIAESVHEKR--PYETLT----------- --------------------GRQQFYIDHEWFLKFDEALPVYHPPLKQKGYP--LQMTMG- ------------------------------------------------------------H -ARHGIHSMWRDDSFLVSLQR---------------GEPDIYVNPDDAAARKVRDGDLI-- ----------------EVFNDGGSFICMAHLSAGIMPGTLYMYHGWD-------------- -------------PTMFRGRQNFAAVIPTAGLVKPTSVAGDYGH---------LGYRVLAY -APN-QTYRDFTCEFKLHS-------RGKV---------------------------TAAK -VRIA ->NASQAN2014_190_B_bin.96_k121_3766_2 rank: A; sdf:ACG33_10685 putative steroid C25 dehydrogenase (S25dA4); K24713 (db=kegg) -----------------------------------------------MSVNRRQFLTHSAL -AAGAAL--------ALHHGAA--------------MADALSR-PYR------RI-EDVWR -KKWTW------DRVAHGTHG-TNCAGTCAFNVYIRNGVVWREEQQAEYERSGT----PDV -PDYGPRGCNKGLRHARYMYGKQRVLYPMKRVG---------------------------- -----------------KRGEGKWQRISWDQATREIAEKFIDVAVKH----GPDSITLGSG -TQLAVKMAS------YSALARFSNI----------------------------------- ----TGVTVPEFYSGVGDLPTGFYMTTGLTYLGDTMAAVFKSKCVLVWMANPAVTRIPDAH -FFWEAKYNGTEVVTISPEFTPTAMHSSKWLNIKPG-TDTALAMAMVHTIIDEKLY----D -------AAYIREQTDLPFLVREDNGEFLRAEDLN----------------LVDMLAV--- ---------------------------RENV-----------FYLWDQKTRRMVQAPGTGA -AEAPVGRRRRKFETIALGNI------E---------------------PALEGRW----- -------------------------------------TVQTR-TGK-VAVTTVFAL----- ----LKKRAAE-HSPEKMS-----------------------------DETGLNPNAMRTV -AREF----------AKAGKQAMIYAGFSACKWLHGD-ILQRAMVLLCALTGATGHEGG-G ---VQMANGPKSRGITS--FAFAGVGAA--------------------------------- ------------------------SRVVASTLWDYD-----HGKMKQLNEKIYGKKLA--- ----------DEFDSHY-----QH------------------------------SLKEDWF -------PQY---GKNGWKMGIFAGENGANWRAS--------------GNRWRTEAF-EKL -EMIVALVPDAGITMHHADIVLPIAHH--YERADIMLQSRH-PYVQV----L-DRAVKPLG -EAVDDFEALRRVSAAISAIAREKGTPAIKDD----------------------------- ----------------VDGRTFRRDLKRT-----------------------LELYTM--- ---------------------------DGAIKDSRDIVQFIINATPGIPKMSFAELAAKGI -VRVDESRGSTVW----------NSDESPFHADIAESVHEKR--PYETLT----------- --------------------GRQQFYIDHEWFLKFDEALPIYHPPLKQKGYP--LQMTMG- ------------------------------------------------------------H -ARHGIHSMWRDDSFLVSLQR---------------GEPDIYVNPDDATARNVRDGDLI-- ----------------EVFNDGGSFICMAHVSAGIMPGTVYMYHGWD-------------- -------------PTMFRGRQNFAAVIPTAGLVKPTSVAGDYGH---------LGYRVLAY -APN-QTYRDFTCNFKLHS-------RGKV---------------------------TAAK -VRIA ->greatmiami_2019_sw_WHONDRS-S19S_0099_F_bin.30_scaffold_496_3 rank: A; sdf:ACG33_10685 putative steroid C25 dehydrogenase (S25dA4); K24713 (db=kegg) -----------------------------------------------MSVNRRQFLAHTAL -ASAALA--------LQHGAAM--ADALTR--------------PYR------RI-EDVWR -KKWTW------DRVAHGTHG-TNCAGTCAFNVYIRNGVVWREEQQAEYERSGT----PDV -PDYGPRGCNKGLRHARYMYGKQRVLYPMKRVG---------------------------- -----------------KRGEGKWQRISWDQATREIAEKFIDVAVKH----GPDSITLGSG -TQLAVKMAS------YSALARFSNI----------------------------------- ----TGVTVPEFYSGVGDLPTGFYMTTGLTYLGDTMAAVYKSKCVLVWMANPAVTRIPDAH -FFWEAKYNGTEVVTISPEFTPTAMHSSKWLNIKPG-TDTALAMAMVHTIIEEKLY----D -------AAYIREQTDLPFLVREDNGEFLRAEDLN----------------LVDMLAV--- ---------------------------RENV-----------FYLWDQKTRRMVQAPGTGA -AEAPVGRRRRKFETIALGDI------E---------------------PALEGRW----- -------------------------------------TVQTR-TGK-VTVTTVFAL----- ----LKKRAAD-HSPENMS-----------------------------AETGLNPNAMRTV -AREF----------AKAGKQAMIYAGFSACKWLHGD-ILQRAMVLLCALTGATGHEGG-G ---VQMANGPKSRGITS--FAFAGVGAA--------------------------------- ------------------------SRIVASTLWDYD-----HGKMKQLNEKIYGKKLA--- ----------DEFDSHY-----QH------------------------------SLKEDWF -------PQY---GKNGWKMGIFAGENGANWRASGN--------------RWRTEAF-EKL -EMIVALVPDAGITMHHADIVLPIAHH--YERADIMLQSRH-PYVQV----L-DRAVKPLG -EAVDDFEALRRVSAAISAIAREKGTAAIKDD----------------------------- ----------------VDGRTFRRDLKRT-----------------------LELYTM--- ---------------------------DGAIKDSRDIVQFIINATPGIPKMSFAELAAKGI -VRVDESRGSTVWNSDESP----FHADIA------ESVHEKR--PYETLT----------- --------------------GRQQFYIDHEWFLKFDEALPVYHPPLKQKGYP--LQMTMG- ------------------------------------------------------------H -ARHGIHSMWRDDSFLVSLQR---------------GEPDIYVNPDDAAARNVRDGDLI-- ----------------EVFNDGGSFICMAHLSAGIMPGTLYMYHGWD-------------- -------------PTMFRGRQNFAAVIPTAGLVKPTSVAGDYGH---------LGYRVLAY -APN-QTYRDFTCNFKLHS-------RGKV---TAAKVRIA-------------------- ----- ->providencecreek_2019_sw_WHONDRS-S19S_0007_B_bin.10_k121_1581149_4 rank: A; shal:SHALO_2978 molybdopterin oxidoreductase, alpha subunit (db=kegg) ----------------------------------------------MANSSRRNFLKASG- ---------------FSAAMLAGQGTLFAKTDVIK-VENAKDSYPNA------SFTETNYR -DEFKFTYGEKAEHGYAYHCV--NCQGNCAWEVWGNNGIVTRENQSAKYPAF------GHN -PDFNPRGCNKGVQHSQVMYEKDRILYPMKRIG---------------------------- -----------------ERGKGKWKRISWDEAATEVAQKLYTTM-------------IDPK -KGPAAITVH------AGTGLLTEGRRPSVLRFGT-------------------------- ---QLGASRIYPASYLGDMFTGAAIAYGEGNMGCTYDFMFNVSTSIMWGANPSATRIPDAH -FVWEGKYNGSKIIVITPEYNATAARAHLWVPIKPG-TDSFLAMSIINEMLAKKLY----- ------LPQAVKTYTDLPFLVDAKTKRFIRRSDAEHA------------------------ ---------------HDEKTHHLYE---------------DEFYCWNLKSGKPELMPGTEG -SERKTIMLKDKGWDI-----------D---------------------PALEGEW----- -------------------------------------EMTLQ-GGKKVKVTTVFEL----- ----LKKEASK-YSAKDTQ-----------------------------KITGVHLDVVTEL -ATHI-----------AKDKCVEITTGFSLNKYFNGV----LSIWNIATICGLTGRFGPRG ------------------------------------------------------------- -------------------------------GLNTE------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------NEFQLSG------------------------------------------------ ------LEALSGFAGKYS------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------PRFA-------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------SGFLSEFM------------------------------------------- ------------------------------------------------------------- ----- ->muddycreek_2019_sw_WHONDRS-S19S_0082_B_bin.95_k121_853774_5 rank: A; pmx:PERMA_0657 dimethylsulfide dehydrogenase subunit alpha (Dimethylsulfide dehydrogenase molybdenum subunit) (DMS DH alphasubunit) (DMS DH molybdenum subunit) (db=kegg) -----------------------------------------------MKLTRRTVLQGIAG -ASAATVVGGQD---ALGEAGAPAAKTGKD--VPVIIDDPREHYPNT-----RPV-EDMYR -SEFADTFGDPDDHGTAFHCV--NCQGNCAWQVWIKDGKVTRENQSAAYPAIR-----EDI -PDSNPRGCNKGVQHSQVMYEADRIRYPMKRVG---------------------------- -----------------ERGGGKWERISWDEAIDTIAQKLYRTM-------------VERG -PQGNYVH--------VGAGLLSEARGASIKRMGA-------------------------- ---LLGAVRPYIASYVGDMFPGVSLVYGEGNIGCSYDFMYGTNVQVYWGCNPNTSRIPDAH -YVWEGKYNGSKVIVISPEFNSTAIHADRWIPIKPG-FDGHLAMSLMHELVDKQLY----D -------AELVRKFTDLPMLIREDSGAMLRLSDIDPARAAAEGALAFDAELAEKFGKKAHG -KKDHAEDVFLAVNEVGGKLTAMPGGEGSAL---------GTLR----------------- --------LQDVGWKIT--------------------------------PALSGNW----- -------------------------------------TVTLR-DGKTVRVHTVFDA----- ----LRKELEA-FTPEKTH-----------------------------KLTGVHPTLVRDL -ARDI-----------ALPEVVSVTMGFALGKHFNGM-LTQRAIASLMALTCRMGPRGGLN --TENEWSISGLGGLSGFDGAFKHRFAS--------------------------------- -------------------------------GAVSEH----QLGDGAATSKKAYTDDEIRE -ATG------QDAASYR----------------------AEIAALLEKS-----KNDRGVD -PAKGRFGKPWWDTVETFFIVADARFRRNKSGYR--------------------EAFLDKA -KFFAVADMKMGETARFADIVLPSASH--YEVWDLRVNPGYHRFANIA---QPPKGLEPVG -EAKSEWHIATMLVTRMQEIA---------------------------------------- --------------------L--AEYAR--------------------------------- --------------------------------TKNIGVMHIPDPTHTRDGIRPLDKF---- -------------VELFTD----H------------------------------------- --------------------GKLGT---DKQAVEFALGHV--------------------- ------------------------------------------------------------- -------DQFRGEDLESCYDR----------------GGFLVVNDKGGKT----------- -------------------------------SPLYP------------------------- ------------------------------------------------------------- -----DKPYSTF----------------------------------ENHF----------- ----- ->icacos_2019_sw_WHONDRS-S19S_0094_B_bin.166_k121_1114214_14 rank: A; pmx:PERMA_0657 dimethylsulfide dehydrogenase subunit alpha (Dimethylsulfide dehydrogenase molybdenum subunit) (DMS DH alphasubunit) (DMS DH molybdenum subunit) (db=kegg) -----------------------------------------------MSISRRDALRNLLF -GTVAAG--------VAAKVPTAEAKEFSDPQPVR-VDDPRKSYPDT------QTTEDFYR -AEFQAVRGNPDERGFAYHC--VNCQGNCAFEVWTENGKVTRENQSASYPQLA-----PNL -PDANPRGCNKGSQHSQVMYEADRLLYPMKRAG---------------------------- -----------------ERGSGKWKRISWDEAITEIAENL------------HRGL-VEKG -PSSNYVH--------IGAGVLTEARAASIKRLGSL------------------------- ----IGAVRPYIASYVGDMFPGVTVVYGEGNIGCTYDFVFTTNVAVFWGCNPNTSRIPDAH -YLWEGKYNGSKIIVITPEFNSTAIHADLWVPLKAG-YDGHLALSIIHRIIQRKLF----R -------PEFLKEYTDLPFLVRKDTKELVRLSDVALD--------------AKGFDGA--- ----------------SARLFGEHPH--------------ECFLAFNTKNRKFTAMPGTEG -SGVETLRLQDMDWDI-----------D---------------------PALNGSW----- -------------------------------------KLTLK-DGKQVQVTTAFEL----- ----FKKEVAA-FAPEKVQ-----------------------------KLTGVHPSIVDEL -ATDL-----------TKAKVSLVTMGFAVGKHFNGM-LSQRAIASLTAFCGKLGPEGGLN --TENEWNISGLEGLSGFQGKYQHRFAS--------------------------------- -------------------------------GFVSE-----FMLGEGLEDADALYSDEDMR -RGT------GDSKAEY-----KA---------------KVQALLEQGKNDERYKEGKPYW -T-----------TVENFLLFADSRFRRNKGNYQ--------------------KAFLEKA -KFIAYGDVRANDMAIYADILLPCKTP--YECWDLRTNPGYHRYANIA---YPPPNLKPVG -ESKSEWEIATLVVEKLEALAKQKAAAT--------------------------------- ----------------GEDRY---------------------------------VVIP--- --------------------------------DKTHTQEGVRRLDELVREFTKDGTL-RTD -KDAVEYALEHVDQFKPNDTKSLY-ERGGFL-QLNEKAGKSS--PLYADK-----PYNTFE -NQLFLHQRFDTLT------GRLTFYVDHPLWIAANAHVPTAKQPIRPARHP--------- ------------------------------------------------------FVLMTPH -ARWSIHSTYKTSPILLRLQR---------------GKPCVMINPEIARARGIQDGDTI-- ----------------KMFNELGEVRVMAKLSPACPPDALVMEHGWE-------------- ---------------PFMYDGKKGHNLIIGDMLNLLELTDGWGH-------LKFGTNWDGN -----QHAYESTMDIAKA------------------------------------------- ----- ->riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.130_k121_990031_60 rank: A; sul:SYO3AOP1_1175 molydopterin dinucleotide-binding region (db=kegg) -----------------------------------------------MTVSRRDLLKAAAL -GSVAIGSNTLAKNAFTEPIPQKEAKDI----PVI-VEDPRASYLNTK-----SI-EDMYR -REFAETFGEKKDHGYAYHCV--NCQGNCAWQVWTKDGKVTRENQSASYPQIA-----PNI -PDYNPRGCNKGVQHSQIMYEQDRLLYPMKRVG---------------------------- -----------------PRGEGKWKRISWDEAITEVSENLYNTMQE---K----------- --GPAGNYIH------IGAGVLTEGRAASVKRLGT-------------------------- ---LLGAVRPYIASYVGDMFPGVSTVYGEGNIGCTYDFIFKTNVAIFWGCNPNTSRIPDAH -FLWEGKYNGSKIVVISPEYNSTAIHADLWVPIKPG-YDGHLAMAVLNEIVFKKMY----N -------ESFVKEFTDLPLLVRKDNKELVRFAEIDTKDSNFD---------SKSSEKL--- --------------LKKILKRELKEHEVF--------------LAWNQKTNKMTVLPGSEG -SPVETLRLKDRGWNI-----------N---------------------PALSGTW----- -------------------------------------KIKLK-DGHTVEVTTVFDL----- ----FKQELKK-FDPLRMH-----------------------------AVTGVHPTIVSEL -ARDM-----------IVPKNTLVTMGFSLGKYFNGM-LIQRAISALTAISGRLGESGGLN -T-ENEWNITGLSGLSGFEGKYQHRFAS--------------------------------- -------------------------------GFVSE-----YMLGDNLNDYDHLYAEAEIK -EST------GLGKKQY-----RE---------------KIEKIVKDG------ANDEGFK -NGKPYWTTM---ETFLLFADAR--FRRNKGSYK--------------------EAFLKKA -KFIAYGDYRMSDFCNYADILLPCKSH--YEVWDIRTNPG---YHRFANIAYPPANLKNVG -EAKSEWEISTLIAEKIQDIA------------------LKKYKS--------------SG -DKKAIHVPDTTHTQTGFRAL--DEVVNEFTIGG---------------------KVR--- --------------------------------SDKDAVEYMLEHVDQFKPNSTKTMY-ERG -GFLVLNDKAGKSSPLYSN----K-PYNT------FESNKLLYQPFETLT----------- --------------------GRLTFYVDHHLWIETGAHIPTARNPIRPKK----------- ----------------------------------------------------FPFVLMTPH -ARWSIHSTYKTSKILQRLQR---------------GKPYIMINPKVAEAKGIKDGDEV-- ----------------KMFNDLGETFLMAKITPSAPEHSLVMEHGWEPFMYKNKVGH---- ----------------------NALV---GDMINLLELSDGWGH-------LKFGTNWDGN -----QHAYETTVDIVKA------------------------------------------- ----- diff --git a/assets/trees/nar_nxr/nar_nxr.refpkg/phylo_modelNQB2rG.json b/assets/trees/nar_nxr/nar_nxr.refpkg/phylo_modelNQB2rG.json deleted file mode 100644 index 76c34e49..00000000 --- a/assets/trees/nar_nxr/nar_nxr.refpkg/phylo_modelNQB2rG.json +++ /dev/null @@ -1,11 +0,0 @@ -{ - "empirical_frequencies": true, - "datatype": "AA", - "subs_model": "WAG", - "program": "RAxML version 7.7.2", - "ras_model": "gamma", - "gamma": { - "alpha": 1.530755, - "n_cats": 4 - } -} \ No newline at end of file diff --git a/assets/trees/nar_nxr/nar_nxr.tre b/assets/trees/nar_nxr/nar_nxr.tre deleted file mode 100644 index 72500eef..00000000 --- a/assets/trees/nar_nxr/nar_nxr.tre +++ /dev/null @@ -1 +0,0 @@ -(OOP57237|Brocadia_caroliniensis:0.010806074,(RIK02127|Brocadia_sp:0.000910858,(KKO18748|Brocadia_fulgida:0.000000005,OQZ00558|Brocadia_sp_UTAMX2:0.000914005)0.781:0.000917034)0.992:0.013579216,(WP_052562588|Brocadia_sinica:0.009341785,(OHB44699|Planctomycetes_bacterium_GWE2_41_14:0.028539476,((WP_070066136|Brocadia_sapporoensis:0.005501886,RZV59451|Brocadia_sp_BROELEC01:0.002673850)1.000:0.025826757,((((OHB72803|Planctomycetes_bacterium_RBG_16_41_13:0.009726587,(WP_099324707|Kuenenia_stuttgartiensis:0.000917459,NxrA_Candidatus_K_stuttgartiensis_CAJ72445:0.000000005)0.998:0.017229244)1.000:0.098072241,((((RBG1_10:0.249943905,((GCA_001803565_00046|MHDQ01000004unannotatedprotein:0.399259377,((BBJ23760|Nitrotoga_sp_AM1:0.0,BBJ23368|Nitrotoga_sp_AM1:0.0):0.003761140,((RFC31618|Nitrotoga_sp_SPKER:0.006020303,((SPS06998|Nitrotoga_fabula:0.0,SPS06751|Nitrotoga_fabula:0.0):0.042255811,(RFC37636|Nitrotoga_sp_CP45:0.000000005,(RFC33776|Nitrotoga_sp_LAW:0.000000005,RFC30723|Nitrotoga_sp_MKT:0.001768416)0.953:0.002651540)0.916:0.006621566)0.695:0.008594937)0.950:0.008908972,BBJ23476|Nitrotoga_sp_AM1:0.013693167)0.440:0.001391552)1.000:0.666812638)1.000:0.321755680,((((greatmiami_2019_sw_WHONDRS-S19S_0099_F_bin.30_scaffold_496_3:0.011379394,(NASQAN2014_190_B_bin.96_k121_3766_2:0.017081478,(NASQAN2015_111_B_bin.76_k121_226837_116:0.021392246,icacos_2019_sw_WHONDRS-S19S_0094_F_bin.26_scaffold_99_5:0.002525334)0.985:0.013886431)0.102:0.014633186)1.000:1.045689577,((flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0000472_14:0.290495020,flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001772_1:0.289900857)1.000:0.977544665,(flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_3:0.182186058,flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_4:0.220237367)1.000:0.733397499)0.485:0.198655286)0.560:0.125080923,(flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_1443778_1:0.429037937,(sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_397025_1:0.433198646,((NASQAN2011_330_B_bin.17_k121_430440_3:0.641466723,(flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001351_7:0.393884505,(gunnisonriver_2019_sw_WHONDRS-S19S_0062_A_bin.22_Ga0451722_0001801_3:0.324547720,((watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_924190_1:0.157095605,((whiteclaycreek2_2019_sw_WHONDRS-S19S_0038_B_bin.50_k121_1710496_1:0.167523285,(NASQAN2011_265_B_bin.52_k121_959771_6:0.026017376,NASQAN2011_265_B_bin.52_k121_465271_4:0.000000008)0.818:0.115349202)1.000:0.087988271,(logan1_2019_sw_WHONDRS-S19S_0097_B_bin.20_k121_1372227_2:0.159911107,(lewisrun_2019_sw_WHONDRS-S19S_0014_F_bin.22_scaffold_791_5:0.020931878,(watershed3_2019_sw_WHONDRS-S19S_0084_F_bin.6_scaffold_35_30:0.032515342,lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.6_k121_1211148_1:0.071100891)0.951:0.024998611)0.985:0.042982912)1.000:0.086501401)0.986:0.042923050)1.000:0.086203118,(((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_3271_6:0.320376687,(flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_493_9:0.147904578,(nebranchanacostia_2019_sw_WHONDRS-S19S_0081_B_bin.6_k121_1546998_5:0.099435688,lecontecreek_2019_sw_WHONDRS-S19S_0018_A_bin.2_Ga0451754_0000231_3:0.013429712)1.000:0.121234242)0.749:0.040234813)0.863:0.055442056,((king_2019_sw_WHONDRS-S19S_0016_B_bin.5_k121_1281127_1:0.156531059,NASQAN2015_010_A_bin.16_Ga0466474_000034_25:0.177178519)0.992:0.044604086,((((NarG_Escherichia_coli_NP_415742:0.203008887,NarG_Halomonas_maura_gb_AAT47523:0.153894902)0.981:0.047232779,watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0000093_1:0.311887965)0.998:0.063567006,((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_201_6:0.106781950,(NASQAN2011_286_B_bin.1_k121_764018_13:0.005660724,NASQAN2011_286_F_bin.29_scaffold_54_27:0.000000005)1.000:0.123919793)1.000:0.131403606,(NarG_Pseudomonas_stutzeri_gb_AAZ43099:0.046987015,(NarG_Pseudomonas_fluorescens_gb_AEV63780:0.078508524,(flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_1186915_16:0.074914222,flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_2341297_11:0.000000008)0.885:0.078978122)0.708:0.032866426)1.000:0.168519259)0.242:0.019184033)0.998:0.047390479,(flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0000931_1:0.199222465,((littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_6:0.090260755,(littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_7:0.175888927,watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.15_k121_1272084_2:0.078834694)0.544:0.015106087)0.765:0.040298684,flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0004490_1:0.189261863)0.493:0.037097247)1.000:0.139855980)0.732:0.020426298)0.995:0.035229012)0.458:0.027215325,((((((NASQAN2015_172_B_bin.54_k121_327740_1:0.048321373,((cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.17_Ga0451756_0000169_17:0.003316375,Yukon_2004-1_F_bin.10_scaffold_678_1:0.110287220)0.999:0.034293344,(cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.23_Ga0451756_0000618_5:0.010147982,(NASQAN2015_227_F_bin.21_scaffold_4919_3:0.024300445,NASQAN2011_028_B_bin.24_k121_53788_5:0.000000005)0.990:0.014294289)0.365:0.007073108)0.988:0.017900532)0.950:0.016382079,(watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.45_k121_975195_1:0.104162330,flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.10_scaffold_7566_1:0.054766712)0.871:0.041502925)1.000:0.076566993,((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4056_4:0.104610952,((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.19_scaffold_731_2:0.070583667,eastforkpoplarcreek_2019_sw_WHONDRS-S19S_0039_B_bin.13_k121_238651_23:0.043655384)1.000:0.048776638,((yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_2728883_1:0.089459252,cobbmillcreek_2019_sw_WHONDRS-S19S_0090_B_bin.15_k121_168873_1:0.023635532)0.326:0.001148673,lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.30_k121_510322_1:0.090302159)0.885:0.013388066)0.878:0.032405321)0.565:0.021969185,((flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.12_scaffold_10959_2:0.152164297,(NASQAN2016_164_F_bin.17_scaffold_1152_1:0.081072836,NASQAN2015_227_F_bin.21_scaffold_2406_1:0.055593684)0.976:0.109893377)0.649:0.067627453,flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.3_scaffold_11088_2:0.064995222)0.815:0.039464533)0.963:0.029952893)0.148:0.015135463,flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.46_k121_495423_17:0.129369944)0.861:0.019065424,(((watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_1345490_1:0.392541235,yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_3072591_1:0.171599398)0.840:0.248083204,((Yukon_2004-1_F_bin.10_scaffold_25058_1:0.105822798,NASQAN2016_164_F_bin.17_scaffold_8891_2:0.030238438)0.312:0.015380827,NASQAN2015_227_B_bin.17_k121_559871_7:0.039959075)0.928:0.056585084)0.234:0.007394197,(watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0001905_7:0.604640728,flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4528_3:0.181397923)0.845:0.147304633)0.903:0.041551231)0.908:0.028658570,lecontecreek_2019_sw_WHONDRS-S19S_0018_F_bin.2_scaffold_1_206:0.136445862)1.000:0.145006781)0.508:0.034596552)0.999:0.098317003)0.563:0.079911427)0.999:0.168588838)0.985:0.135263217,(CRI68048|Thiocapsa_sp_KS1:1.094261762,(flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_237162_4:0.488541056,(sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_391728_1:0.401066831,((GCA_003453735_00577|DMNE01000186unannotatedprotein:0.309801231,(((AFN37208|Nitrolancea_hollandica_Lb:0.039042664,AFN37205|Nitrolancea_hollandica_Lb:0.011623567)0.981:0.018883572,(AFN37207|Nitrolancea_hollandica_Lb:0.059889634,AFN37206|Nitrolancea_hollandica_Lb:0.035086850)0.741:0.017421853)1.000:0.237080104,((WP_005004540|Nitrococcus_mobilis:0.005243894,Nitrococcus_mobi_EAR23355:0.002640284)1.000:0.244172179,((WP_011314088|Nitrobacter_winogradskyi:0.002534990,(Nitrobacter_sp_Nb_311A_ZP_01048070:0.009400785,(A_Nitrobacter_hamburgensis_YP_578638:0.031550923,B_Nitrobacter_hamburgensis_YP_578186:0.023740548)1.000:0.053836401)0.978:0.022733577)0.963:0.016265428,Nitrobacter_winogradskyi_gb_ABA05326:0.037260949)1.000:0.216806507)0.880:0.055888930)1.000:0.201356108)0.974:0.063994885,(blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1348658_11:0.000000005,blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1581374_9:0.000000005)1.000:0.282418622)0.992:0.095642727)0.132:0.041822075)0.986:0.188699247)0.017:0.049701189)0.871:0.184584331)0.173:0.116759705)1.000:0.987285179)0.550:0.236304701,(providencecreek_2019_sw_WHONDRS-S19S_0007_B_bin.10_k121_1581149_4:0.472026440,(riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.130_k121_990031_60:0.325258151,(icacos_2019_sw_WHONDRS-S19S_0094_B_bin.166_k121_1114214_14:0.332187014,muddycreek_2019_sw_WHONDRS-S19S_0082_B_bin.95_k121_853774_5:0.705095308)0.418:0.106182937)0.994:0.312896913)1.000:0.774651657)1.000:0.778950754)0.975:0.154198707)1.000:0.231811834,((((cas150m_01921|CAS-150m-3753Perchloratereductasesubunitalphaprecursor:0.000877951,cas50m_02313|CAS-50m-4275Perchloratereductasesubunitalphaprecursor:0.000943888)1.000:0.055806636,(GCA_003523945_00056|DOFS01000023unannotatedprotein:0.004579427,DJ_nxrA:0.006504779)0.999:0.028051194)0.999:0.046515340,(DJ_nxrA2:0.074233359,DJ_nxrA1:0.060036576)0.694:0.026270877)0.990:0.045759227,(((((WP_053378142|Nitrospira_moscoviensis:0.008325164,(riogrande_2019_sw_WHONDRS-S19S_0066_A_bin.62_Ga0451725_0007910_5:0.012480447,GCA_002083555_01644|MSXN01000007unannotatedprotein:0.002680030)0.924:0.008235322)0.880:0.003077004,(((GCA_002420115_02525|DIHK01000043unannotatedprotein:0.012092376,GCA_002483475_03556|DLHZ01000062unannotatedprotein:0.002691200)1.000:0.023236403,(GCA_900078535_00262|FJVM02000053unannotatedprotein:0.014982211,(GCA_001458695_00808|LN885086unannotatedprotein:0.023036213,GCA_002451055_00821|DKBD01000269unannotatedprotein:0.007573759)0.688:0.003976613)0.390:0.001522946)0.694:0.004052451,GCA_002331335_02310|DCZO01000011unannotatedprotein:0.017101140)0.922:0.006393889)0.980:0.016473529,(riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.137_k121_1578656_32:0.002308752,GCA_002737345_00863|NSIK01000010unannotatedprotein:0.006832549)1.000:0.023034521)0.393:0.016407361,WP_080886776|Nitrospira_japonica:0.032980329)1.000:0.048957408,(((Baikal-deep-G159_00763|Baikal-deep-G159-c12unannotatedprotein:0.0,Baikal-deep-G158_01775|Baikal-deep-G158-c18unannotatedprotein:0.0):0.048648714,((CBK42946|Nitrospira_defluvii:0.0,NxrA2_Nitrospira_defluvii_YP_003798871:0.0):0.003132849,GCA_900170025_02937|FWEX01000006unannotatedprotein:0.002326236)1.000:0.046043049)0.987:0.028241355,((CUS31266|Nitrospira_nitrosa:0.032070423,CUS38776|Nitrospira_nitrificans:0.014206130)1.000:0.059565512,(GCA_001567445_02228|JZQY01000048unannotatedprotein:0.031898730,((CBK42928|Nitrospira_defluvii:0.0,NxrA1_Nitrospira_defluvii_YP_003798853:0.0):0.020188049,GCA_003456605_00391|DMQK01000091unannotatedprotein:0.020042828)0.973:0.029005902)1.000:0.049275974)0.916:0.026734542)0.987:0.030138243)0.163:0.019579673)1.000:0.351067665)0.984:0.079553236,((OGW90704|PVC_group_Omnitrophica_bacterium_RIFCSPHIGHO2_02_FULL_63_14:0.144751486,OGW87506|PVC_group_Omnitrophica_bacterium_RIFCSPLOWO2_01_FULL_45_10b:0.164104591)0.967:0.106906909,(((OUC07869|Chloroflexi_Litorilinea_aerophila:0.108541565,RCK74665|Chloroflexi_Anaerolineae_bacterium:0.109258954)1.000:0.169950317,(KRT77589|Armatimonadetes_bacterium_CSP1_3:0.210493116,KRT68888|NC10_bacterium_CSP1_5:0.135568128)0.411:0.038266264)0.915:0.031759119,(GBC85351|bacterium_sp_HR11:0.152552869,(GCA_002328125_01442|DCWK01000050unannotatedprotein:0.001947491,GCA_002685755_01556|NYYB01000002unannotatedprotein:0.001760896)1.000:0.300590274)1.000:0.072067691)0.853:0.038248286)0.986:0.048595639)0.582:0.046460101,((MSP_nxrA:0.025354205,(((MBL09191|Acidiferrobacteraceae_bacterium:0.033838550,TDJ60388|Nitrospina_sp:0.042298150)0.934:0.011901270,((Nitromaritima_KMP11423|SCGC_AAA799_A02:0.031363214,((GCA_002705185_00880|PAJA01000060unannotatedprotein:0.0,MAX17737|Nitrospina_sp:0.0):0.009948403,(GCA_001542995_01387|LFLA01000024unannotatedprotein:0.011368914,(GCA_002453875_01196|DKHT01000003unannotatedprotein:0.0,GCA_002454045_00625|DKID01000024unannotatedprotein:0.0):0.025625262)0.731:0.006753767)0.957:0.010197443)0.837:0.006601827,cas150m-4_02474|CAS-150m-4914Perchloratereductasesubunitalphaprecursor:0.016703925)0.925:0.009659103)0.780:0.008734629,PIQ99248|_Nitrospinae_bacterium_CG11_big_fil_rev_8_21_14_0_20_45_15:0.031915291)0.638:0.007806333)0.907:0.014421329,(WP_042250442|Nitrospina_gracilis:0.018020385,WP_042251421|Nitrospina_gracilis:0.040064063)0.228:0.014895744)1.000:0.388356661)1.000:0.140833958)0.990:0.036064959,((((WP_007222969|Jettenia_caeni:0.0,NxrA_planctomycete_KSU_1_ZP_10101005:0.0):0.002251376,TLD40744|Candidatus_Jettenia_ecosi:0.013337202)0.983:0.006913180,TLD41279|Candidatus_Jettenia_ecosi:0.021669001)0.000:0.000000005,WP_007220240|Jettenia_caeni:0.000000005)0.998:0.026966168)0.882:0.017606145,((WP_070067449|Brocadia_sapporoensis:0.003688908,(OQZ04816|Brocadia_sp_UTAMX1:0.003783493,RZV56287|Brocadia_sp_BROELEC01:0.003479253)0.233:0.001151055)0.997:0.020857077,(KKO18624|Brocadia_fulgida:0.021890769,(OOP55454|Brocadia_caroliniensis:0.024026386,(WP_052561322|Brocadia_sinica:0.000917852,KXK29028|Brocadia_sinica:0.000923980)1.000:0.023040103)0.993:0.017011726)0.725:0.010490186)0.877:0.013675102)0.965:0.015645586)0.779:0.007537636)0.931:0.007662564)0.935:0.007110293); diff --git a/assets/trees/nar_nxr/nar_nxr_color_map.tsv b/assets/trees/nar_nxr/nar_nxr_color_map.tsv deleted file mode 100644 index 27fa3bb2..00000000 --- a/assets/trees/nar_nxr/nar_nxr_color_map.tsv +++ /dev/null @@ -1,6 +0,0 @@ -"label" "color" -"nxr/nar-N utilization" "purple" -"other-None" "blue" -"narG-N reducer" "green" -"nxr-Nitrifier" "red" -"nxr-None" "orange" diff --git a/assets/trees/nar_nxr/nar_nxr_search_terms.txt b/assets/trees/nar_nxr/nar_nxr_search_terms.txt deleted file mode 100644 index 6bfb7b07..00000000 --- a/assets/trees/nar_nxr/nar_nxr_search_terms.txt +++ /dev/null @@ -1,13 +0,0 @@ -K00370 -K00371 -K00374 -nitrate reductase -nar -NAR -narG -narH -narI -narJ -EC: 1.7.99.4 -EC: 1.7.5.1 - diff --git a/assets/trees/nar_nxr/nar_nxr_seqs_for_tree_aligned.faa b/assets/trees/nar_nxr/nar_nxr_seqs_for_tree_aligned.faa deleted file mode 100644 index 8620f8d1..00000000 --- a/assets/trees/nar_nxr/nar_nxr_seqs_for_tree_aligned.faa +++ /dev/null @@ -1,5425 +0,0 @@ ->RBG1_10 -----------------------------------------------MTLSRRRFLKISSL -SAAGA---------LVDLPELKFLQFLET------VENPLEYYPNR------DW-EKIYR -DQYRY------DSSFTFVCT-PNDTHACRLRAYVRNGIVIRVEQAYDVQNYTDLYGNKAS -VMWSPRGCNKGYNLPRRVYGPYRVKHPMVRKGWKE----------WAE----------AG -FPDPTLPENQQKYF--RRGEDSWVKVSWDEGFELVAKGLLHTMEKYSGEKGAEIL-RKQG -YPEEMIEAM------HGSGAQTIKIRGAMPLLGATRIFGFYRFAN-MLGLYDGK------ ----LGARGWSNFSWHGDLPPGHPMVTGVKCSDPELNDFRHSKLLVFLGKNMVESKMADAH -WWIETIERGGKVVNISPEYSATSSKSDYWIPIRPG-TDTALLLGVTQIIIQEKLY----D -------QDFIKKHTDLPLLIRMDNLKLLRPTDIIKG---YK----------NQILTG--- ---------------YSVKVQKIKPELREKW---------GDFVVWDLKTKK--PQTVT-- --------REDLGEKIERKGL------N---------------------PALEGNY----- -------------------------------------KIKLV-NGKEIEVKTVFQL----- ----YKELLSE-YDLETVS-----------------------------QITGSPKNLIYQL -AQDL-----------ATIKPASIHTGEGVNHFFHCD-LVTRAVWLPLALTGNIGKPGA-N ---VGHWAGNYKGEVFD--------GLG--------------------------------- -------------------------------VYLNE-----DPFNPNLDPSAKLEDIKLKK -YYK------GEEVCYW-----NY---------------EDRPLIVKG----------KCF -TGKTHMPTP---TKAEWVGNGN-LLNNAKWAHN----------------MIANVE--GKV -EMIVYNEIEWTASCEYADVVFPVHSWMELTLPDMTASCSN-PFLQV----W-KGGIKPIF -DTKQDNEVLAGVAAKLSELT---------------------------------------- ----------------HDNRY--KDYWKF-------------------------VLEG--- --------------------------------NNEVYLQRILDACSTTKGYKIDELL-KSD ------RG----WLMNFRT----Y-PRIPFW----EQIQESK--PFYTKT----------- --------------------GRMEFYREEDEFIDYGENLIVHREPVEATPYL--PNVILG- -THKAIR---PNSYGISPESIN---ADERQVRNLKMSWKQVKLSKNPLWEKGFRFYCLTPK -SRHTVHSSWSVLDWNMIWQSNFGDPYRMDNRTPGVGEHQMHMNPLDAKELGINDGDYAYV -DANPEDRPYTGWKEEDPFYKVSRLMVRVKYNPAYPRGITMIKHASFIATHKSVKAHESRP -DKRAVSED-TGYQSSFRYGSQQSIT---RGWLQPTMMTDSLVRKNYMGQEIGEGYEIDVN -APN-TCPKETLVKIIKAE-DGGMGGKGKW---EPARTGYTPAG--ENKDMKKFLEGGFIL -KV-- ->cas150m_01921|CAS-150m-3753Perchloratereductasesubunitalphaprecursor -----------------------------------------------MFLSRRQFLKVTTG -TVAAVA--------LADKALA--LTALQP--VVE-VGNPLGEYPDR------AW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRVRSFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTMHRRVYGPYRLKGPLMRRGWKA----------WMD----------AG -SPEFT-PDVMSKYKFNARYLDDMLRVSWDTAFTYIAKAMLIISERYSGEAGARRL-REQG -YPPEMIEMS------KGSGVRTFKFRAGMPILGVIGKMGITRMNGGCGALLDTYIRKVKP -NQAQGGRYWSNYTWHGDQNPAHPFWSGVQTSDIDMNDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARCVVITPEYNPTAYRADYWIPVRPA-TDAALFLGACKIIFDENMH----D -------HDFCAAYTDMPILVRTDTLQYLDPRDVIQG---YA---------LPDFSKT--- ---------------YSGKVQTLDPAKIARL---------GGFMVWDINKNS--AVPIH-- --------RELVGWHFRNSGI------E---------------------PAMTGSY----- -------------------------------------RVKLL-NGREVDVLPVFQM----- ----YQAHLQD-YDLDTCH-----------------------------QINRAPKDLIVRW -ARDS-----------GTVKPAAIHNGEGTNHYFHQT-IIARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGIWC-ATPWSGGGLG--------------------------------- -------------------------------THTAE-----NPFKITLDPNAHGKEVHVKG -YYY------GEEVAYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNAKHHYD----------------MVKNVD--PHI -ETLITQDVEMTSDVNHNDVAMGVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLTEMT---------------------------------------- ----------------GDKRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYVQRLLDASSTAYGYSVDTML-KSE ------KG----WMVMCRT----Y-PRQPFW----EETNESK--PQWTRT----------- --------------------GRYENYRIEPEAIEYGENFISHREGTEATPYL--PNAIMT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIALPWQEIKRYSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQLHVNPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAFPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAMD-TGYQSNFRYGAQQSFT---RDWLMPMHQLDSLPGKHAVAWKFKFGYQVDNH -AVN-TVPKECLMRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->cas50m_02313|CAS-50m-4275Perchloratereductasesubunitalphaprecursor -----------------------------------------------MFLSRRQFLKVTTG -TVAAVA--------LADKALA--LTALQP--VVE-VGNPLGEYPDR------AW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRVRSFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTMHRRVYGPYRLKGPLMRRGWKA----------WMD----------AG -SPEFT-PDVMSKYKFNARYLDDMLRVSWDTAFTYIAKAMLIISERYSGEAGARRL-REQG -YPPEMIEMS------KGSGVRTFKFRAGMPILGVIGKMGITRMNGGCGALLDTYIRKVKP -NQAQGGRYWSNYTWHGDQNPAHPFWSGVQTSDIDMNDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARCVVITPEYNPTAYRADYWIPVRPA-TDAALFLGACKIIFDENMH----D -------HDFCAAYTDMPILVRTDTLQYLDPRDVIQG---YA---------LPDFSKT--- ---------------YSGKVQTLDPAKIARL---------GGFMVWDINKNS--AVPIH-- --------RELVGWHFRNSGI------E---------------------PAMTGSY----- -------------------------------------RVKLL-NGREVDVLPVFQM----- ----YQAHLQD-YDLDTCH-----------------------------QINRAPKDLIVRW -ARDS-----------GTVKPAAIHNGEGTNHYFHQT-IIARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGIWC-ATPWSGGGLG--------------------------------- -------------------------------THTAE-----NPFKITLDPNAHGKEVHVKG -YYY------GEEVAYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNAKHHYD----------------MVKNVD--PHI -ECLVTQDVEMTSDVNHNDVAMGVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLTEMT---------------------------------------- ----------------GDKRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYVQRLLDASSTAYGYSVDTML-KSE ------KG----WMVMCRT----Y-PRQPFW----EETNESK--PQWTRT----------- --------------------GRYENYRIEPEAIEYGENFISHREGTEATPYL--PNAIMT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIALPWQEIKRYSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQLHVNPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAFPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAMD-TGYQSNFRYGAQQSFT---RDWLMPMHQLDSLPGKHAVAWKFKFGYQVDNH -AVN-TVPKECLMRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->GCA_003523945_00056|DOFS01000023unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------LADKALA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTMHRRVYGPYRLKGPLMRRGWKA----------WMD----------DG -SPEFT-PAVMTKYKFNARYLDDMLRVSWDTAFTYLAKAMIIIAERYSGEAGARRM-REQG -YPPEMIEMT------KGSAIRSFKFRAGMPILGLIGKMGITRMNGGCGALLDTYIRKVQP -DQAQGGRYWSNYTWHGDQNPAHPFWNGVQASDVDMNDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARLVVITPEYNPTAYRADYWMPVRPA-TDGALFLGALKIIFDENLY----D -------YDFCQSYTDMPILVRTDTLQYLDPREVIKD---YA---------FPDFANS--- ---------------YSGKVQTMKPDVIARL---------GGFMVWDLSKNQ--AVPIH-- --------RELVGWHYRKSGI------D---------------------SALTGTY----- -------------------------------------RVTLL-NGREVDVMPIFQM----- ----YQVHLQD-YDLDTVH-----------------------------QINRCPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTNHYFHQT-IIARGAAMVLIVTGNVGKFGT-G ---QHTWAGNYKAGIWN-ATPWGGGGLG--------------------------------- -------------------------------THTGE-----NPFKITTDPNAHGKEIHVKG -YYY------GEEVAYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNAKHHYD----------------MVKNVD--PHI -ETLVNQDVEMTSDVNHNDVSFAVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLSEMT---------------------------------------- ----------------GDGRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYLQRILDASTTAYGYNADVML-KSE ------KG----WMVMCRT----Y-PRHPFW----EETNESK--PQWTRT----------- --------------------GRYENYRVEPECIEYGENFISHREGTEATPYL--PNAIMS- -SNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWQEIKRYSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIALD-TGYQSNFRYGAQQSFT---RDWLMPMQQLDSLPGKHAVGWKFKFGYQVDNH -AVN-TVPKECLIRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->DJ_nxrA -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------LADKALA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTMHRRVYGPYRLKGPLMRRGWKA----------WMD----------DG -SPEFT-PAIMSKYKFNARYLDDMLRVSWDTAFTYLAKAMIIIAERYSGEAGARRL-REQG -YPPEMIEMT------KGSAIRAFKFRAGMPILGLIGKMGITRMNGGCGALLDTYIRKVQP -DQAQGGRYWSNYTWHGDQNPAHPFWNGVQASDVDMNDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARLVVITPEYNPTAYRADYWMPVRPA-TDGALFLGALKIIFDENMY----D -------YDFCQSYTDMPILVRTDTLQYLDPREVIKD---YA---------FPDFANS--- ---------------YSGKVQTMKPDVIARL---------GGFMVWDLNKNQ--AVPLH-- --------RELVGWHYRKSGI------D---------------------SALTGTY----- -------------------------------------RVTLL-SGREVDVMPIFQM----- ----YQVHLQD-YDLDTVH-----------------------------QINRCPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTNHYFHQT-IIARGAAMVLIVTGNVGKFGT-G ---QHTWAGNYKAGIWN-ATPWGGGGLG--------------------------------- -------------------------------THTGE-----NPFKITTDPNAHGKEIHVKG -YYY------GEEVAYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNAKHHYD----------------MVKNVD--PHI -ETLVNQDVEMTSDVNHNDISFAVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLSEMT---------------------------------------- ----------------GDGRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYLQRILDASTTAYGYNADVML-KSE ------KG----WMVMCRT----Y-PRHPFW----EETNESK--PQWTRT----------- --------------------GRYENYRVEPEAIEYGENFISHREGTEATPYL--PNAIMS- -SNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWAEIKRYSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVFV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIALD-TGYQSNFRYGAQQSFT---RDWLMPMQQLDSLPGKHAVGWKFKFGYQVDNH -AVN-TVPKECLIRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->DJ_nxrA2 -----------------------------------------------MLVTKRQFLKITAG -TVAAVA--------LADNALA--LTALQP--VVE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDMYGNRGT -FAHNPRMCLKGYTYHRRVYGPYRLKGPLMRRGWKA----------WMD----------DG -SPELD-PTVMTKYKFSARYLDDMLRVSWDTAFTYLAKAMIVIANRYSGEAGARRL-REQG -YPPEMIEMM------KGSGVRSMKFRAGMPVLGVIGKMGITRMNGGCGALLDSWVRKVGP -DSAQGGRYFNNLTWHGDQDPSQPFWSGAQAIDCDLSDMRFSKMNTSWGKNFVENKMPEAH -WKLESIERGGRVVVITPEYNPTAQRADYWMPVRPE-TDGALFLGACKIILDDGLQ----D -------NDFIRSSTDFPLLIRTDTLQYLDPRDVIKD---YA---------FPDFSKS--- ---------------YSGKVQGLSPSQIARL---------GGFMVWDLNQDK--AVPLH-- --------RELVGWHFKKSGI------D---------------------PALTGSF----- -------------------------------------RVKLL-SGREADVMPLFQM----- ----YQVHLQD-YDLDTVH-----------------------------QINRCPKDLIVRW -ARDN-----------GTIKPAAIHNGEGVCHYFHMT-SMGRAAAMVMTLTGNMGKFGS-G ---CHTWSGNYKVGVWA-ATPWSGEGIG--------------------------------- -------------------------------IHTGE-----NPFKITTDPNAHGKEINYRP -YYY------GEETTYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKLRWVANVN-ILNNSKHHYD----------------MVKNVD--PHI -ETIVTQDIEMTSDVNHADVSFAVNGWMEFTYPEMTATVSN-PWMQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLTEMT---------------------------------------- ----------------GDGRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYVQRLLDAGSTSYGYSADTML-KSE ------KG----WMVMTRT----Y-PRIPLW----EETNESK--PMWTRS----------- --------------------GRLETYRVEPEAIEYGENFISHREGTEATPYL--PNAIMS- -SNPYIR---PDDYGIPITAQH---HDDKTVRNIKLPWAEIKRYANPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQIHVNPSAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAFPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIALD-TGYQSNFRYGAQQSFT---RSWLMPMHQLDSLPGKMANKWKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->DJ_nxrA1 -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------LADKALA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTMHRRVYGPYRLKGPLMRRGWKQ----------WMD----------DG -SPEFT-PAIQTKYKFNARYLDDMLRVSWDTAFTYLAKAMIVIANRYSGEYGARKL-REQG -YPPEMIEMM------KGSGVRAFKFRAGMPVLGIIGKMGITRMNGGCGALLDSWVRKVGP -ENAQGGRYWNNYTWHGDQDPSQPWWNGTQNCDIDLSDMRFCKFNTSWGKNFVENKMPEAH -WKLESIERGARIAVITPEYNPTAYRADYWIPIRPE-SDGSFFLGACKMIVDEGLF----D -------ADFVRANTDMPLLVRTDTLQYLDPRDVIKD---YQ---------FPDFSNT--- ---------------YSGKVQTLKPAEIARL---------GGIMVWDLNKNQ--AVPIH-- --------RELVGWHFKKSGI------D---------------------PALTGTH----- -------------------------------------RVRLL-TGREVDVMPIFQM----- ----YQVHLQD-YDLDTVH-----------------------------QICRSPKDLIVRW -ARDM-----------GTVKPAAIHNGEGVCHYFHMT-QNGRAAALTLIYSGNMGKFGS-G ---CHTWSGNYKAGTWA-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFKITTDPNAHGKEIKTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRRVF -TGKTHMPTP---SKFRWVANVN-VLNNSKHHYD----------------MVKNVD--PHN -ECLVHQEVEMTSDVNHFDVSFAVNTWMEFTYPEHTATVSN-PWFQV----W-KGGIRPLY -DTRNDLDTVAGVAAKLTEMT---------------------------------------- ----------------GDGRF--RDYFKF-------------------------VYDN--- --------------------------------RVDVYLQRLLDAGNCSYGYNADTML-KSE ------KG----WMVMTRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRVETYRVEPEAIEYGENFIVHREGPEATPYL--PNAIMS- -SNPYIR---PDDYGVPITAQH---HDDKTVRNIKLPWAEIKRYANPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQMYESNFGDAYRMDKRTPGVGEHQIHINPSAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAFPYHVTMAKHAPFVSTAKSVKGHETRP -DGRAIALD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHPVAWKFKWGFAIDHH -AVN-TTPKECLIRITKAE-DGGIGGRGPW---EPVRTGFTPGQ--ENEFMIKWLKGDHIK -IKV- ->GCA_001567445_02228|JZQY01000048unannotatedprotein ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------MPIFQL----- ----YQVHLQD-YDLDTVH-----------------------------QVNRSPKDLIVRW -ARDC-----------GTIKPAAIHNGEGVCHYFHMT-SMGRAAALVMMLTGNIGKFGT-G ---CHTWSGNYKVGIWQ-AAPWSGAGAS--------------------------------- -------------------------------VYLGE-----DPWNLNLTTDAHGKEIKYRK -YYY------GEEPGYW-----NH---------------GDNALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVVNVN-ILNNSKHHYD----------------MVKNVD--PNI -EMLVTQDIEMTSDVNHADVAFAVNSWMEFTYPEMTATVSN-PWIQI----W-KGGIRPLY -DTRNDADTFAGVSAKLKELT---------------------------------------- ----------------GEARM--ADTYRF-------------------------VYQN--- --------------------------------RMDIYVQRILDASTTFYGYSADVML-KSE ------KG----WMVMCRT----Y-PRHPLW----EETNESK--PHWTRS----------- --------------------GRLESYRIEPEAIEYGENFIVHREGPECTPYL--PNAIMS- -TNPYIR---PDDYGIPITAQH---HDDKTVRNIKLPWQEIKRHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYCFV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHTIAWKFKWGYAIDHH -GIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->CBK42928|Nitrospira_defluvii ----------------------------------------------MMQLSRRQFLKVSAG -TVAVAA--------VADKALA--LTALQP--VVE-VNNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-SDVKRKYKFDSRFLDDMVRVSWDTAFTYVAKGLIVIGTRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPILGMMGKHANTRFNNCVLPLLDSWIRKVNP -DQAQGGRYWNNYTWHGDQDPSQPWWNGTQNCDVDLSDMRFTKLNTSWGKNFVENKMPEAH -WKLESMERGARLVIITPEYNPTASRADYWIPVRPE-TDGALFLGASKIILDENYQ----D -------IDFIKGFTDMPLLVRTDTLQYLDPHEVLKD---YQ---------VPDFTKS--- ---------------YSGRVQGLSQDQVQRL---------GGMMVWDLAKGK--AVPLH-- --------REQVGVHLAQSGI------D---------------------PALTGTY----- -------------------------------------RIKLL-NGREVDVMPIYQL----- ----YTIHLQD-YDLDTVH-----------------------------QVNRAPKDLIVRW -ARDC-----------GTVKPAAIHNGEGVCHYFHMT-SMGRAAALVMMLTGNIGKFGT-G ---CHTWSGNYKVGIWQ-AAPWSGAGAS--------------------------------- -------------------------------VYLGE-----DPWNLNLRDDVHGKEIKYRK -YYY------GEEPGYW-----NH---------------GDNALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVVNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMLVTQDIEMTSDVNHADVAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFAGVAAKLKEMT---------------------------------------- ----------------GEQRM--ADTYKF-------------------------VYHN--- --------------------------------RVDIYVQRILDASTTFFGYSADVML-KSE ------KG----WMVMCRT----Y-PRHPLW----EETNESK--PHWTRS----------- --------------------GRLETYRIEPEAIEYGENFISHREGPECTPYM--PNAIMT- -TNPYVR---PEDYGIPVTAQH---HDDKTVRNIKLPWSEIKQHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYCYV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKQANALKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMVKWLKGEHIK -IKV- ->NxrA1_Nitrospira_defluvii_YP_003798853 ----------------------------------------------MMQLSRRQFLKVSAG -TVAVAA--------VADKALA--LTALQP--VVE-VNNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-SDVKRKYKFDSRFLDDMVRVSWDTAFTYVAKGLIVIGTRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPILGMMGKHANTRFNNCVLPLLDSWIRKVNP -DQAQGGRYWNNYTWHGDQDPSQPWWNGTQNCDVDLSDMRFTKLNTSWGKNFVENKMPEAH -WKLESMERGARLVIITPEYNPTASRADYWIPVRPE-TDGALFLGASKIILDENYQ----D -------IDFIKGFTDMPLLVRTDTLQYLDPHEVLKD---YQ---------VPDFTKS--- ---------------YSGRVQGLSQDQVQRL---------GGMMVWDLAKGK--AVPLH-- --------REQVGVHLAQSGI------D---------------------PALTGTY----- -------------------------------------RIKLL-NGREVDVMPIYQL----- ----YTIHLQD-YDLDTVH-----------------------------QVNRAPKDLIVRW -ARDC-----------GTVKPAAIHNGEGVCHYFHMT-SMGRAAALVMMLTGNIGKFGT-G ---CHTWSGNYKVGIWQ-AAPWSGAGAS--------------------------------- -------------------------------VYLGE-----DPWNLNLRDDVHGKEIKYRK -YYY------GEEPGYW-----NH---------------GDNALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVVNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMLVTQDIEMTSDVNHADVAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFAGVAAKLKEMT---------------------------------------- ----------------GEQRM--ADTYKF-------------------------VYHN--- --------------------------------RVDIYVQRILDASTTFFGYSADVML-KSE ------KG----WMVMCRT----Y-PRHPLW----EETNESK--PHWTRS----------- --------------------GRLETYRIEPEAIEYGENFISHREGPECTPYM--PNAIMT- -TNPYVR---PEDYGIPVTAQH---HDDKTVRNIKLPWSEIKQHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYCYV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKQANALKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMVKWLKGEHIK -IKV- ->GCA_003456605_00391|DMQK01000091unannotatedprotein ----------------------------------------------MMQVSRRQFLKVSAG -TVAAAA--------VADKALA--LTALQP--VVE-VDNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-SDVKRKYKFDSRFLDDMVRVSWDTAFTYVAKGLVVIGTRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPILGMMGKHANTRFNNCVLPLLDSWIRKVNP -DQAQGGRYWNNYTWHGDQDPSQPWWNGTQNCDVDLSDMRFTKLNTSWGKNFVENKMPEAH -WKLESIERGARLVVITPEYNPTASRADYWIPVRPE-TDGALFLGASKIILDENYQ----D -------IDFIKGFTDMPLLVRTDTLQYLDPYEVVKE---YQ---------LPDFTKS--- ---------------YSGRIQGLTQDHIRRL---------GGMMVWDLAKGQ--AVPLH-- --------REQVGLHFAQTGI------D---------------------PALTGTY----- -------------------------------------RVKLL-NGREIDVMPVYQM----- ----YTIHFQD-YDLDTVH-----------------------------QINRAPKDLIVRW -ARDC-----------GTVKPAAIHNGEGVCHYFHMT-SMGRAAALVMMLTGNIGKFGT-G ---CHTWSGNYKVGIWQ-AAPWSGAGAS--------------------------------- -------------------------------VYLGE-----DPWNLNLKDDVHGKEIKYRK -YYY------GEEPGYW-----NH---------------GDNALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVVNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMLVTQDIEMTSDVNHADVAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFSGVAVKLKEIT---------------------------------------- ----------------GDQRM--ADTYKF-------------------------VYQN--- --------------------------------RVDIYVQRILDASSTFFGYSADVML-KSE ------KG----WMVMCRT----Y-PRHPLW----EETNESK--PHWTRS----------- --------------------GRLESYRIEPEAIEYGENFISHREGPECTPYL--PNAIMT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWSEIKQQANPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYCYV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQANFRYGAQQSFT---RSWLMPMHQTDSLPGKQANAMKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMAKWLKGEHIK -IKV- ->Baikal-deep-G159_00763|Baikal-deep-G159-c12unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAAA--------VADKALA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTFHRRVYGPYRLKGPLMRKGWKE----------WMD----------AG -SPELT-PDVKRKYKFDARMLDDMVRASWDTAFTYVAKACILIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIIGKMMNTRFNGGVLPVLDSWIRKVDP -DKAQGGKYYSNYTWHGDQDPSHPWWNGTQNCDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPVRPE-TDGANFLGACKIIIDENMQ----D -------IDYIKGYTDMPLLVRTDTLQYLDPREVIAD---FK---------FPDFSKS--- ---------------YSGRVQSLKPEQIERL---------GGMMVWDNNKKA--AVPLH-- --------REQVGWHYQNSGI------D---------------------AALTGTY----- -------------------------------------RVKLI-NGREVDVAPIWQM----- ----YMVHFQD-YDLDTVH-----------------------------QITRSPKDLIVRY -GRDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAALMMTITGNIGKFGT-G ---CHTWSGNYKAGVWN-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNQTLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIITQDIEMTSDVNHADVAFACNSWMEFTYPEMTATVSN-PWLQI----W-KGGIRPLY -DTRNDADTFGGVAVKLTELT---------------------------------------- ----------------GDARI--RQVFHF-------------------------VYQN--- --------------------------------RVDVYVQRALDASATCYGYNADTML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFVVHREGPECTPYL--PNAIFS- -TNPYVR---PDDYGIPITAQH---HDDKHIRNLKLPWTEIKRQSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYIYV -DGNPVDRPYRGWKPSDPFYKVSRLMIRAKYNPAFPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHAIAWKFKWGYAIDHH -AVN-TTPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->Baikal-deep-G158_01775|Baikal-deep-G158-c18unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAAA--------VADKALA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGYTFHRRVYGPYRLKGPLMRKGWKE----------WMD----------AG -SPELT-PDVKRKYKFDARMLDDMVRASWDTAFTYVAKACILIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIIGKMMNTRFNGGVLPVLDSWIRKVDP -DKAQGGKYYSNYTWHGDQDPSHPWWNGTQNCDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPVRPE-TDGANFLGACKIIIDENMQ----D -------IDYIKGYTDMPLLVRTDTLQYLDPREVIAD---FK---------FPDFSKS--- ---------------YSGRVQSLKPEQIERL---------GGMMVWDNNKKA--AVPLH-- --------REQVGWHYQNSGI------D---------------------AALTGTY----- -------------------------------------RVKLI-NGREVDVAPIWQM----- ----YMVHFQD-YDLDTVH-----------------------------QITRSPKDLIVRY -GRDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAALMMTITGNIGKFGT-G ---CHTWSGNYKAGVWN-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNQTLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIITQDIEMTSDVNHADVAFACNSWMEFTYPEMTATVSN-PWLQI----W-KGGIRPLY -DTRNDADTFGGVAVKLTELT---------------------------------------- ----------------GDARI--RQVFHF-------------------------VYQN--- --------------------------------RVDVYVQRALDASATCYGYNADTML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFVVHREGPECTPYL--PNAIFS- -TNPYVR---PDDYGIPITAQH---HDDKHIRNLKLPWTEIKRQSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYIYV -DGNPVDRPYRGWKPSDPFYKVSRLMIRAKYNPAFPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHAIAWKFKWGYAIDHH -AVN-TTPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->CBK42946|Nitrospira_defluvii ---------------------------------------------MQVSVSRRQFLKISAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHGCRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PDVKRKYKFDSRFLDDLNRVSWDTAFTYVAKAAVLIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIVGKMMNTRFNGGCLPLLDSWIRKVDA -EKAQGGKYYSNYTWHGDQDPSHPFWNGTQNCDVDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPVRPE-TDGANFLGAAKIIFDENLQ----D -------IDYIKEFTDLPLLVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQVERL---------GGMMVWDLAKGK--AVPLH-- --------REQVGFHFKESGI------D---------------------PALTGTF----- -------------------------------------RVKLL-NSREIDVMPIYQM----- ----YQVHLQD-YDLDTTH-----------------------------QITRAPKDLIVRW -ARDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAAFIMTITGNIGKFGT-G ---CHTWSGNYKAGIWN-AVPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNLTLDPNAHGKEIKTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIVTQDIEMTSDVNHADVAFACNSWMEFTYPEMTGTVSN-PWIQI----W-KGGIRPLY -DTRNDADTFAGVAAKLAEMT---------------------------------------- ----------------GDARF--RGVFHF-------------------------VYMN--- --------------------------------RVDVYPQRMLDASATCYGYSADVML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFISHREGPECTPYL--PNAIFS- -NNPFIR---PDDYGIPITAQH---HDDKHVRNIKLPWAEIKRHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVFV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHTIAWKFKWGYAIDHH -GIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->NxrA2_Nitrospira_defluvii_YP_003798871 ---------------------------------------------MQVSVSRRQFLKISAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHGCRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PDVKRKYKFDSRFLDDLNRVSWDTAFTYVAKAAVLIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIVGKMMNTRFNGGCLPLLDSWIRKVDA -EKAQGGKYYSNYTWHGDQDPSHPFWNGTQNCDVDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPVRPE-TDGANFLGAAKIIFDENLQ----D -------IDYIKEFTDLPLLVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQVERL---------GGMMVWDLAKGK--AVPLH-- --------REQVGFHFKESGI------D---------------------PALTGTF----- -------------------------------------RVKLL-NSREIDVMPIYQM----- ----YQVHLQD-YDLDTTH-----------------------------QITRAPKDLIVRW -ARDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAAFIMTITGNIGKFGT-G ---CHTWSGNYKAGIWN-AVPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNLTLDPNAHGKEIKTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIVTQDIEMTSDVNHADVAFACNSWMEFTYPEMTGTVSN-PWIQI----W-KGGIRPLY -DTRNDADTFAGVAAKLAEMT---------------------------------------- ----------------GDARF--RGVFHF-------------------------VYMN--- --------------------------------RVDVYPQRMLDASATCYGYSADVML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFISHREGPECTPYL--PNAIFS- -NNPFIR---PDDYGIPITAQH---HDDKHVRNIKLPWAEIKRHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVFV -DGNPVDRPYRGWKPSDPFYKVARLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHTIAWKFKWGYAIDHH -GIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_900170025_02937|FWEX01000006unannotatedprotein ---------------------------------------------MQVSVSRRQFLKISAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHGCRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PDVKRKYKFDSRFLDDLNRVSWDTAFTYVAKAAVLIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRTFKHRAGMPVLGIVGKMMNTRFNGGCLPLLDSWIRKVDA -DKAQGGKYYSNYTWHGDQDPSHPFWNGTQNCDVDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGARIVVITPEYNPTAYRADYWIPLRPE-TDGANFLGAAKIIFDENLQ----D -------IDYIKEFTDLPLLVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQVERL---------GGMMVWDLAKGK--AVPLH-- --------REQVGFHFKESGI------D---------------------PALTGTF----- -------------------------------------RVKLL-NGREIDVMSIYQM----- ----YQVHLQD-YDLDTTH-----------------------------QITRAPKDLIVRW -ARDS-----------GTIKPAAMHNGEGVCHYFHMT-EMGRAAAFIMTITGNIGKFGT-G ---CHTWSGNYKAGIWN-AVPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNLTLDPNAHGKEIKTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPSP---SKVRWVTNVN-ILNNAKHHYD----------------MVKNVD--PNI -EMIVTQDIEMTSDVNHADVAFACNSWMEFTYPEMTGTVSN-PWIQI----W-KGGIRPLY -DTRNDADTFAGVAAKLAEMT---------------------------------------- ----------------GDARF--RGVFHF-------------------------VYMN--- --------------------------------RVDVYPQRMLDASATCYGYSADVML-KSE ------KG----WMVMGRT----Y-PRHPLW----EETNESK--PQWTRS----------- --------------------GRIETYRIEPEAIEYGENFISHREGPECTPYL--PNAIFS- -NNPFIR---PDDYGIPITAQH---HDDKHVRNIKLPWAEIKRHPNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVFV -DGNPVDRPYRGWKPSDPFYKVSRLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHTIAWKFKWGYAIDHH -GIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->CUS31266|Nitrospira_nitrosa -----------------------------------------------MVITRRQFMKASAG -TIAAIA--------VADKVLA--LTALQP--VTE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLIRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFASRFLDDMLRVSWDTAFTYAAKAMVVIATRYSGEAGARRL-REQG -YAPEMVEMM------KGAGVRCFKHRAGMPILGFIGKHSNTRFNNSVLPVLDTWVRKVGP -DQAQGGRYWNNYTWHGDQDPSQPFWNGTQNCDVDLSDMRFTKFNTSWGKNFVENKMPEAH -WKLESIERGARLAVITPEYNPTAQRADYWIPLRPQ-SDGALFLGACKIILDENMH----D -------VDYLKQFTDMPLLVRTDTLQYLDPREVIPD---YK---------FPDFSHS--- ---------------YSGRIQALKPEYIERL---------GGFMVWDLAKQK--AVPLH-- --------REQVGWHFDSSGI------Q---------------------PALTGTY----- -------------------------------------RVKLL-NGREIDAQPIYQM----- ----YQIHFQD-YDLDTTH-----------------------------QITRSPKDLLVRW -ARDS-----------GTIKPAAIHNGEGVCHYFHMT-SNGRAAALVLTLTGNIGKFGS-G ---CHTWSGNYKVGIWS-ATPWSGSGSG--------------------------------- -------------------------------VHLSE-----DPWQINLDPNAHGKEIKYKS -YYY------GEEPGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKLRWVVNVN-LLNNAKHHYD----------------MVRNVD--PNI -ECLITQDIEMTSDVNHADIAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDADTFAGVAARLAEIT---------------------------------------- ----------------GEKRM--RDVFHF-------------------------VYEN--- --------------------------------RVDVYAQRLLDASSTFYGYSADVLL-KSE ------KG----WMVMVRT----Y-PRHPLW----EETNESK--PMWTRS----------- --------------------GRIESYRVEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPHVR---PDDYGIPVTAQH---HDDKTIRNIKLPWVEIKRHTNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQVHINPQAAKDRGINDGDYVYI -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTPKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKSANGLKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->CUS38776|Nitrospira_nitrificans -----------------------------------------------MLVSRRQFMKATAG -TIAAAA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WAD----------DG -SPELT-PEAKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIVIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGVRCFKHRAGMPILGFIGKHSNTRFNNSVLPLLDTWIRKVGP -DQAQGGRYWNNYTWHGDQDPSQPFWNGTQNCDVDLSDMRFTKFNTSWGKNFVENKMPEAH -WKLESIERGARIAVITPEYNPTAQRADYWIPLRPQ-SDGALFLGACKIILDENMQ----D -------IDYLKQFTDMPLLVRTDTLQYLDPRDVIQD---YK---------FPDFSHS--- ---------------YSGRIQALKPEYIERL---------GGFMVWDMAKKQ--AVPLH-- --------REQVGWHFDKSGI------E---------------------PALTGTY----- -------------------------------------RVKLL-NGREIDALPIYQL----- ----YLIHLQD-YDLDTTH-----------------------------QITRSPKDLLVRW -ARDS-----------GTIKPAAIHNGEGVCHYFHMT-ANGRAAALVLTLTGNIGKFGS-G ---CHTWSGNYKVGIWN-ATPWSGVGGG--------------------------------- -------------------------------VHLSE-----DPWHINLDANAHGKEIKYRN -YYY------GEEPAYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-LLNNAKHHYD----------------MVRNVD--PNI -ECLITQDIEMTSDVNHADIAFAVNSWMEFTYPEMTATVSN-PWVQI----W-KGGIRPLY -DTRNDADTFAGVAAKLAEIT---------------------------------------- ----------------GEKRM--RDVFHF-------------------------VYEN--- --------------------------------RVDVYAQRLLDASSTFYGYSADVLL-KSE ------KG----WMVMVRT----Y-PRHPLW----EETNESK--PMWTRS----------- --------------------GRIESYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYVR---PDDYGIPIAAQH---HDDKMIRNIKLAWQEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQVHINPQAAKDRGINDGDYVYI -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKSANGLKFKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->WP_080886776|Nitrospira_japonica ---------------------------------------------MTMFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMMRVSWDTAFTYAAKSMIVIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDTWIRKVTS -DQAQGGRYWSNYTWHGDQNPSQPWWCGAQASDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLESIERGGRIVVITPEYNPTAYRADYWMPLRPQ-SDGAIFLGAMKIITDENMH----D -------IDFLKGYTDAPVLVRTDTLQFVDPRDVVRD---YK---------FPDFSKS--- ---------------YSGRVQTLKPEQVERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYSNSGI------D---------------------AALTGTY----- -------------------------------------RIKLL-NGREIDVMPVWQL----- ----YLVHFQD-YDLDTVH-----------------------------QICRTPKDLLVRW -ARDS-----------GTVKPAAIHNGEGTNHYFHMT-VNSRGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWV-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVTNVN-VLNNAKHHYD----------------MVRNVD--PSI -ETLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTVTVSN-PWVQV----W-KGGIRPLY -DTRNDLDTFAGVAAKLSEIT---------------------------------------- ----------------GDKRM--RDYFAM-------------------------VYMN--- --------------------------------RVDVYVQRLLDASATFYGYSADTML-KSE ------KG----WMVMVRT----Y-PRVPFW----EETNESK--PMWTRT----------- --------------------GRFETYRTEPEAIEYGENFISHREGTEATPYL--PNAIMT- -SNPYCR---PDDYGIPITAQH---HDDKTVRNIKLPWSEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RSWLMPMHQTDSLPGKHANGLKWKWGFEIDHH -AVN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.137_k121_1578656_32 rank: A; nmv:NITMOv2_4538 putative Nitrite oxidoreductase, alpha subunit; K00370 (db=kegg) -----------------------------------------------MFLSRRQFLKVSVG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKE----------WMD----------AG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGVNALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPFWCGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPA-SDGAIFLGAMKIIVDENMH----D -------VDFLKGYTDSPVLVRTDTLQFLDPRDVVAD---YK---------FPDFSKS--- ---------------YSGRVQSLKPEQVERL---------GGMMVWDLNKKA--AVPLH-- --------REQVGWHYQNSGI------D---------------------AALTGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTCH-----------------------------QICRTPKDLLVRW -ARDS-----------GSIKPAAIHNGEGTNHYFHQT-INSRGAAMVLIVTGNVGKFGT-G ---QHTWAGNYKAGTWT-STPWSGAGIA--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFAANSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--RDYFKF-------------------------VYEN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRTPFW----EETNESK--PMWTRT----------- --------------------GRYENYRTEPEAIEYGENFISHREGTEATPYL--PNAIMT- -SNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWQEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVATPKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQLDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002737345_00863|NSIK01000010unannotatedprotein -----------------------------------------------MFLSRRQFLKVSVG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKE----------WMD----------AG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIVIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRTFKHRAGMPVLGIIGKMGNTRMNGGVNALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPFWCGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPA-SDGAIFLGAMKIIVDENMH----D -------VDFLKGYTDSPVLVRTDTLQFLDPREVVAD---YQ---------FPDFSKS--- ---------------YSGRVQSLKPEGIARL---------GGMMVWDLNKKA--AVPLH-- --------REQVGWHYQNSGI------D---------------------AALTGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTCH-----------------------------QICRTPKDLLVRW -ARDS-----------GSIKPAAIHNGEGTNHYFHQT-INSRGAAMVLIVTGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGIA--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFAANSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDSFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--RDYFKF-------------------------VYEN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRTPFW----EETNESK--PMWTRT----------- --------------------GRYENYRTEPEAIEYGENFISHREGTEATPYL--PNAIMT- -SNPYVR---PDDYGIPITAQH---HDDKTVRNIKLPWAEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVSTPKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQLDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002420115_02525|DIHK01000043unannotatedprotein -----------------------------------------------MFLSRRQFLKVSVG -TVAAAA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDSWIRKVSP -DQAQGGRYWSNYTWHGDQNPSQPFWSGVQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPQ-SDGALFMGAMKIIIDENMH----D -------VDFLKQFTDAPILIRTDTLQYLDPRDVVPD---YK---------FPDFSKS--- ---------------YSGRIQALKPQDVERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYMNSGI------D---------------------AALNGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTTH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGVTHYFHMT-PNGRAAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGAWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTITVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSEMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGVPITAQH---HDDKTIRNIKLSWHEIVRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTPKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002483475_03556|DLHZ01000062unannotatedprotein -----------------------------------------------MFLSRRQFLKVSVG -TVAAAA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDTWIRKVSP -EQAQGGRYWSNYTWHGDQNPSQPFWSGVQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGALFLGAMKIIVDENMH----D -------VDFLKQFTDAPILVRTDTLQYLDPRDVVAD---YK---------FPDFSKS--- ---------------YSGRIQALKPQDIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYMNSGI------D---------------------AALNGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTTH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGVTHYFHMT-PNGRAAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGCWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNL -ECLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTITVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSEMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIVRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_001458695_00808|LN885086unannotatedprotein -----------------------------------------------MFLSRRQFLKVSVG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -APELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDTWIRKVGP -DQAQGGRYWSNYTWHGDQNPAHPWWSGVQGSDVDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPQ-SDGALFLGAMKIIVDENMH----D -------VDFLKSFTDAPILVRTDTLQYLDPRDVIPD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQIQRL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYVNSGI------D---------------------AALTGTY----- -------------------------------------RVKLL-NGREIDAMPIWQM----- ----YMVHFQD-YDLDTVH-----------------------------QITRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGAWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIHTRS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVTNVN-VVNNAKHHYD----------------MVKNVD--PNI -ECLITQDIEMTSDINHADIAFACNSWMEFTYPEMTITVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRPEAEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIKLSWDEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPFVATPKSVKGHETRP -DGRAIAID-TGYQSNFRYGCQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_900078535_00262|FJVM02000053unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------IADNVLA--LTALQP--VIE-VGNPLGEYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIGTRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRSGMPVLGIIGKMGNTRMNGGINALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPFWSGVQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGSLFLGAMKIIVDENMH----D -------SDFMKQFTDAPILVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQTLKPEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYTNSGI------D---------------------AALTGSY----- -------------------------------------RVKLL-NGREIDAMPIWQM----- ----YMVHFQD-YDLDTVH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKQ -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VLNNAKHHYD----------------MVRNVD--PNI -ECLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYVR---PDDYGIPITAQH---HDDKTIRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMSKHAPYVATPKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQLDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002451055_00821|DKBD01000269unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRRYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGIIGKMGNTRMNGGINALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPFWSGVQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGALFLGAMKIMVDENMH----D -------IDFMKSFTDAPILVRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKGEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYANSGI------D---------------------AALTGSY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTVH-----------------------------QITRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-ANARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGLS--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVVNVN-VVNNAKHHYD----------------MVRNVD--PNI -ECLITQDIEMTSDINHADIAFACNSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYAN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYVR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQIHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMAKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAVAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002331335_02310|DCZO01000011unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWVCS-PNDTHACRVRAFVRNGVIMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRSGMPVLGIIGKMGNTRMNGGINALLDTWIRKVGP -DQAQGGRYWSNYTWHGDQNPAHPWWSGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGSLFLGAMKIIVDENMH----D -------IDFMKSFSDAPILIRTDTLQYLDPRDVIAD---YK---------FPDFSKS--- ---------------YSGRIQSLKAEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYANSGI------D---------------------AALNGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YMVHFQD-YDLDTVH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INSRGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGAWT-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNITLDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVTNVN-VLNNAKHHYD----------------MVRNVD--PNL -ECLITQDVEMTSDVNHNDIAFACNTWVEFTYPEMTITVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--RDYFAM-------------------------VYSN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPAYPYHVTMTKHAPYVATAKSVKGHETRP -DGRAIAID-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->WP_053378142|Nitrospira_moscoviensis -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKQ----------WMD----------DG -SPELT-PETKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMIIVATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGILGKMGNTRMNGGINALLDTWIRKVSP -DQAQGGRYWSNYTWHGDQNPAHPWWSGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGSLFLGAMKIIVDENMH----D -------IDFLKSFTDAPILVRTDTLQYLDPRDVVAD---YK---------FPDFSKS--- ---------------YSGRIQSLKPEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYVNSGI------D---------------------AALTGTY----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTVH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNITTDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKLRWVTNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGTAAKLSEMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYLN--- --------------------------------RVDVYAQRMLDASSTFYGYSADTML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPSYPYHVTMAKHAPYVSTAKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->riogrande_2019_sw_WHONDRS-S19S_0066_A_bin.62_Ga0451725_0007910_5 rank: A; nmv:NITMOv2_4538 putative Nitrite oxidoreductase, alpha subunit; K00370 (db=kegg) -----------------------------------------------MFLSRRQFLKISAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKA----------WMD----------DG -SPELT-PDTKRKYKFDSRFLDDMLRVSWDTAFTYAAKAYIIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGILGKMGNTRMNGGINALLDTWIRKVNP -EQAQGGRYWSNYTWHGDQNPAHPWWSGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGALFIGAMKIIVDENMH----D -------IDFLKSFTDAPILVRTDT------------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->GCA_002083555_01644|MSXN01000007unannotatedprotein -----------------------------------------------MFLSRRQFLKVSAG -TVAAVA--------VADKVLA--LTALQP--VIE-VGNPLGDYPDR------SW-ERVYH -DQYRY------DSSFTWCCS-PNDTHACRIRAFVRNGVVMRVEQNYDHQTYEDLYGNRGT -FAHNPRMCLKGFTFHRRVYGPYRLKGPLMRKGWKA----------WMD----------DG -SPELT-PDTKRKYKFDSRFLDDMLRVSWDTAFTYAAKAMVIIATRYSGEAGARRL-REQG -YAPEMIEMM------KGAGTRCFKHRAGMPVLGILGKMGNTRMNGGINALLDTWIRKVSP -EQAQGGRYWSNYTWHGDQNPAHPWWSGAQGSDIDLSDMRFSKLNTSWGKNFVENKMPEAH -WKLECIERGARVVVITPEYNPTAYRADYWMPLRPE-SDGALFLGAMKIIVDENMH----D -------IDFLKSFTDAPILVRTDTLQYLDPRDVVKD---YA---------FPDFSKS--- ---------------YSGRMQSLKPEQIERL---------GGMMVWDLNKKQ--AVPLH-- --------REQVGWHYTNSGI------D---------------------AALNGTF----- -------------------------------------RVKLL-NGREIDAMPVWQM----- ----YLVHFQD-YDLDTTH-----------------------------QICRTPKDLIVRW -ARDS-----------GTIKPAAIHNGEGTCHYFHQT-INARGAAMVLIITGNVGKFGT-G ---QHTWAGNYKAGTWT-ATPWSGAGLA--------------------------------- -------------------------------VHTGE-----DPFNITTDPNAHGKEIKTKS -YYY------GEEVGYW-----NH---------------GDTALIVNTP-----KYGRKVF -TGKTHMPTP---SKFRWVTNVN-VLNNAKHHYD----------------MVRNVD--PNI -ETLITQDIEMTSDVNHNDIAFACNSWMEFTYPEMTVTVSN-PWVQI----W-KGGIRPLY -DTRNDLDTFAGVAAKLSDMT---------------------------------------- ----------------GDKRM--KDYFAM-------------------------VYTN--- --------------------------------RVDVYAQRMLDASSTFYGYSADVML-KSE ------KG----WMVMVRT----Y-PRHPFW----EETNESK--PMWTRS----------- --------------------GRYENYRIEPEAIEYGENFISHREGPEATPYL--PNAIFT- -TNPYCR---PDDYGIPITAQH---HDDKTVRNIKLSWHEIKRHSNPLWEKGYQFYCVTPK -TRHRVHSQWSVNDWVQIYESNFGDPYRMDKRTPGVGEHQLHINPQAAKDRGINDGDYVYV -DGNPVDRPYRGWKPSDPYYKVARLMIRAKYNPSYPYHVTMAKHAPYVATPKSVKGHETRP -DGRAIAVD-TGYQSNFRYGAQQSFT---RNWLMPMHQTDSLPGKHAIAWKFKWGYQVDHH -AIN-TVPKECLIRITKAE-DGGIGARGPW---EPVRTGFTPGQ--ENEFMIKWLKGEHIK -IKV- ->GCA_002328125_01442|DCWK01000050unannotatedprotein -----------------------------------------------MKLSRRKFLAASGS -GLLA----------WSGRGLA--LAALHP--TGE-MGNPLTNYPNR------GW-EKVYR -DQYKV------DGSFTWVCS-PNCTHECRLKAFTRNGIVLRTEQNYDKHRITDIYGVKAT -HHWNPRGCPNGFTFQRRMYGPYRLRYPMVRRGWKR----------WAD----------DG -FPELN-EANKKKYKFDSRGTDTFVRVKWDDAFTYASKGFIQISKTYSGDAGKKRL-LDQG -YDPASLTHW------DGAGTRTMKFRGGMGLLGVIGKYGMYRFAN-TMSLLDTHTRGVGP -KKARGGRAWSNYTWHGDQAPGHPFVHGLQASDCDFNDLRNSKLHIHMGKNLVENKRPDSH -FFMESMERGAKIIVVAPEYSPPATKADYWIPIRPQ-TDTALLLGVTKILIDRGWY----D -------AKFVKEFTDFPLLVRTDNLRRLRPQDVIPG---YK---------NQDISGG--- ---------------PSFKIHGLTPKYRDAA---------GDFMIWDKGKNA--PAPIT-- --------RDDVGKHIGAKNL------D---------------------PALEGKY----- -------------------------------------TVKLV-SGVEIEVMPVFEM----- ----YKSHHLKDYDLDTVH-----------------------------EITHSPKDLIERF -AKDV-----------ATIKPAALHVGEGVNHWFHAT-MTNRAQYLPMTLTGNIGKLGA-G ---CHTWAGNYKAALFQ-GSGWSGPGFK--------------------------------- -------------------------------GWIAE-----DPFNPNLDPKADGKNIKVRG -TIK------DEEPAYW-----NY---------------GDKPLVVDTP-----KYGRKVF -TGKTHMPSP---TKSLWFTNVN-IFNNAKWLYE----------------MVKNVN--PKI -EMIICSEIEMTSTAEYSDILLPANTWMEFEQPEITGSCSN-PFLQI----W-KGGVKPIY -DTKDDILIMAEMAKKLGEIL---------------------------------------- ----------------KDKRF--EKYWKF-------------------------ALDK--- --------------------------------KAEVYIQRLLDSSTPTRGYKYDDIM-AGK ------YGESGTALMLFRS----Y-PRVPFL----EQIEESV--PFYSPT----------- --------------------GRLQAYNDEPGVIEYGENLIVQREGPEGTPYL--PNVIIS- -SSPFIR---PEDYGIPENHMG---WDERQVRNIKLPWKEAKDTKNPLWEAGYRFFCLTPK -SRHLTHSSWQVTDWNFIWSTSFGDPYRMDRRQPGVGENQVQMNPETAKDLGFNEGDYVYV -DANPADRPYIGWKPSDPFYKVARLMLRVKYNPSYPYDVVMIKHGAWCATEKSVKGHETRK -DGRAVSAD-TGYQASYRYGSHQSIT---RGWLMPMHQLDSLFHKKKVFMGFMLGGEADNH -AIN-TVPKETLVKLTKAE-DGGLGGRGVW---APATTGFSVGN--ENKFMQSYLQGT-VK -VKRG ->GCA_002685755_01556|NYYB01000002unannotatedprotein -----------------------------------------------MKLSRRKFLAASGS -GLLA----------WSGRGLA--LAALHP--TGE-MGNPLTNYPNR------GW-EKVYR -DQYKV------DGSFTWVCS-PNCTHECRLKAFTRNGIVLRTEQNYDKHRITDIYGVKAT -HHWNPRGCPNGFTFQRRMYGPYRLRYPMVRRGWKR----------WAD----------DG -FPELN-EANKKKYKFDSRGTDIFVRVKWDDAFTYASKGFIQISKTYSGDAGKKRL-LDQG -YDPASLTHW------DGAGTRTMKFRGGMGLLGVIGKYGMYRFAN-TMSLLDTHTRGVGP -KKARGGRAWSNYTWHGDQAPGHPFVHGLQASDCDFNDLRNSKLHIHMGKNLVENKRPDSH -FFMESMERGAKIIVVAPEYSPPATKADYWIPIRPQ-TDTALLLGVTKILIDRGWY----D -------AKFVKEFTDFPLLVRTDNLRRLRPQDVIPG---YK---------NQDISGG--- ---------------PSFKIHGLTPKYRDAA---------GDFMIWDKGKNA--PAPIT-- --------RDDVGKHIGAKNI------D---------------------PALEGKY----- -------------------------------------TVKLV-SGVEIEVMPVFEM----- ----YKSHHLKDYDLDTVY-----------------------------EITHSPKDLIERF -AKDV-----------ATIKPAALHVGEGVNHWFHAT-MTNRAQYLPMTLTGNIGKLGA-G ---CHTWAGNYKAALFQ-GSGWSGPGFK--------------------------------- -------------------------------GWIAE-----DPFNPNLDPKADGKNIKVRG -TIK------DEEPAYW-----NY---------------GDKPLVVDTP-----KYGRKVF -TGKTHMPSP---TKSLWFTNVN-IFNNAKWLYE----------------MVKNVN--PKI -EMIICSEIEMTSTAEYSDILLPANTWMEFEQPEITGSCSN-PFLQI----W-KGGVKPIY -DTKDDILIMAEMAKKLGEIL---------------------------------------- ----------------KDKRF--EKYWKF-------------------------ALDK--- --------------------------------KAEVYIQRLLDSSTPTRGYKYDDIM-AGK ------YGESGTALMLFRS----Y-PRVPFL----EQIEESV--PFYSPT----------- --------------------GRLQAYNDEPGVIEYGENLIVQREGPEGTPYL--PNVIIS- -SSPFIR---PEDYGIPENHMG---WDERQVRNIKLPWKEAKDTKNPLWEAGYRFFCLTPK -SRHLTHSSWQVTDWNFIWSTSFGDPYRMDRRQPGVGENQVQMNPEAAKDLGFNEGDYVYV -DANPADRPYIGWKPSDPFYKVARLMLRVKYNPSYPYDVVMIKHGAWCATEKSVKGHETRK -DGRAVSAD-TGYQASYRYGSHQSIT---RGWLMPMHQLDSLFHKKKVFMGFMLGGEADNH -AIN-TVPKETLVKLTKAE-DGGLGGRGVW---APATTGFSVGN--ENKFMQSYLQGT-VK -VKRG ->WP_042250442|Nitrospina_gracilis -----------------------------------------------MRLNRRKFLQVSAG -VASAMA--------LSSKRVG---AQLKP--VVK-VGNPLESYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKIRDLYGNQAD -AAWNPRMCLRGMTFPRRVYGPYRNKYPMLRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRMTWDDTFTYLAKGHVAVGKAYSGQRGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVVGKYGIYRLAN-MVGLLDAIIRGRGP -GQVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVTVCPEYNPPSTKADYWIPCRAGASDISIFLGCAKIIMDEGLV----D -------VDYVKDYTDMPLLVRTDNLIRLHPDDYIPG---YK---------NQPLPKD--- ----------------GFTTKWMKNFNRDKM---------PDFVVWDTNTDK--PVAVT-- --------REDIGAKMRKKNI------D---------------------PALDGVY----- -------------------------------------DIKLV-SGKTITVMPLYEM----- ----YKIHLKD-YDLDSVN-----------------------------QISHAPKDLVVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------SMVAE-----DPFNPVLDISKNVDWANVKG -YLK------GEEVGYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---SKLIWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYADFVLAANSWAEFESYEITSACSN-PFHQI----WGGTGIKPVF -DTIDDNLIHREFAKRLSQVT---------------------------------------- ----------------GDKRF--ADYVK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTAGMGYNIDDII-NGK ------YGEPGACLLLYRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEWGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYVYV -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTAMMKHSCWTSTERSVKAHEERP -DGRALSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKSKMKFMFGYEADNH -AIN-ATPKETLVKFSKAE-DGGMHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQY-- ----- ->WP_042251421|Nitrospina_gracilis -----------------------------------------------MRLNRRKFLQVSAG -VASAMA--------LSSKRVG---AQLKP--VVK-VGNPLESYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTFPRRVYGPYRNKYPMLRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRVTWDETFTYLAKGHVAIGKAYSGSRGAQRL-KNEG -YQPEMIEAM------GGSGSRSMKYRGGMGLLGVVGKYGIYRLAN-MMGLLDAIIRGRGP -GQVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVTVAPEYNPPATKADYWIPTRAGLADISIFLGVAKILMDEGLV----D -------GEYVKEYTDMPLLVRTDNLIRLHPEDYIPG---YK---------NQPLPKD--- ----------------GFTTKWMKNYDRDKM---------PDFVVWDTNTDK--PVALT-- --------REDIGAKMRRKNI------D---------------------PALDGVY----- -------------------------------------DIKLV-SGKTITVMPLYEM----- ----YKIHLKD-YDLDTVN-----------------------------QICHAPKDLVVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASFVPLMLTGNVGPKGS-G ---SHTWSGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPVLDVTKNVGWENIKA -YAK------GEEPGYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLLWFVNVN-VINNAKWFYE----------------MVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAANSWAEFESYEITSACSN-PFHQI----WGGTGIKPVF -DTIDDNLIHREFAKRLSQIT---------------------------------------- ----------------GDKRF--ADYMK--------------------------VYEG--- ----------------------------EAPNRTKAQIRRLFTTSTSGMGYNIDDII-NGK ------YGEPGCCLLLYRT----Y-PRSPFW----EMYTESK--PFYTAH----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYVYV -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTSMMKHSAWQSTERSVKAHEERP -DGRALSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKSKTKMKFVHGYEADNH -AIN-ATPKETLVKFSKAE-DGGMHGKGLW---EPARTGYTPESPLKDRFAEMYLAGQY-- ----- ->MBL09191|Acidiferrobacteraceae_bacterium -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LSSKKVG---AQLKP--VVK-VGNPLESYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVKDLYGNQAD -AAWNPRMCLRGMTFPRRAYGPYRNRYPMIRVGWKQ----------WAD----------DG -FPYLD-KANREKYKMTSRGTDEFVRMSWDDTFTYLSKGHIAVGRAYSGPRGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-MVALLDSIIRGRGP -GQVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDISVFLGCAKIIMDEGLV----D -------IEYVKDYTDMPLLVRTDNLKRLHADDFIPG---YK---------AQALPKD--- ----------------GFTTKWMKNFSRDQM---------PDFAVWDANTNK--PVAVT-- --------REDIGAKMRKKNI------D---------------------PVLDGVF----- -------------------------------------DVKLT-NGKTITVMPLYEM----- ----YKIHLKD-YDLDTVN-----------------------------QISHAPKDLVVRV -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPILDPAQNTDWKNVKG -YLK------GEEVSYW-----AH---------------RDEALIVNTP-----RYGRKVF -TGRSHMPTP---TKLFWFVNVN-VINNAKWFYE----------------LVFNTD--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFARRMSEVT---------------------------------------- ----------------GDKRF--GEFMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLMLFRT----Y-PRSPFW----EMFTESK--PYYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPYMGWKPSDPRYKVGRLMLRAKYNPAYPYHTTMMKHATWIGTERTVKAHEERP -XGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKFGYEADNH -AVN-ATPXEXLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYVR -VKI- ->TDJ60388|Nitrospina_sp -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LSSKRVG---AQLKP--VVK-VGNPLDSYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVKDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRLSWDQTYTYLAKGHIAVAKAYSGARGAQRL-KNEG -YQPEMIEAM------SGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-MMALLDSIIRGRGP -GQVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVTVAPEYNPPATKADYWIPVRAGLSDISVFLGAAKIIMDEGLV----D -------VPFVKEYTDMPLLVRTDTLVRLHPDDYIPG---YK---------VQALPKD--- ----------------GFTTKWLKNFNRSKM---------PDYTVWDTNTNK--PVAIT-- --------REDIGAKMLKKKI------D---------------------PALDGVY----- -------------------------------------DIKLV-SGKTITVMPMYEM----- ----YKIHLKD-YDLDTVN-----------------------------QISHAPKDLIIRL -SRDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---AHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFHIILDPAKNVDWKNVKG -YLK------GEEISYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLMWYVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIIAQDIEFTGSCEYSDIILAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLMHREFGKRMAQIT---------------------------------------- ----------------GDKRF--ADFMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRTPFW----EMYTESK--PYYTPN----------- --------------------GRLQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEEEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPYMGWKPSDPRYKVGRLMLRAKYNPAYPYHTTMMKHATWIGTERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-ATPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYTR -VKI- ->MSP_nxrA ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------MPLYEM----- ----YKIHLKD-YDLETVN-----------------------------QISHAPKDLVVRL -ARDM-----------GTIKPVEIHYGEGINHYFHAT-MHNRASFVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPEMDPAKNTTWAQIKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPVF -DTIDDNLIHREFAKRMAEVT---------------------------------------- ----------------GDKRF--ADYVK--------------------------VYEG--- ----------------------------EAPNRTKAQIRRLFTTGTTGMGYNIDDII-NGK ------YGEPGCCLMLFRT----Y-PRSPFW----EMFTESK--PYYTPH----------- --------------------GRLQFYNDEPEAIEWGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYVYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWTGTERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKSKMKFMHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->PIQ99248|_Nitrospinae_bacterium_CG11_big_fil_rev_8_21_14_0_20_45_15 -------------------------------------------------------MQVSAG -VATAMA--------LTSKKVG---AQLKP--VVK-VGNPLEAYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTFPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRMTWDQTFTYLAKGHVAVGKAYSGARGAQRL-KNEG -YQPEMIEAM------GGSGSRVMKYRGGMGLLGVVGKYGIYRLAN-MVALLDAIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDIALFLGCAKIIMDEGLV----D -------VNFVKEYTDMPLLVRTDTLMRLHPDDFIPG---YR---------NQDLPKD--- ----------------GFTTKWMKNFNRDKM---------PDFVVWDANTDK--PVAIT-- --------REDIGSKMKKKNI------D---------------------PVLDGVF----- -------------------------------------DIKLV-SGKTIPVMPLYEM----- ----YKVHLKD-YDIDTTN-----------------------------QICHAPKDLIVRL -ARDI-----------GTIMPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPVMDIAKNTDWANVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRSHMPCP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNCWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHRQFARRLAEVT---------------------------------------- ----------------GDKRF--SDYMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRSPFW----EMYTESK--PYYTPN----------- --------------------GRIQFYNDEPEAIEWGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWASTERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKSKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->Nitromaritima_KMP11423|SCGC_AAA799_A02 -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LTGKKVG---AQLKP--VVK-VGNPLDTYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKMTSRGTDEFVRLSWDQTFTYLAKGHVAVGKAYSGARGAQRL-KNEG -YQPEMIEAM------GGSGPRTMKYRGGMGLLGVVGKYGVYRLAN-QVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKMTIQWGKNLIENKMPEAH -WYTEIMERGGTLVAIAPEYNPPATKADYWVPVRAGLSDIALFLGVNKIIMEEGLV----D -------VDYVKDYTDMPLLVRTDNLIRLHPDDFIPG---YK---------AQQLPKD--- ----------------GFTTKWMKNYNRNQM---------PDFTVWDTNTNK--PVAIN-- --------REDIGAKMRKKNI------D---------------------PALDGVY----- -------------------------------------DVKLV-NGKTITVMPLYEM----- ----HKIHYKD-YDIDTVN-----------------------------QISHAPKDLIIRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASFTPLMLTGNVGPKGS-G ---SMTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----TPFDTELDPAKNIDWNRVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHRQFSRRLAEVT---------------------------------------- ----------------GDKRF--ADHMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRTPFW----EMYTESK--PFYTPN----------- --------------------GRTQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPFMGWKPSDPRYKVGRLMLRAKYNPAYPYHTTMMKHATWTATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYVR -VKI- ->cas150m-4_02474|CAS-150m-4914Perchloratereductasesubunitalphaprecursor ---------------------------------------------------------MSAG -VATAMA--------LSSKKVG---AQLKP--VVK-VGNPLDSYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKFTSRGTDEFVRMTWDQTFTYLAKGHVAVGKAYSGVRGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVIGKYGVYRLAN-QVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDISIFLGVAKIIMDEGLV----D -------IDYVKDYTDMPLLVRTDNLIRLHPEDFIPG---YK---------VQPLPKD--- ----------------GFTTKWMKNFNRDKM---------PDFTVWDINTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVY----- -------------------------------------DIKLV-NGKTITVMPLYEM----- ----YKVHLKD-YDIDTVN-----------------------------QISHAPKDLILRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNTVLDASKNIDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHRQFSRRLAEVT---------------------------------------- ----------------GDKRF--ADHMK--------------------------VYEG--- ----------------------------EAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGACLLLFRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEFGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSSVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYVYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWTGTERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKSKMKFLHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->GCA_002705185_00880|PAJA01000060unannotatedprotein ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------------------------MTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDIALFLGVAKIIMDEGLV----D -------VDFVKDYTDMPLLVRTDTLVRLHPDDFIPG---YK---------AQALPKD--- ----------------GFTTKWMKNFNRDMM---------PDFTVWDTNTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVF----- -------------------------------------DIKLV-SGKTITAMPLYEM----- ----YKVHLKD-YDVDTTN-----------------------------QICHAPKDLIVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNTILDASKNVDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFSRRLAEVT---------------------------------------- ----------------GDKRF--ADHMK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRSPFW----EMYTESK--PYYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPXIR---PDXYGIPEDEQD---PDLRHVRNIKXPWSAVRTTXNFLWXXGXRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIXC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->MAX17737|Nitrospina_sp ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------------------------MTIQWGKNLIENKMPEAH -WYTEIMERGGTLVSIAPEYNPPATKADYWVPVRAGLSDIALFLGVAKIIMDEGLV----D -------VDFVKDYTDMPLLVRTDTLVRLHPDDFIPG---YK---------AQALPKD--- ----------------GFTTKWMKNFNRDMM---------PDFTVWDTNTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVF----- -------------------------------------DIKLV-SGKTITAMPLYEM----- ----YKVHLKD-YDVDTTN-----------------------------QICHAPKDLIVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNTILDASKNVDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLVWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFSRRLAEVT---------------------------------------- ----------------GDKRF--ADHMK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLLLFRT----Y-PRSPFW----EMYTESK--PYYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPXIR---PDXYGIPEDEQD---PDLRHVRNIKXPWSAVRTTXNFLWXXGXRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIXC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->GCA_001542995_01387|LFLA01000024unannotatedprotein -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LTSKRVG---AQLKP--VVK-VGNPLEAYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKMTSRGTDEFVRMTWDQTFTYLAKGHIAVAKAYSGARGAQRL-KNEG -YQPEMIEAM------SGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-QVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKLTIQWGKNLIENKMPEAH -WYTEIMERGGTLVAVAPEYNPPATKADYWIPVRAGLSDISLFLGVAKIIMDEGLV----D -------IDYVKDYTDMPLLVRTDTLIRLHPDDFIPG---YK---------AQSLPKD--- ----------------GFTTKWMKNFNRDMM---------PDYTVWDANTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PVLDGVF----- -------------------------------------DIKLV-SGKTITVMPLYEM----- ----YKVHLKD-YDIDTTN-----------------------------QICHAPKDLIVRL -ARDI-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNIVMDPSKNIDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLCWFVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIVLAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFSRRMAEVT---------------------------------------- ----------------GDKRF--MDHMK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGACLLLFRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINDGDYIYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-AVPKETLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYIR -VKI- ->GCA_002453875_01196|DKHT01000003unannotatedprotein -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LTSRRVG---AQLKP--VVK-VGNPLEAYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKMTSRGTDEFVRMTWDQTFTYLAKGHIAVAKAYSGARGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-MVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKMTIQWGKNLIENKMPEAH -WYTEIMERGGTLVAIAPEYNPPATKADYWVPVRAGLSDIALFLGCAKIIMDEGLV----D -------IDYVKDYTDMPLLVRTDTLIRLHPDDFIPG---YK---------AQSLPKD--- ----------------GFTTKWMKNFNRDMM---------PDYTVWDTNTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVF----- -------------------------------------DIKLV-NGKTITVMPLYEM----- ----YKIHLKD-YDLDTVN-----------------------------QICHAPKDLTLRL -ARDM-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPILDITKNVDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLCWYVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIILAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFGKRMAEVT---------------------------------------- ----------------GDKRF--SDFLK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLMLYRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINEGDYVYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-ATPKEVLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYVR -VKI- ->GCA_002454045_00625|DKID01000024unannotatedprotein -----------------------------------------------MRLNRRKFLQVSAG -VATAMA--------LTSRRVG---AQLKP--VVK-VGNPLEAYPDR------RW-EEVYR -DQYKY------ERSFTYCCS-PNDTHQCRVRGFVRNGILMRIEQNYDHHKVRDLYGNQAD -AAWNPRMCLRGMTYPRRAYGPYRNKYPMIRVGWKQ----------WAD----------DG -FPYLD-KENREKYKMTSRGTDEFVRMTWDQTFTYLAKGHIAVAKAYSGARGAQRL-KNEG -YQPEMIEAM------GGSGPRTFKYRGGMGLLGVVGKYGVYRLAN-MVALLDSIIRGRGP -GKVLGGRAWSNYTWHGDQAPGHSWTHGMQTSDIDFADHRYAKMTIQWGKNLIENKMPEAH -WYTEIMERGGTLVAIAPEYNPPATKADYWVPVRAGLSDIALFLGCAKIIMDEGLV----D -------IDYVKDYTDMPLLVRTDTLIRLHPDDFIPG---YK---------AQSLPKD--- ----------------GFTTKWMKNFNRDMM---------PDYTVWDTNTDK--PVAIT-- --------REDIGAKMRKKNI------D---------------------PALDGVF----- -------------------------------------DIKLV-NGKTITVMPLYEM----- ----YKIHLKD-YDLDTVN-----------------------------QICHAPKDLTLRL -ARDM-----------GTIKPVEIHYGEGINHYFHAT-MHNRASYVPLMLTGNVGPKGS-G ---SHTWAGNYKAGNYQ-GSHWSGPGFA--------------------------------- -------------------------------AMVAE-----DPFNPILDITKNVDWKNVKG -YLK------GEEVSYW-----AH---------------RDKALIVNTP-----RYGRKVF -TGRTHMPTP---TKLCWYVNVN-VINNAKWFYE----------------LVFNTN--NNV -DMIVAQDIEFTGSCEYSDIILAPNSWAEFESYEITSACSN-PFHQI----WGGTGIKPIF -DTIDDNLIHREFGKRMAEVT---------------------------------------- ----------------GDKRF--SDFLK--------------------------VYEG--- ----------------------------KAPNRTKAMIRRLFTTSTTGMGYNIDDII-NGK ------YGEPGCCLMLYRT----Y-PRSPFW----EMYTESK--PFYTPN----------- --------------------GRIQFYNDEPEAIEYGENFIVHREGPEATPYL--PNVIVS- -TNPYIR---PDDYGIPEDEQD---PDLRHVRNIKKPWSAVRTTKNFLWEKGYRFYCVTPK -SRHTAHSSWATTDWNMIWNNNFGDPYRMDKRSPGVGEWQVHMNPFLCKDLGINEGDYVYC -DANPADRPYMGWKPSDPRYKVARLMLRAKYNPAYPYHTTMMKHATWIATERTVKAHEERP -DGRAMSMT-TPYQSNFRYGGQQSIT---RSWLMPMHQTDSLFHKAKTKMKFKHGYEADNH -AVN-ATPKEVLVKFSKAE-DGGLHGKGLW---EPVRTGYTPESPLKDRFAEMYLAGQYVR -VKI- ->GBC85351|bacterium_sp_HR11 -----------------------------------------------MKLTRREFMQTTAA -GAAALV--------LDDALRG--LRLLQP--VVE-VGNPLAAYPNR------DW-EAVYR -DQYRY------DRSFTWVCS-PNCTHECRLRAFVRNGIVLRSEQNYDLHRISDLYGNKAT -AHWNPRGCLNGYTFQRRVYGPYRLKYPMIRRGWKQ----------WAD----------DG -FPELT-PENMAKYKFDSRGTDTFVRVSWDEAYTYVARGMIAIARRYSGEEGRRRL-LEQG -YPEEMLEHW------EGSGVRTFKLRGGMGLLGVIGKYGLYRFAN-MLALLDAHVRKVPP -EEAKGARIWSNYTWHGDQAPGQPFVHGLQTSDVDMNELRFARLHIQCGKNLVENKRPESH -FFIELMERGAKIVAIIPEYGPQATKADYWIPIRPA-TDAALWLGITRVMIDNGWY----D -------VDFLKKWSDMPLLIRTDTLRRLRAHEVFPG---YR---------GGLDPKG--- ---------------PSFQVQDLKPDQYEKI---------GDFVVFDEKSQS--LKPLT-- --------RDDVGGRLTAKGI------D---------------------PALSWRG----- -------------------------------------KVRLV-DGTEVECMTLWEA----- ----YKIHLQD-YDLDTVC-----------------------------EITHAPKELVLRL -ARDIWETTQEVRRQNPDMGAVAIHIGEGLNHWFHAT-EMNRAVYLPLILTGNIGKPGA-G ---CHTWAGNYKAALFQ-GSPWTGPGFL--------------------------------- -------------------------------GWIAE-----DPFHPLLDPKADGTQVKVKK -YTH------DEEPAYW-----NY---------------DDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKLMWFTNVN-LLNNAKWVYE----------------MIKNVN--PKV -ELIIAQDIEMTSSCEYADVILPANSWMEMETYEITASCSN-PFLQI----W-KGGIRPIF -DTKDDVLIMAELAKKLGEIL---------------------------------------- ----------------KDRRF--ADYWKF---A----------------------LER--- --------------------------------KTEVYIQRLLDTCTTTKGYRVEDIL-AGK ------YGEPGAALMLFRT----Y-PRVPFW----EQVHDDL--PFFTPT----------- --------------------GRLQAYNDEPEVIEYGENFIVHREGPEATPYL--PNVIVS- -SNPLIR---PEDYGIPLDHMG---RDERQVRNVKLPWSEVKKTKNPLWEKGYRFYCLTPK -TRHATHSSWQVTDWHLLYNNDFGDPYRLDKRSPGVGEAQLHMNPQAAKDLGINNGDYVYV -DANPADRPYVGWKPGDPFYRVARLMLRVKYNPAYPYHVVMMKHAAWIATEKSVRAHETRP -DGRALSED-TGYQASFRYGSQQSVT---VGWLMPMHQLDSLFHKAKAKVGFIFGGEADNH -AVN-TTPKETLVKVTKAE-DGGLGGKGVW---EPARTGYTAGD--EDDFMKRYLNGELVE -IVGE ->WP_099324707|Kuenenia_stuttgartiensis -----------------------------------------------MKLTRRAFLQVAGA -TGATLT--------LAKNAMA--FRLLKP--AVV-VDNPLDTYPDR------RW-ESVYR -DQYQY------DRTFTYCCS-PNDTHACRIRAFVRNNVMMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKR----------WAD----------DG -FPELT-PENKTKYMFDNRGNDELLRASWDEAFTYASKGIIHITKKYSGPEGAQKL-IDQG -YPKEMVDRM------QGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-CLAIVDAHNRGVGP -DQALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLLIQTGKNLIENKMPEAH -WVTEVMERGGKIVVITPEYSPSAQKADYWIPIRNN-TDTALFLGITKILIDNKWY----D -------ADYVKKFTDFPLLIRTDTLKRVSPKDIIPN---YK---------LQDISDG--- ---------------PSYHIQGLKDEQREII---------GDFVVWDAKSKG--PKAIT-- --------RDDVGETLVKKGI------D---------------------PVLEGSF----- -------------------------------------KLKTI-DGKEIEVMTLLEM----- ----YKIHLRD-YDIDSVV-----------------------------SMTNSPKDLIERL -AKDI-----------ATIKPVAIHYGEGVNHYFHAT-LMNRSYYLPVMLTGNVGYFGS-G ---SHTWAGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFKPNLDPYASAKDLNIKG -RAL------DEEVAYW-----NH---------------SERPLIVNTP-----KYGRKVF -TGKTHMPSP---TKVLWFTNVN-LINNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEITGSIEYADFAFPANSWVEFQEFEITNSCSN-PFIQI----WGKTGITPVY -ESKDDVKILAGMASKLGELL---------------------------------------- ----------------RDKRF--EDNWKF-------------------------AIEG--- --------------------------------RASVYINRLLDGSTTMKGYTCEDIL-NGK ------YGEPGVAMLLFRT----Y-PRHPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNAIVS- -TNPYIR---PDDYGIPENAEY---WEDRTVRNIKKSWEETKKTKNFLWEKGYHFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHIHPQAARDLGIEDGDYVYV -DANPADRPYEGWKPNDSFYKVSRLMLRAKYNPAYPYNCTMMKHSAWISSDKTVQAHETRP -DGRALSPS--GYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFIFGFEADNH -CIN-TVPKETLVKITKAE-NGGMGGKGVW---DPVKTGYTAGN--ENDFMKKFLNGELIK -VDA- ->NxrA_Candidatus_K_stuttgartiensis_CAJ72445 -----------------------------------------------MKLTRRAFLQVAGA -TGATLT--------LAKNAMA--FRLLKP--AVV-VDNPLDTYPDR------RW-ESVYR -DQYQY------DRTFTYCCS-PNDTHACRIRAFVRNNVMMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKR----------WAD----------DG -FPELT-PENKTKYMFDNRGNDELLRASWDEAFTYASKGIIHITKKYSGPEGAQKL-IDQG -YPKEMVDRM------QGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-CLAIVDAHNRGVGP -DQALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLLIQTGKNLIENKMPEAH -WVTEVMERGGKIVVITPEYSPSAQKADYWIPIRNN-TDTALFLGITKILIDNKWY----D -------ADYVKKFTDFPLLIRTDTLKRVSPKDIIPN---YK---------LQDISDG--- ---------------PSYHIQGLKDEQREII---------GDFVVWDAKSKG--PKAIT-- --------RDDVGETLVKKGI------D---------------------PVLEGSF----- -------------------------------------KLKTI-DGKEIEVMTLLEM----- ----YKIHLRD-YDIDSVV-----------------------------SMTNSPKDLIERL -AKDI-----------ATIKPVAIHYGEGVNHYFHAT-LMNRSYYLPVMLTGNVGYFGS-G ---SHTWAGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFKPNLDPYASAKDLNIKG -RAL------DEEVAYW-----NH---------------SERPLIVNTP-----KYGRKVF -TGKTHMPSP---TKVLWFTNVN-LINNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEITGSIEYADFAFPANSWVEFQEFEITNSCSN-PFIQI----WGKTGITPVY -ESKDDVKILAGMASKLGELL---------------------------------------- ----------------RDKRF--EDNWKF-------------------------AIEG--- --------------------------------RASVYINRLLDGSTTMKGYTCEDIL-NGK ------YGEPGVAMLLFRT----Y-PRHPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNAIVS- -TNPYIR---PDDYGIPENAEY---WEDRTVRNIKKSWEETKKTKNFLWEKGYHFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHIHPQAARDLGIEDGDYVYV -DANPADRPYEGWKPNDSFYKVSRLMLRAKYNPAYPYNCTMMKHSAWISSDKTVQAHETRP -DGRALS-P-SGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFIFGFEADNH -CIN-TVPKETLVKITKAE-NGGMGGKGVW---DPVKTGYTAGN--ENDFMKKFLNGELIK -VDA- ->OHB72803|Planctomycetes_bacterium_RBG_16_41_13 -----------------------------------------------MKLTRRAFLQVAGA -TGATLT--------LAKNAMA--FRLLKP--AVV-VDNPLDTYPDR------RW-ESVYR -DQYQY------DRTFTYCCS-PNDTHACRIRAFVRNNVMMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKR----------WAD----------DG -FPELT-PENKAKYMFDNRGNDELLRASWDEAFTYASKGILHITKKYSGPEGAQKL-IDQG -YPKEMVDRM------QGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-CLAIVDAHNRGVDP -DQALGGRNWTNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKIVVITPEYSPSSQKADYWIPIRNN-TDTALFLGITKILIDNKWY----D -------ADYVKKFTDFPLLVRTDTLKRVSPKDIIPN---YK---------LQDISEG--- ---------------PSYQIHGLKDEQREII---------GDFVVWDAKSKG--PKAIT-- --------RDDVGETLVKKGI------D---------------------PALEGSF----- -------------------------------------KLKTV-DGKEIEVMTLLEM----- ----YKIHLRD-YDIDSVV-----------------------------DMTNSPKDLIERL -AKDI-----------ATIKPVAIHYGEGVNHYFHAT-LMNRSYYLPVMLTGNVGYFGS-G ---SHTWAGNYKAANFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFKPNLDPYASAKDLNIKG -RAL------DEEVAYW-----NH---------------SERPLIVNTP-----KYGRKVF -TGKTHMPTP---TKIMWFTNVN-LINNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEITGSIEYADFAFPANSWVEFQEFEITTSCSN-PFIQI----WGKTGITPVY -ESKDDVKILAGMASKLGELL---------------------------------------- ----------------RDKRF--EDNWKF-------------------------AIEG--- --------------------------------RASVYINRLLDGSTTMKGYTCEDIL-NGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEVIEYGENFIVHREGPEATPYL--PNAIVS- -TNPYIR---PDDYGIPENAEH---WDDRTVRNIKKSWEETKKTKNFLWEKGYHFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHIHPQAARDLGIEDGDYVYV -DANPADRPYEGWKPNDAFYKVSRLMLRAKYNPAYPYNCTMMKHSAWISSDKTVQAHETRP -DGRALS-P-SGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -CIN-TVPKETLVKITKAE-NGGMGGKGVW---DPVKTGYTAGN--ENDFMKKFLNGELVK -VDA- ->WP_070066136|Brocadia_sapporoensis -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------IVNKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ERVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGSKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLLDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQGSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDVFSD---YK---------LEDISHG--- ---------------ASYKIQGLHDDQREII---------GDFVVWDAKTNG--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGIF----- -------------------------------------KVKTV-DGKEIEVMSLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIQRL -AHDI-----------AAIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYNGS-G ---SHTWAGNYKAANFQ-SAKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPSAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----RYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITNSCSN-PFVQI----W-KGGIRPVN -DSKDDVVIIAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIV-SGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTIRNIKKSWAETKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQVNINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYDVAMIKHSSWIATERTVKAHETRS -DGRALAAG-TGYQSSFRYGSQQSVT---RDWSMPMHQLDSLFHKSKIGMKFVFGFEGDNH -GIN-TVPKETLVKITKAE-DGGLGGKGLW---DPAKTGYTTGN--ENDFMKKYLSGELIK -IEKA ->RZV59451|Brocadia_sp_BROELEC01 -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------IANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ERVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLLDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQGSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDVFPD---YK---------LEDISHG--- ---------------ASYKIQGLHDDQREII---------GDFVVWDAKTNG--PKTIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGIF----- -------------------------------------KVKTV-DGKEIEVMSLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIQRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYSGS-G ---SHTWAGNYKAANFQ-SAKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPSAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----RYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEITGSIEYADFAFPANSWMEFETHEITNSCSN-PFVQI----W-KGGIRPVN -DSKDDVVIIAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIV-SGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQVNINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYDVAMIKHSSWIATERTVKAHETRS -DGRALAAG-TGYQSSFRYGSQQSVT---RDWSMPMHQLDSLFHKSKIGMKFVFGFEGDNH -GIN-TVPKETLVKITKAE-DGGLGGKGLW---DPAKTGYTTGN--ENDFMKKYLSGELIK -IEKA ->OHB44699|Planctomycetes_bacterium_GWE2_41_14 -----------------------------------------------MKLTRRTFLQIAGA -TGATFT--------IANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -DQYRY------DRTFTFVCS-PNDTHGCRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGALGIIGKYGMYRFNN-MLSLVDSHHRGVGA -DKALGGRNWSNYTWHGDQAPGHSFSHGLQASDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSSQKADYWIPIKCN-TDTALFLGVTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQPKDIFPD---YK---------LEDISHG--- ---------------ASYKIQGLHDDQREIV---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLVAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEVEVMPLFEM----- ----YKIHLRD-YDIDTVV-----------------------------EITNSPKELIQRL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LMNRSTYLPLMLTGNVGYNGS-G ---SHTWAGNYKAGNFQ-SAKWCGPGFY--------------------------------- -------------------------------GYVAE-----DAFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LINNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEVTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMVLAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYINRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGVPENAEH---WDERTIRNIKKSWSDTKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYGVTMIKHSSWIATERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKITKAE-DGGIGGKGVW---DPVKTGYTTGN--ENDFMKKYLNGELIK -VEKA ->WP_052562588|Brocadia_sinica -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------LANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGILHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKLHGLHDDQREII---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGTF----- -------------------------------------KVKTV-DGKEVEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIIRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYMGS-G ---SHTWAGNYKAGNFQ-SAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPDAPAMDLKIKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSNDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRAKYNSSYPYGVTMIKHSSWIATERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTTGN--ENDFMTKYLNGELIK -VEKA ->OOP57237|Brocadia_caroliniensis -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------VANKAMA--FRLLKP--AVE-VGNPLDAYPDR------TW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGSKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGLGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKIHGLHDDQREIL---------GDFVVWDAKTNG--PQPIT-- --------RDDVGDKLTAKGI------D---------------------PVLDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDVDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYMGS-G ---SHTWAGNYKAGNFQ-SAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFYQI----W-KGGIRPVN -DSKDDVMVIAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYINRLLDGSTTAKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGVPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYDVTMIKHSSWIATEKSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKVTKAE-DGGIGGKGLW---DPAKTGYTTGN--ENDFMKKYLNGELIK -VEKS ->RIK02127|Brocadia_sp -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------VANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDENLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDITHG--- ---------------PSYKLHGLHDDQREII---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLTAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDVDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYKGS-G ---SHTWAGNYKAGNFQ-AAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPSLDPTAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKVMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMVLAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYEVTMIKHSSWISTEKTVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKVCKAE-DGGIGGKGLW---DPAKTGYTTGN--ENDFMKKYLGGELIK -VEKA ->KKO18748|Brocadia_fulgida -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------VANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDENLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDITHG--- ---------------PSYKLHGLHDDQREII---------GDFVVWDAKTKG--PKPIT-- --------RDDVGDKLTAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDVDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYKGS-G ---SHTWAGNYKAGNFQ-AAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPTAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKVMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMVLAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYEVTMIKHSSWISTEKTVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKVCKAE-DGGIGGKGLW---DPAKTGYTTGN--ENDFMKKYLGGELIK -VEKA ->OQZ00558|Brocadia_sp_UTAMX2 -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------VANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTFTCS-PNDTHACRVRAFVRNEVVMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-MLSLVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTQVMERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGLTKILMDENLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDITHG--- ---------------PSYKLHGLHDDQREII---------GDFVVWDAKTKG--PKPIT-- --------RDDVGDKLTAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDVDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHYFHAT-LMNRSTYLPLMLTGNVGYKGS-G ---SHTWAGNYKAGNFQ-AAKWCGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPTAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKVMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWMEFETHEITSSCSN-PFFQI----W-KGGIRPVN -DSKDDVMVLAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTSKGYTFDDIV-AGK ------YGEPGVALLNYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAETKQTKNFLWEKGYKFFCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVSRLMLRAKYNSSYPYEVTMIKHSSWISTEKTVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSLT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKVCKAE-DGGVGGKGLW---DPAKTGYTTGN--ENDFMKKYLGGELIK -VEKA ->TLD40744|Candidatus_Jettenia_ecosi ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------MLRCKYNPAYPYGVTMMKHSAWISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RNWSMPMHQLDSLFHKSKTSMKFIFGYEADNH -GIN-TTPKETLVKITKAE-DGGLGGKGLW---DPAKTGYTAGN--ENDFMKKYLSGELIK -VEKA ->TLD41279|Candidatus_Jettenia_ecosi ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------------------------MKHSACISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMKKYLSGELVK -MEKA ->WP_007220240|Jettenia_caeni -----------------------------------------------MKLTRRTFLQVTGA -TGATFT--------LANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -EQYRY------DRTFTYCCS-PNDTHACRVRAFVRNEVLMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGARKL-LDQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-SLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLVIQTGKNLIENKMPEAH -WLTQVFERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITRILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKIHGLHDDQREII---------GDFVVWDAKTKS--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LMNRSTYLPLMLTGNIGYPGS-G ---SHTWAGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPDAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSNDIEMTGSIEYADFAFPANSWAEFETHEITTSCSN-PFIQI----W-KGGIKPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDMRF--HDVWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTTKGYSFVDII-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQGYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPEDAEH---WDERTVRNIKKSWAETKKTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHMNPEAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKAKIGMKFVFGFEADNH -GIN-TVPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMKKYLSGELIK -VEKA ->WP_007222969|Jettenia_caeni -----------------------------------------------MKLTRRTFLQVTGA -TGATFT--------LANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -EQYRY------DRTFTYCCS-PNDTHACRVRAFVRNEVLMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGARKL-LDQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-SLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLVIQTGKNLIENKMPEAH -WLTQVFERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITRILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKIHGLHDDQREII---------GDFVVWDAKTKS--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYPGS-G ---SHTWSGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPDAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSNDIEMTGSIEYADFAFPANSWAEFETHEITTSCSN-PFIQI----W-KGGIKPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDMRF--HDVWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTTKGYSFVDII-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQGYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPEDAEH---WDERTVRNIKKSWAETKKTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHMNPEAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RNWSMPMHQLDNLFHKSKTSMKFVFGYEADNH -GIN-TTPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMKKYLNGELIK -VEKA ->NxrA_planctomycete_KSU_1_ZP_10101005 -----------------------------------------------MKLTRRTFLQVTGA -TGATFT--------LANKAMA--FRLLKP--AVE-VGNPLDAYPDR------AW-ESVYR -EQYRY------DRTFTYCCS-PNDTHACRVRAFVRNEVLMRVEQNYDHQNYADLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGARKL-LDQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-SLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFSHGLQTSDVDMNDVRFSKLVIQTGKNLIENKMPEAH -WLTQVFERGGKLVVITPEYSPSAQKADYWIPIKCN-TDTALFLGITRILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISHG--- ---------------ASYKIHGLHDDQREII---------GDFVVWDAKTKS--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PALDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIVRL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYPGS-G ---SHTWSGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPDAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVDTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSNDIEMTGSIEYADFAFPANSWAEFETHEITTSCSN-PFIQI----W-KGGIKPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDMRF--HDVWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTTKGYSFVDII-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQGYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDDYGIPEDAEH---WDERTVRNIKKSWAETKKTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHMNPEAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RNWSMPMHQLDNLFHKSKTSMKFVFGYEADNH -GIN-TTPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMKKYLNGELIK -VEKA ->WP_052561322|Brocadia_sinica -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------LTSKAMA--FRLLKP--AVE-VGNPLDVYPDR------AW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITRKYSGEEGAKKL-IGQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-TLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRADTLKRLQAKDIFPD---YK---------PEDISHG--- ---------------PSYKIHGLHDDQREMI---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGTF----- -------------------------------------EVKTV-GGKVIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPRELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNVGYKGS-G ---SHTWSGNYKAGNFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVSE-----DVFNPNLDPYAPATDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDLRF--RDYWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTLKGYTFEDIV-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNVIAS- -TNPYIR---PDDYGIPEGAEH---WDERTVRNIKKSWGEVKLTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHESRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TTPKETLVKITKAE-DGGMGGKGLW---EPAKTGYTPGN--ENDFMRRYLNGELIK -IEKE ->KXK29028|Brocadia_sinica -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------LTSKAMA--FRLLKP--AVE-VGNPLDVYPDR------AW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWIYAAKGIIHITRKYSGEEGAKKL-IGQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-TLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------PEDISHG--- ---------------PSYKIHGLHDDQREMI---------GDFVVWDAKTNG--PKPIT-- --------RDDVGDKLVAKGI------D---------------------PVLDGTF----- -------------------------------------EVKTV-GGKVIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPRELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNVGYKGS-G ---SHTWSGNYKAGNFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVSE-----DVFNPNLDPYAPATDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DSKDDVMILAGMAAKLGELL---------------------------------------- ----------------RDLRF--RDYWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTLKGYTFEDIV-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNVIAS- -TNPYIR---PDDYGIPEGAEH---WDERTVRNIKKSWGEVKLTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPNDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHESRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TTPKETLVKITKAE-DGGMGGKGLW---EPAKTGYTPGN--ENDFMRRYLNGELIK -IEKE ->OOP55454|Brocadia_caroliniensis -----------------------------------------------MKLTRRTFLQVAGA -TGATFS--------LADKTMA--FRLLKP--AVE-VGNPLDAYPDR------TW-ESVYR -DQYRY------DRSFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGFTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-TLALVDSHNRGLGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGLTRILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDIFPD---YK---------LEDISQG--- ---------------PSFKMHGLHDDQRETI---------GDFVVWDAKTNG--PSPIT-- --------RDDVGDKLTAKGI------D---------------------PVLDGTF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPRELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYKGS-G ---SHTWSGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPYAPATDLKVRG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKVMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEVTGSIEYADFAFPANSWAEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DSRDDVMILAGMAAKLGDLL---------------------------------------- ----------------RDMRF--RDYWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTLKGYTFDAIV-NGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATPYL--PNVIAS- -TNPYIR---PDDYGIPESAEH---WDERTVRNIKKSWAEVKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQIHINPQAAMDMGINDGDYVYV -DANPADRPYEGWKPSDPFYKVARLMLRCKYNPAYPYGVTMMKHSAWISTERSVKAHESRP -DGRALSAD-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFIFGYEADNH -GIN-TTPKETLVKITKAE-DGGIGGKGLW---DPAKTGYTAGN--ENDFMRRYLSGELIK -IEKA ->KKO18624|Brocadia_fulgida -----------------------------------------------MKLTRRTFLQVAGA -TGATFT--------LADKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVLMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRRGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDEAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRTFKGRGGMGLLGVIGKYGMYRFNN-TLALVDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSAQKADYWIPVRCN-TDTALFLGLTKILMDEKLY----D -------ADYVKKFTDFPLLVRTDTLKRLQAKDVFLN---YQ---------LEDISQG--- ---------------ASFKIHGLHDDQREII---------GDFVVWDTKTNS--PKPIT-- --------RDDVGDKLVGKGI------D---------------------PALDGTF----- -------------------------------------MVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDSVV-----------------------------EMTNSPKELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNVGYKGS-G ---SHTWSGNYKAGNFQ-ASKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEVTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DTKDDVMILAGMATKLGELL---------------------------------------- ----------------RDMRF--RDYWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIV-NGK ------YGEPGVALLLYRT----Y-PRQPFW----EQVHESL--PFYTPT----------- --------------------GRMQAYNDESEIIEYGENFIVHREGPEATQYL--PNVIVS- -TNPYIR---PDNYGIPESAEH---WDERTVRNIKKSWSDTKQTRNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRAKYNPSYPYGVTMMKHSAWISTERSVKAHESRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFIFGYEADNH -GIN-TTPKETLVKITKAE-DGGMGGKGVW---DPAKTGYTAGN--ENDFMKRYLNGELIK -IEKA ->WP_070067449|Brocadia_sapporoensis ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------------RGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGITKILMDEKLY----D -------ADYVKKFTDFPMLVRTDTLKRLQAKDIFPN---YQ---------LEDISQG--- ---------------VSYKIHGLHDDQREII---------GDFVVWDTKTNG--PKAIT-- --------RDDVGDKLVAKDI------D---------------------PALDGIF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYKGS-G ---SHTWSGNYKAANFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLRNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DTKDDVAILAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIM-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDEPEIIEYGENFIVHREGPEATPYL--PNVIVS- -TNPHIR---PDDYGIPENAEH---WDERTVRNIKKSWSDTKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQVNINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRAKYNSSYPYGVTMMKHSAWISTEKSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TVPKETLVKITKAE-DGGMGGKGLW---DPAKTGYTTGN--ENDFMKKYLNGELIK -IEKA ->RZV56287|Brocadia_sp_BROELEC01 -----------------------------------------------MKLTRRTFLQVTGA -AGATFT--------IANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKTKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRAFKGRGGMGLLGVIGKYGMYRFNN-MLSLLDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLIENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGITRILMDEKLY----D -------ADYVKKFTDFPMLVRTDTLKRLQAKDIFPN---YQ---------LEDISQG--- ---------------VSYKIHGLHDDQREII---------GDFVVWDTKTKG--PKAIT-- --------RDDVGDKLVAKGI------D---------------------PALDGIF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYKGS-G ---SHTWSGNYKAANFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DTKDDVAILAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIM-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATPYL--PNVIVS- -TNPHIR---PDDYGIPESAEH---WDERTIRNIKKSWSDTKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQVNINPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRAKYNSSYPYGVTMMKHSAWISTEKSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TVPKETLVKITKAE-DGGMGGKGLW---DPAKTGYTTGN--ENDFMKKYLNGELIK -IEKA ->OQZ04816|Brocadia_sp_UTAMX1 -----------------------------------------------MKLTRRTFLQVTGA -AGATFT--------IANKAMA--FRLLKP--AVE-VGNPLDAYPDR------SW-ESVYR -DQYRY------DRTFTYTCS-PNDTHACRVRAFVRNEVIMRVEQNYDHQNYSDLYGNKAT -RNWNPRMCLKGYTFHRRVYGPYRLRYPLIRKGWKQ----------WAD----------DG -FPELT-PENKSKYMFDARGQDELLKASWDDAWTYAAKGIIHITKKYSGEEGAKKL-IEQG -YPKEMVDAM------KGAGTRAFKGRGGMGLLGVIGKYGMYRFNN-MLSLLDSHNRGVGP -DKALGGRNWSNYTWHGDQAPGHPFVHGLQTSDVDMNDIRFSKLVIQTGKNLVENKMPEAH -WLTEVMERGGKLVVITPEYSPSSQKADYWIPIRCN-TDTALFLGITKILMDEKLY----D -------ADYVKKFTDFPMLVRTDTLKRLQAKDIFPN---YQ---------LEDISQG--- ---------------VSYKIHGLHDDQREII---------GDFVVWDTKTKG--PKAIT-- --------RDDVGDKLVVKGI------D---------------------PALDGIF----- -------------------------------------KVKTV-DGKEIEVMPLFEM----- ----YKIHLKD-YDIDTVV-----------------------------EITNSPKELIERL -AHDI-----------ATIKPVAIHYGEGINHWFHAT-LFNRSTYLPLMLTGNIGYKGS-G ---SHTWSGNYKAANFQ-GSKWSGPGFY--------------------------------- -------------------------------GWVAE-----DVFNPNLDPNAPAMDLKVKG -RAY------DEEVAYW-----NH---------------NDRPLIVNTP-----KYGRKCF -TGKTHMPTP---TKIMWFTNVN-LVNNAKHVYQ----------------MLKNVN--PNI -EQIMSTDIEMTGSIEYADFAFPANSWVEFETHEITSSCSN-PFVQI----W-KGGIRPVN -DTKDDVAILAGMAAKLGELL---------------------------------------- ----------------RDMRF--RDFWKF-------------------------ALEG--- --------------------------------RPEVYIQRLLDGSTTFKGYTFDDIM-NGK ------YGEPGVALLLYRT----Y-PRHPFW----EQVHESI--PFYTPT----------- --------------------GRLQAYNDESEIIEYGENFIVHREGPEATPYL--PNVIVS- -TNPHIR---PDDYGIPENAEH---WDERTVRNIKKSWSDTKQTKNFLWEKGYKFYCVTPK -SRHTVHSQWAVTDWNFIWNNNFGDPYRMDKRMPGVGEHQININPQAAKDLGINDGDYVYV -DANPADRPYEGWKPSDPFYKVSRLMLRVKYNSSYPYGVTMMKHSAWISTEKSVKAHETRP -DGRALSAG-TGYQSSFRYGSQQSIT---RDWSMPMHQLDSLFHKSKTSMKFVFGYEADNH -GIN-TVPKETLVKITKAE-DGGMGGKGLW---DPAKTGYTTGN--ENDFMKKYLNGELIK -IEKA ->KRT68888|NC10_bacterium_CSP1_5 -----------------------------------------------MEITRRTFLKAAAT -GATAF---------LADDAWA--LRLLQP--AVE-VGNPLSEYPDR------GW-ERIYR -DQYGY------DRTFTFVCS-PNDTHACRLRAYVRNGVVMRIEQNYDVSRYADLYGNKAT -PHWNPRGCLKGYTLHRRVYGPYRVKYPLVRKGWKR----------WAD----------DG -FPDLT-PANKTKYRFDSRGTDELMRISWDDAYSYIAKGMIQIARRYSGEEGVRRL-REQG -YPEEMIRET------HGAGTRTFKCRGGMGLLGVIGKYGMYRFAN-TLALLDVHVRGVGP -DQALGGRTWSNYTWHGDQAPGHPYSHGLQGSDVDLNDFRFSKLHIQCGKNLIENKMPESH -FFNELMERGAKIVVITPEYSPPAAKADYWIPIRPN-TDTALFLGLTKILMEERHY----D -------AAFVKRFTDFPLLVRTDTLKRLRAHEVFPG---YR----------GRLPEN--- --------------GPSFTIQGLTKEQYEKL---------GDFVVFDAKSQS--LKPLT-- --------REDVGDRLAQQGT------D---------------------PTLDWQG----- -------------------------------------KVKLA-DGTEVEAMTLWAM----- ----YTIHLKD-YDLDTVH-----------------------------EITHSPKELIQRL -ARDI-----------ATIKPVAIHIGEGINHWFHAT-LSNRAFYLPLMLTGNIGVPGA-G ---SHTWAGNYKAALFQ-GSSWSGPGFK--------------------------------- -------------------------------GWVAE-----DPFNPNLDPNAPGQAVKVKG -YTK------DEEPAYW-----NH---------------GDLPLIVNTP-----KYGRKVF -TGLTHMPTP---TKVMFFNNVN-LINNAKHVYE----------------MLKNVN--PRV -EMIISVDIEMTASIEYADFALPANSWMEFQTPEITASCSN-PFLQI----W-KGGIKPLY -DSKDDVTILAELAQKLGAIV---------------------------------------- ----------------NDHRF--AAYWRF-------------------------ALEG--- --------------------------------RPEVYIQKLLDTSSTTAGYRVDEIM-AGK ------YGEPGACLMLFRT----Y-PRVPFW----EQVHDSD--PFYTDT----------- --------------------GRLHAYCDIPEAIEYGENFIVQREGPEATPYL--PNVIVS- -TNPYIR---PEDYGISPDAMH---WDERTVRNIKMAWADAKRTTNPLWEKGYRFFFLTPK -TRHRVHSQWSVCDWNQIWDSNFGDPYRMDKRMPGVGDHQLHMNPQAAKDLGINDGDYVYL -DANPADRPYIGWKPSDPFYRVSRCMVRVRYNPAYPYQVVMMKHAPYIATERTVKAHETRP -DGLALSE--TGYQANLRYGSQQSLT---RNWHMPMHQTDTLFHKAKATMSFLFGGEADNH -ALN-TVPKETLVKVTKAE-DGGMRGKGIW---EPARTGFTPGN--ESDFMKRYLAGEIVQ -IKKR ->OGW90704|PVC_group_Omnitrophica_bacterium_RIFCSPHIGHO2_02_FULL_63_14 ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------MIWDSNFGDPYRMDKRTPWVGENQLHINPQAGKALGINDGDYVYV -DANPADRPYIGAKPEDPFYKVARLMLRAKYNSAYPYHIVMMKHAPNIATERSVKAHETRP -DKRALS-E-LGYQSNFRYGSQQSIT---RNWHMPMHQTDSLFHKAKVFMGFLFGGEADNH -AVN-TVPKETLVRVTKAE-DGGLGGKGVW---APATTGYTPGA--ESEAMRKYIDGGFVS -T--- ->OGW87506|PVC_group_Omnitrophica_bacterium_RIFCSPLOWO2_01_FULL_45_10b -----------------------------------------------MNESRRDFLKISAV -TAVTLA--------LSNKPFL--LWALEP--VAN-VENPLAYYPNR------DW-EKIYR -DQYRY------DRTFSWVCS-PNDTHACRALAYVRNGIIIRSGSEYNYETYGDLYGNKAT -QNWNPRQCAKGFTFHRLMYGPYRLKYPLVRRGWRE----------WAD----------AG -FPDLT-PENKTKYKFDSRGTDQLEKATWDEAYTYIANGIMSIAKRYSGVEGKRKL-LAEG -YPEEMLAPM------KGAGTRTMKFRGGMGLLGVFGKYGMYRLAN-TMALLDVNIRGVSE -EGAMGGRAWSNYTWHGDQAPGHPWVHGLQNADCDFNDLRFSKLIIQDGKNLVENKLTDSH -WFIECMERGAKLVTISPEYSPPASKSDYWIPIRPQ-TDAALFLGITRLMIDQGWY----D -------KEFVAQFTDFPLLVRTDNLKRLRAADIFPD---YK---------LGLSKNG--- ---------------PSFKYQGLKQEQYEKL---------GDFVVWDETKGA--PVAIT-- --------RDDVGKNLSKKGI------N---------------------PALEGSY----- -------------------------------------KVKTV-DGKEIEVTTLFSL----- ----YKIHLRD-YDLDSVV-----------------------------EITKAPKDLIEQL -AKDI-----------AAIKPVAIHQGEGINHWFHAT-EMNRAAYLPLMLTGNIGQKGA-G ---AFGWAGNYKAALFQ-GSAWTGPGFK--------------------------------- -------------------------------GWVAE-----DPFHPNLDPQTPGKAINAHA -YFR------DEEPAYW-----NH---------------GDRALIVDTP-----AEGKKVF -TGSTHMPTP---TKAMLFTNVN-LINNAKHTYD----------------MLKNVN--PNV -EMILSIDIQMTASIEYADIALPANTWMESEGLEVTASCSN-PFLQI----W-KGGIPPIF -DSKDDLVILSEIAAKLGDLT---------------------------------------- ----------------GDARF--RDYWKF-------------------------ALEG--- --------------------------------KREVYIQRLLDSSTTTTGYKLDDIM-KGK ------YGPPGGALMLFRT----Y-PRIPFW----EQVHEDQ--PFYTDH----------- --------------------GRLQAYTDVPEAIEYGENFIVHREGPEATPYL--PNVIVS- -SNPYIR---PKDYGIPLDAEH---WDERTIRNVKLPWSEVKNTKNFLWEKGFQFFCLTPK -SRHRVHSLWSNVDWHQIWDSNFGDPYRMDKRTPGVGEQQIHLNPQAAKDLGINDGDYVYV -DANPADRPYRGAKPGDPFYKVARLMLRAKYNSAYPYHVAMMKHGTYIATEKSVKAHETRA -DKRALSEG-GAYQANFRYGSQQSVT---RNWHMPMHQTDTLFHKAKVFMSFIFGGEADNH -AVN-TVPKETLVRISKAE-DGGLGGKGLW---EPVKTGYTPAH--ENDVMKQYLHGGFIK -T--- ->KRT77589|Armatimonadetes_bacterium_CSP1_3 ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------MDFNELRHARLHIQVGKNLIENKMPESH -FFNELMERGAKIAVITPEYSPPAAKADYWMPIRPQ-TDAALFLGITRLMMDRRWY----D -------EAFVKQFTDFPLLIRKDTLKRLRAAEVFPG---YK----------PGLDPD--- --------------GPSFKRHNLKLDQYEKL---------GDFVVFDRKTRK--LQAIT-- --------RDQVGERLAQAGL------D---------------------PDLRWRG----- -------------------------------------KVKLI-DGREVECLTLWEA----- ----HRDHLRD-YDLDTVA-----------------------------EITQTPRAMIERL -ARDI-----------ATIKPVSIHIGEGINHWFHAT-LANRAFYLPLMLTGNIGKPGA-G ---CHTWAGNYKAGIFQ-GSPWTGPGIT--------------------------------- -------------------------------GWLFE-----DPFHAALDPATSGTEIKVKK -YLK------DEEPAYW-----DH---------------GDVPLIVNTP-----KAGRRVF -TGTTHMPTP---TKVMWYNNVN-IINNAKWAYG----------------VIKHVN--PNV -ELIINQDIEMTASAEYADIILPANSWVEFETPELTASCSN-PFLQI----W-KGGIKPLF -DTKDDGVIIAEVAAQLTAQT---------------------------------------- ----------------GDRRF--RDYFKY-------------------------LLER--- --------------------------------RPEVYIQRILDSSTSTVGYRVADVV-NGK ------YGEPGAALMLFRT----Y-PRIPFY----EQVHDSE--PFYTDT----------- --------------------GRLNSYCDIPEAIEYGENFIVHREGPEATPYL--PNVIVT- -TNPLVR---PEDYGIPLDALH---WDQRTVRNVKLAWRDVKKTKNPLWEQGYRFYLLTPK -TRHRVHSSWSTVDWNMIWDSNFGDPYRLDKRAPGVGEHQLHIHPQAARDLGINDGDYVYV -DAYAADRPYIGWKPSDPFYRVARCMVRVRFNPAYPYSVLMMKHAPFMATEKSVRAHETRP -DKLARSAD-TGYQANLRYGSQQSVT---RDWLMPMHQTDTLFHKSKGTMAFIFGGEADNH -AVN-TVPKETLVKITKAE-DGGIGGKGLW---EPARTGFSPGR--EGDFMKRYLAGTLVK -VTKR ->OUC07869|Chloroflexi_Litorilinea_aerophila ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------EITASCSN-PFLQI----W-KGGIPPLY -NTRDDARILAEVSAALADEI---------------------------------------- ----------------GEPRL--RDYWRF-------------------------ILEG--- --------------------------------RPEIYIQRLLDSSLTTSGYRVEDII-AGK ------YGEPGAALMLFRT----Y-PRIPFW----EQIHDSV--PFYTDT----------- --------------------GRLNSYCDIPEAIEYGENIISHREGPEATPYL--PNVIVT- -RSRFVR---PEDYGIPADHMG---WEERTVRNIALPWNQVKETKNPLWAQGFHFYCLTPK -TRHRVHSSWSTVDWTIILDSNFGDPYRADKRLPGPGDHQLHMNPQAAKDLGIEDGDYVYV -DANPADRPYIGWKPDDPFYKVARLMLRVKYNPAYPYHIVMLKHGPFMATEKSVKAHETRP -DGLAKSEG-TGYMANLRYGSQQSVT---RDWSMPMHQTDTLFHKQKTGMQFIFGGEADNH -ALN-TVPKETLVRIVKAE-DGGLDGKGPW---EPTKTGYTPAH--ENEFMLRYLAGETIE -VTT- ->RCK74665|Chloroflexi_Anaerolineae_bacterium ----------------------------------------------MSHLSRREFLKLSSV -AALGTV--------INDLD----WKLLDP---IQ-VDNPLAAYPSR------DW-EAVYR -NQYRY------DSSFTFVCS-PNDTHACRLRAFVRNGIILRAEQNYDVERYSDLFGNTAT -AHWHPRGCKKGQTFHRRLYGPHRLKGPLMRKGWKE----------WAD----------AG -FPELD-EENKTKYKFNARGQDELLPVSWETAYDYIARGMIAIARRYSGEEGARLL-RKQG -YPEEMIQAM------SGAGTRTFKCRGGMGLLGVIGKYGMYRFAN-MLALLDVHVRNVPP -EEAKGGRTWSNYTWHGDQAPGIPFVTGLQASDEDLNDLRNSRLHIQCGKNLVENKMAESH -FFIEAMERGAKIVTITPEYSPPATKSDYWIPIRPA-TDTALFLGLARWIIENQKY----D -------EQFVKRFTDFPTLVRADTLKRLRADEVFSN---YQ---------PGLDPQG--- ---------------ASFTLQGLKPEQYEKL---------GDYVVINEKTGR--PQAIT-- --------RDQVGEVMDKAGI------Q---------------------PLLDWKG----- -------------------------------------KLRLV-DGSEVEVLTVWSM----- ----YLEHLKD-YDLETVL-----------------------------EITHVPKDLFLRL -AEDI-----------TTLSPVALHIGEGINHWFHAT-LANRAQFLPLMLTGNIGKPGA-G ---LYTWAGNYKAALFQ-GSAQSGPGFK--------------------------------- -------------------------------GWVGE-----DPFAPNLDENASGKEIKVHA -YTK------DEEPAYW-----NH---------------SERPLIVDTP-----KYGRKVF -TGQTHMPTP---TKVQFFTNVN-LLNNAKHHYE----------------MIKNVN--PNV -ELIISVDIEMTSTVEYADFALAANTWAEFETYEITASCSN-PFLQI----W-KGGIPPLY -DSRDDARILGELAARLGELL---------------------------------------- ----------------EDNRF--RDYWKF-------------------------ILEG--- --------------------------------RPEVYIQRLLDSSITTSGYRFTDII-EGK ------YGEPGAALMLFRT----Y-PRIPFW----EQIHDSI--PFYTDT----------- --------------------GRMNTYCDIPEAIEYGENLISHRESPEATPYL--PNVIVT- -SSRFVR---PEDYGIPPDATG---WEERTVRNLKMPWSEVKNTRNFLWEAGYHFYCLTPK -TRHRVHSSWSTVDWTLILDSNFSDPYRVDRRQPGVGEHQLHINPQAAKDLGLEDGDYVYV -DANPADRPYIGWKAEDPFYRVARLMLRVKYNPAYPYHIVMLKHGPFMATEKSVLAHETRP -DGLARSAD-TGYQANLRYGSQQSIT---RDWSMPMHQTDSLFHKQKTAMQFIFGGEADNH -ALN-TVPKETLVRIVKAE-DGGIEGKGIW---EPAKSGYTPAH--ENEFMSLYLQGKTIE -IKR- ->GCA_001803565_00046|MHDQ01000004unannotatedprotein --------------------------------------------MSFDRVSRRQFLETLAA -TATAAL--------VSKPAIGLALEKLQP--IPE-IKNPLEHYPPR------EW-EKIYR -DIYNP------DSSYIFACT-PNDTHNCYLRAYIKNGIVTRIGPSQRYRDATDIYETKAS -ARWDPRICNKGVAMVGRFYGDRRVKYPTVRKGFKE----------WVE----------KG -FPRD--ENGQPPLKYFKRGEDQWEKVSWDEAYTIVAQSMIDTVKTYSGTKGAELL-QKQG -YDAKMIEKM------MGAGTQAMKFRGGMPLLGVIKLFGLYRMAN-SMALLDSYIRGVGP -DKAIGGIGFDNYSWHTDLPPGHPMVTGQQTIDFDLVNAEYANIILCWGMNWICTKMPDGH -WLSEARLKGAKVVTITTDYNSTSSKADEIVIIRPG-TDPAFALGLAQVIINERLY----D -------EEFVEGFTDLPFLVRMDTRELLRAHEIISG---YN---------NAELKYT--- -RVIKKEEKPPPPFATNLGMPAVSSDMRQEW---------GDFVVWDSNAKK--ATPVS-- --------RDDTGERFTNKGV------K---------------------PALEGEF----- -------------------------------------EISLT-NGEKIKVRPIFDI----- ----IKQHLEDTWNVDSTS-----------------------------KITWAPKEAIINL -AREI----------AANKEKVLFTVGMGPNQLFNAD-QKDRAIFLVAALTRNVGFFGG-N ---VGSYAGNYRAALFN--------GMP--------------------------------- -------------------------------QYIAE-----DPFNIILDPTKPA---KVKP -YFK------MQSAHFY-----AH---------------GDTPLKVHDI----------YF -NGETHMPTP---TKFFWFAASNSILGNSKGMYD----------------VVMNLLRNRKI -EAVVVNEWWWSASCEYADVVLPADSWGEYNVHDMTASVTN-PFVMV----MPLTGVSRIW -DTKSDSETYAGVSEKLGELT---------------------------------------- ----------------GDSRF--KDYWRF-------------------------IADG--- --------------------------------KAKPYLQRIIDHSNTMKGYQIDNLISKAK ------DGIP--ALLMSRT----Y-PKFIGY----DQSVESA--PWYNKT----------- --------------------GRLEFYREEPEFLDYGENLPVHREPVDATFYE--PNVIVAK -GHPLIKPKTPTDYGWPMDDLS---GETRQVRNVVYTPDELLNTKHPLRKEGFTHIYLTPK -FRHAVHTFGVDLDLLSIWFGPFGDMYRRDKRKPWVNEGYVEINPDDARELGIEDGDYIWV -DPDPKDRPFKGWQDKPADYKVARCLLRARYHPNLPKGITRTWFNMYQATHGSVRGHESRK -DGLARNPD-TNYQSMYRYGGHQSST---RSWLRPTLLTDTLVRKNLMGQMIGKGFEPDVH -CAN-GAPRESFVKFTRAE-DGGESGKGKW---RPAVLGFRTGY--ENVAMKKYIKGGFIS -KGGK ->SPS06998|Nitrotoga_fabula ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRLGFKA----------WCD----------AG -YPRTG-ANGFPDPKFLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGVKTMKFRSGMAALGVLRIYTLKRFAQ-GLALLDAYVRNVGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMAYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGAHIVDISIDYHATANKADDVIILRPG-TDPALGLGVCHYLIKHNYY----D -------EDYLRANTDMPLLVRTDNWKNLKASDIIPN---YE---------LAELTHH--L -KVMKPGEKPTQPVAFQ-ATAFVAEDVRKFW---------GDNVVWDLNTNK--AVPLT-- --------RDECGARYAAKGV------K---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTPENTS-----------------------------IMTGVPVEAIVDL -SNLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLAALTDNVGHVGGCS ---YGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QFLME-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPMRRVQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADFFKF-----------------VGTNPAGNPSDR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENITVYRTPIDSSHYE--PNVIVGH -CRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRIYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ENKQMRTYLQGAFTR -R--- ->SPS06751|Nitrotoga_fabula ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRLGFKA----------WCD----------AG -YPRTG-ANGFPDPKFLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGVKTMKFRSGMAALGVLRIYTLKRFAQ-GLALLDAYVRNVGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMAYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGAHIVDISIDYHATANKADDVIILRPG-TDPALGLGVCHYLIKHNYY----D -------EDYLRANTDMPLLVRTDNWKNLKASDIIPN---YE---------LAELTHH--L -KVMKPGEKPTQPVAFQ-ATAFVAEDVRKFW---------GDNVVWDLNTNK--AVPLT-- --------RDECGARYAAKGV------K---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTPENTS-----------------------------IMTGVPVEAIVDL -SNLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLAALTDNVGHVGGCS ---YGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QFLME-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPMRRVQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADFFKF-----------------VGTNPAGNPSDR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENITVYRTPIDSSHYE--PNVIVGH -CRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRIYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ENKQMRTYLQGAFTR -R--- ->RFC37636|Nitrotoga_sp_CP45 ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAD----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSMKRFAQ-GLALLDAYVRNIGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATSNKADDVIILRPG-TDPALGLGVCHLLIKNNHY----D -------ENYLRANTDLPLLIRTDNWKNLKASDIIAD---YK---------LADLTHH--L -KVMKPGEHPTMPPAFQ-ATAFVAEDVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTAENTS-----------------------------IMTGVPVEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATNHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GSPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLKGGFIS -R--- ->RFC33776|Nitrotoga_sp_LAW ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAD----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSMKRFAQ-GLALLDAYVRNVGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATSNKADDVIILRPG-TDPALGLGVCHLLIKNNHY----D -------ENYLRANTDLPLLIRTDNWKNLKASDIIAD---YK---------LADLTHH--L -KVMKPGEHPTMPPAFQ-ATAFVAEDVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTAENTS-----------------------------IMTGVPVEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NF---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATNHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLKGGFIS -R--- ->RFC30723|Nitrotoga_sp_MKT ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAD----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSMKRFAQ-GLALLDAYVRNVGP -DEASGAKVLDSYSWHTDLAPGCPMVSGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATSNKADDVIILRPG-TDPALGLGVCHLLIKNNHY----D -------ENYLRANTDLPLLIRTDNWKNLKASDIIAD---YK---------LADLTHH--L -KVMKPGEHPTMPPAFQ-STAFVAEDVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVVPVFQL----- ----QKEYLEE-FTPENTS-----------------------------IMTGVPVEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NF---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTAMT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--SIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATNHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLKGGFIS -R--- ->RFC31618|Nitrotoga_sp_SPKER --------------------------------------------------------KLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAE----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSLKRFAQ-GLALLDAYVRNIGA -DEASGAKVLDSYSWHTDLAPGCPMVTGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATSNKADDVIILRPG-TDPALGLGVCHLLIKNNHY----D -------ENYLRANTDMPLLIRTDNWKNLKASDIIPD---YK---------LAELTHH--L -KVMKPGEGPTMPPAFQ-STAFVSEEVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGEY----- -------------------------------------EVTLV-DGKKIKVTPVFQL----- ----QKEYLEE-YTAENTS-----------------------------IMTGVPSEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KMAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTALT---------------------------------------- ----------------GDQRF--ADFFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGIP--TIFMSRT----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGH -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GSPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLQGGFIS -R--- ->BBJ23760|Nitrotoga_sp_AM1 ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAE----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSLKRFSQ-GLALLDAYVRNIGP -DEASGAKVLDSYSWHTDLAPGCPMVTGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATANKADDVIIIRPG-TDPALGLGVCHLLIKNNQY----D -------ENYLRANTDMPLLIRTDNWKNLKASDIFPD---YK---------LAELTHH--L -KVMKPGENPTQPVAFQ-STAFVSEEVRKFW---------GDNVVWDRKTNK--AVPLT-- --------RDECGARYAAKGV------D---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVTTVFQL----- ----HKEYLEE-YTAENTS-----------------------------IMTGAPMEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTALT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGVP--TIFMART----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GSPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLQGGFIS -R--- ->BBJ23368|Nitrotoga_sp_AM1 ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRTGFKA----------WAE----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYSGDKGAALL-TRQG -YDPEMIASM------HGCGCKTMKFRAGMAALGVLRIYSLKRFSQ-GLALLDAYVRNIGP -DEASGAKVLDSYSWHTDLAPGCPMVTGHQMLDYEFMVYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATANKADDVIIIRPG-TDPALGLGVCHLLIKNNQY----D -------ENYLRANTDMPLLIRTDNWKNLKASDIFPD---YK---------LAELTHH--L -KVMKPGENPTQPVAFQ-STAFVSEEVRKFW---------GDNVVWDRKTNK--AVPLT-- --------RDECGARYAAKGV------D---------------------SALTGDY----- -------------------------------------EVTLV-DGKKIKVTTVFQL----- ----HKEYLEE-YTAENTS-----------------------------IMTGAPMEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTALT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGVP--TIFMART----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GSPKESYVKIELAE-KGGVNG-GVW---HIAAKGYRPTY--ESLQMRTYLQGGFIS -R--- ->BBJ23476|Nitrotoga_sp_AM1 ------------------------------------------MMEIKNNIGRRSFLKLSAT -AGLAVM--------ANNAFAA--SPFLKP---YV-VDNPLKSYPNR------DW-EKVYR -DMFHV------DSEFIFLCA-PNDTHNCLLKAHVKNDVVIRISPSYGYGDAEDMDGNRSS -HRWEPRICNKGMVMNRKAYSDRRPKGAMVRAGFKA----------WVE----------AG -YPRTG-ANGFPDQKYLQRGKEPFIKLPWTEAYALAAGALENIARTYAGDKGAALL-TRQG -YDPEMIASM------HGCGCKVMKFRAGMAALGVLRIYSLKRFAQ-GLALLDAYVRNIGS -DEASGAKVMDSYSWHTDLAPGCPMVSGHQQLDYEFMAYEHAKLIVFWGNNFVCTKMPDLH -WVSESRLKGCHIVDISIDYHATANKADDVIIIRPG-TDPALGLGVCHLLIKNNQY----D -------ENYLRANTDMPLLIRTDNWKNLKASDIFPD---YK---------LAELTHH--L -KVMKPGEEPTQPVAFQ-ATAFVSEEVRKFW---------GDNVVWDKKTNK--AVPLT-- --------RDECGARYAAKGV------E---------------------SALTGEY----- -------------------------------------EVTLV-DGKKIKVAPVFQL----- ----QKEYLEE-FTAENTS-----------------------------IMTGAPMEAIVDL -ANLF----------HKHRGQGIISTGAGTNHYFNST-LKDRGFMLLSALSDNVGHIGGCT ---FGNYVGNYRQSVFG--------GFG--------------------------------- -------------------------------QYLLE-----DPFNPELDGRKMVT--KLAH -YTD------DESAHYY-----NY---------------GDRPL----------RNGTRLL -TDPGHMPAP---TKVLWQANSNSSLGNAKGHYD----------------MVVNTL--PRW -EAIFYSDWNWTASCEYSDIVWGVDSWLENKHTDMACSCSN-PFLTV----SPITPLRRFQ -DTVGDAEVPAGIFRAFTALT---------------------------------------- ----------------GDQRF--ADYFKF-----------------VGTNPAGNPADR--- --------------------------------DSEVYGQRVLNAGSATRGMVFAEIREKAK ------RGVP--TIFMART----Y-PRISGW----EQTAEGGGLPWYTKS----------- --------------------GRLEFYMDDPRLIDGGENLTVYRTPIDSSHYE--PNVIVGN -SRAFALMETPEMRGLERMGNSLKIAENRQGRNVILTTKELMATTHPLRPHGYEFCFNSPK -YRHGAHTTPIDTDLMTLWWGPFGDIYRHDKRQPSVGEGFVDVNPLDAKRFGIDEGDYIWV -DADPGDRPYKGWKEGTPEYALARFMVRCRYFPGMSQGSMRMYYNAYAATYGSMEGARTRA -DGLAKSPR-TNYQAMFRSGNHQSCT---RAWINPTNTTDTVANKKVFGQEIIIGMQNDVH -CAN-GAPKESYVKIELAE-KGGVNG-GVW---HVAAKGYRPTY--ESLQMRTYLQGGFIS -R--- ->blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1348658_11 rank: C; deu:DBW_2564 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------KEIGIVDNDWV-- ----------------EAYNDHGVTVTRAIVSARIPSGICILYHAPE-------------- ---RTISVPKSPMRGNKRAGGHNSPT---RVHLKPSLMVGGYGQ---------FTYSFNYW -GPT-GVNRDTFILVRKLP------GKPEF------------------------------- ----- ->CRI68048|Thiocapsa_sp_KS1 ------------------------------------------------------------- -------------------MSK--TKDDNG--NGG-SRWFRELDEPR------KW-EDFYR -RRWQY------DKSVRTSHS-VNCSGSCSWEVFVKNGMITWELQKTDWPQI-----NDET -PNYEPRGCQRGISASWYPYSPVRPKYPYVRAVLLDFWRAERAAGKDPI----------AA -WGAIVENPERSKAYRNARGKAGWRRTTWDEATEIIAAAKIYTIKEH-------------- ----------GADHLASFSPIPAMSMVSFLSGHRL-------------------------- -SNLLGGTMLSFYEWYHDLPHVMPMIWGDQTDVHESADWYQSAYWIVMGSNLPMTRTADAH -FASEHKYNGGKLVNLSPDYSDVTKFADLWVPVRPG-TDTAFILSCIHVILQEFHV----N -RRSEYFHSYVAQYTNLPFLVILD-----QEGDHFASGRFLR---------ASDVAAY--- ---------------------AD--EELADW----------KLPCFD-KEGE--LRLPGGT -LGFRWEEKNTGRWNLKNEDAVTAQPFD---------------------PLLTLMDGEFEE -VIVEYADFTHTFNVEFGTTALRGEKARKSLRGVPSRVLTKK-DGTK---VRVATA----- ----YDLLLAS-FGVNRGLSGSGYPKDYDDASEAYTPAWQE-------QETGVDRNLAIRV -AREW------ADTAEKTKGKCLFITGSGILHWYHGGSLTYRSEAVMGILTGCQGRNGG-G ---FAHYVGTEKIRNMA---AIGTIGNAADWGNVGRQQNSTSYFYFHTDQWR-YDGMSLDP -LWAPRAKEMPARANHAADMNAVAVRNGWLPFFPQF-----DERNPTDVMQDARKAGCKSL -EDVK-----TWVAQQF-----KE---------------RKLKFALPNVDAPK-NHPKVLW -IYRGNLIGT---SMRGHELNLKHMLGTHNNVLGGETRA----KDMVNEIDWTENAPLGKL -DLIYNVNLRMDSSANYSDIVLPTAHWYEKFDLTCTD--LH-SFLHP----F-TPAHDPAY -ESKHDWEAFRLIAEKISELAKVHLPDPIEDLVMTALSTDTPDEMAQPM---GELRDWWKG -ESEPIPGKTFPNVSVVTRDY--TKIHDMYTTLGPAVTKPNSYGAKGIKGDLAEVYEQMKE -SYLVGEKQGRPNMETAAKVCEVILRISPESDGELSY-----------QIFKNLEKR---- ------CGVPLAHIVEPER----E-TAYHYP-DLISQPRRALTSPHWSAIETKGRTYSPWT -LNIEALKPFHTLT------GRQEIYYDHRMFRDLGEDFPVYKPPVDMV--S--IGDVAQ- -------------------------KDIKMKGAKLFRF-------------------ITPH -QKWGIHSMFGDSWQMQNMFR---------------GGPTVWINDDDARDIGVKDNDWV-- ----------------EIFNENGIQVARAVVSHTVPRDMSIVYHQTERH-------VNVP- ---FSSLAR-ERGASDLRGGNNNATT---RIMMNPATMVGGYANWTYWLNYQGTS------ -----PSERDCVVLIRKKP-METRGRKVIY---QESQL--------NVGA----------- ----- ->NASQAN2011_330_B_bin.17_k121_430440_3 rank: A; amyy:YIM_22320 narG; Nitrate reductase alpha subunit; K00370 (db=kegg) -----------------------------------------------------MFHNASLG -HTATMGRTDDVPNGTEEALIK--FGRFFAGGEVSKDLLSVTKAGGR------EG-DVFYR -DRWSH------DKVVRSTHG-VNCTGSCSWKVYVKDGIITWETQQTDYPSVG-----PDS -PEYEPRGCPRGAAFSWYTYSPTRIRFPYIRSVLLE---------MYREAKGRL-GDSVLA -WADVVDNSENRQRYHRARGKGGLVRVSWSEVSEIIAAAHVHTIKKY----GPDRI-FGFS -PIPAMSMAS------HAAGARFISL----------------------------------- ----MGGSMLSFYDWYADLPVASPQVFGDQTDVPESADWFNASYLIMWGSNVPVTRTPDAH -FMTEARYKGQKVIAISPDYADNTKFADEWVAPHPG-TDGALGMAMGHVILKEFFV----D -KQVPRFQDYVKKFTDLPYLVSLRK----KDGSWVPDKFLVASD-------LGDVSEG--- -----SRFKTVVLDSSTGETFVPNGSLGHRY-------NDSSTGKWNLDLEGVDPLLSV-- --------YGKKGAVSAPVLM----------------------------PRFDQGQ----- -------------------------------------EVSES-GGVLARGVPVIEIAGKTV -TTVYDLMLAQ-YGVAREG--------LDGDWPEGYDDRSPYTPSWQEEITSVPAVQAIRI -AREF------AQNAIDSEGRSMILLGAGTNHWFHSD-TMYRTFLALVTLTGCQGVNGG-G ---WAHYVGQEKCRPVT---GWAQLAFGADWSRPARQMIGTAFWYVSTDQWRYDALGSDLL -------ATPLGEGRFKDMTAIDVIAQSARMGWMPS-----YPSLN-RNSLDLVDEAREKG -VDPA-----QHVINEL-----KS---------------GDLQFAIENPDAPE-NWPRVLT -VWRANILGS---SSKGNEYFLKHLLGTDNSVRA----NENEPDARPKDVKWHEDAPEGKL -DLLVSVDFRMTSTGLFGDILLPAATW--YEKHDLSSTDMH-PFVHA----F-TPAINPPW -ETKTDYEIFQMLGRQVSEQAKGHLGER-EDLVVVPLLHDTPDAMATPG---GVVLDWKKG -EVEPIPGVTMPKLVVVKRDY--SQIGEKMAALGPLIDTLGTNTKGVPVSVLPEIELL--- -------RHSNGVASTGVGAGRPSLARDVDACEAILALSGTTNGRVAVAGFRALEKR---- ------TGQKLTDLALDNE----G-KRITFA-DTQARPVPVITSPEWSGSEHGGRRYTAFA -INVERLKPWHTLT------GRQHFFIDHDWMSELGEQLPVFRPPLNMHRIF--GS----- -------------------------QGDGVAKEVTVRY-------------------LTPH -SKWSIHSEYQDNLFMLSLSR---------------GGQEIWMSVEDAEIIGVKDNEWI-- ----------------EAYNRNGVVVARACISHRMPSGTVFMYHAKD-------------- ---RVVDVP-LAETSGKRGGIHNSLT---RLVIKPTHLIGGYAQ---------LTFAFNYL -GPT-GNQRDEVTVIRRRS--------------------------QDVEY----------- ----- ->GCA_003453735_00577|DMNE01000186unannotatedprotein ------------------------------------------------------------- --------------------MG--------------WIKDIFDPKAR------LW-EEFYR -SRWQY------DKKVRSTHG-VNCTGGCSWEVYVKDGIITWEMQETDYPLLE-----PGL -PHYEPRGCQRGITFSWYIYSPLRIKYPYIRGVLLD---------LWRKAKSIH-TDTVAA -WESVVENEESRRSYQKARGKGGLRRTTWEEALEIIAASTIYTAKKY----GPDRV-IGFT -PIPAMSMLS------YASGTRFLQL----------------------------------- ----FGGVALSFYDWYADLPPASPEVWGEKTDVAESADWYNSKYIVAMGANLSMTRTPDVH -FVAEARNNGTKLVVLSPDFSQVSKYADWWLPVTAG-HDGAFWMAVDHVILKEFFV----D -RQVQYFSDYLKRYSDAPFLVEIE-----GGEGSLRAGRFLR---------ANTLSRY--R -DAENGEWKLLVFDGKAKEPRMPNGSVGFRW--------QERKGQWNLEM----------- --------KDGADDTIIQPLLSLFEDRD---------------------AAVSINF----- ---------------------TEFASGRTFKRAVPVKYLQTE-KGR----VLVATV----- ----FDLLMAQ-MGVGRGL--------EGDFAEDYNDAERPYTPAWQEQFTGVSRDTLVCF -AREW------AVTAEKTKGKCTIIVGSGVNHWYHSN-LNYRAGITALILCGCVGVNGG-G ---MNHYTGQEKVAPEA---SWKSIAFALDWIKPPRLQNTPSFHYVHSDQWRYAE------ --------PENGIKVLEYMHPMDVLVNAVRMGWLPF-----YPQFN-RNPIDLVREAEESG -AKS------EQEIIEWLVLQLKD---------------KKIRFAVEDPDAPE-NWPRVWY -IWRGNAILA---SMKGHEYVLKHYLGTSTNAVA-----DEIVSASIKEVHSKGSAPEGKL -DLVIDINFRMDTSALFSDIILPAATW--YEKDDLNTTDLH-SFIHP----L-SAAVPPCW -EAKNDWDIFKEIALKISQLAPAHFSEPFREIVATPLMHDTRQEISQPQ-----VKDWHKD -KCQAIPGKTMPKFSVVERDY--TNLFKQFISYGHKEKEEGMGERGIQWKIGDMYDEF--- --------MKGVPVEQWGGERYPSLSEARDAANVILHFAPETNGEIAYRGFKALEEI---- ------TGMPLSDLAERQR----S-VRTIFP-DLLDQPKRILTSPCWSGITNGGRAYAPYC -INVERLMPWRTLTGRQHXAGRQHFYLDHEGYISFGENLPTFKSRVLLQN----------- ----------SGDIG----------KSTAIEKSLVLNF-------------------LTPH -GKWHMHTTYYDNLLMLTLSR---------------GVEPFWLNSKDAEDIGVKDNDWV-- ----------------EVYNDNGVVVTRAVVSARTPAGVGIFYHAPERT------------ ----ISFPK-SPLRNMKRGGGTNSLT---RIRLKPVLMVGGYAQ---------FSYAFNYW -GPI-GPDRDTYAYVHKLD------GKPVF------------------------------- ----- ->sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_391728_1 rank: A; deu:DBW_2564 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ---------------MRGALLD-------------------------------LW-QEARR -QH-------------------------------------------------------PDD -PV--------------------------------------------------------AA -WASITDDPARRKRYQEARGKGGFRRVSWSEAQELIAAANLHTVKKY----GPDRL-VGFS -PIPAMSMIS------YAAGARFLQL----------------------------------- ----MGGLCLSFYDWYCDLPPASPEIWGEQTDVAESADWFHSKFIATVGSNVLMTRTPDAH -FLVEARHKGAKVVVFSPDFSQTSKVADEWIPINQG-SDTAFWMAVNHVILREFHA----E -RSVPYFQTYLRENTDAGFLVVMKA----DAQGNYRPGSLLR---------ASQLAET--Q -GEENAEWKSFVLD-TQGNLRVPVGQVGHRW--------QKSKGQWNIKQED--ARTGE-- --------AFEAALTLRDSAT----------------------------GAVKAVF----- ------------------DDFSEGRTDRVRVREVPVREVQTV-EGP----VYVTTV----- ----YDLHLAQ-HGVNRGF--------GGDWPTGYADDTHPFTPAWQEQYTGIKAETVINF -ARQW------ATTAEKSQGKCTVIIGAGVNHWYHNN-LIYRACINALIYCGCVGRNGG-G ---LNHYVGQEKLVPQA---SWGPIAFGTDWSAPPRLQNAPSFHYMHSDQWRYDRKFDEMC -------PVADKSHLMASGHTADKQALAVRSGWLPC-----YPQFTEHN-FKLVQEAEDRG -ADPV-----QHVVGRL-----KD---------------RSLKFAMEDVDNPA-CFPRVWY -IWRGNAIQA---SAKGHEYFLKHYLGTHHNSIA-----VEHAREDVKEVTWHDKLELGKM -DLIVDVNFRMDTSALYSDIVLPTASW--YEKDDLSSTDMH-SFIHP----L-QAAVPPCW -EAKSDWKIFRGIAEETSRMAQRYLPEPVKDFVCTPLMHDTPAEIAQPT-----VKDWAKG -ECEAIPGKTMPNMKVVERDY--TKIFQKYITLGRNFRNNGLGIHGTTYPVDDLYDAY--- --------LQDHPVEEVDGERYPSLRADRSVCEAILHFAAETNGELAYRAYEAESHK---- ------TGIDHTHLAAPTR----G-VRYNFA-DLCTQPRRSLTTPFWTGITNGSRTYSAYC -QNVEERIPWRTLT------GRQHLYFDHEAYVAYGEHLPTFKPRADLRTTR--DLDMTG- ----------------------------VESGALVLNY-------------------LTPH -GKWHIHSTFGDTLRMETLSR---------------GIEPFWMNEQDAGLLGIHDNDWI-- ----------------EVLNDHGTVVTRACVSARIPRGICFIYHATERT------------ ----IGNPK-SKHRGMRRAGGHNSLT---RARLKPLFMIGGYAQ---------FTYAFNYW -GPQ-GVNRDTFVVVKKLD-------KPEW------------------------------- ----- ->blackwarrior_2019_sw_WHONDRS-S19S_0021_B_bin.98_k121_1581374_9 rank: A; deu:DBW_2564 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ---------------------------------MN-WIEEISNPHAR------QW-EEFYR -NRWQH------DRVVRSTHG-VNCTGSCSWMIYVKDGIVTWELQALDYPVLN-----NGL -PPYEPRGCQRGISFSWYQYSPIRVKHPYMRGVLMD---------LWRKAKETH-QDPVEA -WTAVVEDEAARKSFHQARGKGGFRRASWDEVTEIIAASTMYTIKKY----GPDRI-IGFS -PIPAMSMLS------YAGGSRLMQL----------------------------------- ----LGAVSMSFYDWYSDLPPASPETWGEQTDVAESADWFNSKYIVSVGSNMSMTRTPDVH -FAAEARHNGTKLVVFAPDFNQVAKYADWWVPVNAG-QDGAFWMAVNHVIMNEFHY----Q -NPTPYFLDYMKRYTDSPFLVELN-----EVDGKFVPGRMVR---------AGQVERT--K -DVENGEWKFLVWDELSNAPRMPQGSLGFRW--------QQQKGQWNLEPKD--G------ --------LDGSEIRPQLTFL---GATD---------------------EQLSVSF----- ---------------------AEFGEGKSFQRNIPVRTIETA-NGK----VAVATI----- ----YDLLMAQ-YGVGRGL--------EGDYPASYDDENLSYTPAWQERYTGIDRQTVIQF -AREW------ATTAEKTEGKCMIIIGAGVNHWYHNN-LIYRACIGALMLTGCVGRNGG-G ---LNHYVGQEKLAPAA---PWASIAFALDWQKPPRQMNSPSFHYINSDQWRYERTYTEPQ ---PVSRPDSESHRDMTQEHTLDANIRAVRMGWLPS-----YPQFN-VSSLEIIRKAEQAG -AKS------DAEIRQWVVNQLKS---------------GELKFAVQDPDAPE-NWPRLWF -IWRGNALNA---SAKGQEYFFKHYLGTHHQIIS-----EEVDKSHFNEVTYRDEAPEGKF -DLVVDINFRMDTSALYSDIVLPTASW--YEKDDLNSTDMH-SFIHP----L-QMAVPPSW -ESKSDWDIFKILAEKFSELAPTHFPEPVRDLVAMPLQHDTPAEMAQAH-----IRDWAKG -ECEPIPGVTMPNFIVTERDY--VNLGKRFVSLGPKVEKEGFAIHGIHMEVGDLYREL--- --------LKSKPTVTWNGQTYPSLTVARDAANIILNLAPETNGEVAYRAFKAEEER---- ------IGLKLTDLAEPTR----A-VRTDFK-DVVRQPRRLLNSPIWTGIMTDGRPYAAYT -LNVERLVPWRTLT------GRQHFYLDHEGYLAYGEHLPTYKPRPD-------------- ----------PLAFGDLEKSHS-------EGKTIQLNY-------------------LTPH -AKWHIHSNYFDNDRMLTLSR---------------GLEPLWISEKDAKEIGIVDNDWV-- ----------------EAYNDHGVTVTRAIVSARIPSGICILYH----------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->gunnisonriver_2019_sw_WHONDRS-S19S_0062_A_bin.22_Ga0451722_0001801_3 rank: A; htq:FRZ44_42870 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------ILDKLMF--FKAGTE--RFA-DGYGAVTEESR------AW-EDGYR -QRWQY------DKVVRSTHG-VNCTGSCGWQVYVKSGFVTWETQVLDYPLTR-----PDL -PNHEPRGCARGASASWYLYSSNRIKYPLMRRQLMD---------LWREARRRH-KDPVEA -WRSIVETPELARRYKQARGRGGFVRAEWDEANELIVASNTYTIKEY----GPDRV-VGFS -PIPAMSMVS------YSAGSRYLSL----------------------------------- ----LGGVCLSFYDWYCDLPPASPQTWGEQTDVPESADWYNSNFLIVWGSNVPQTRTPDAH -YFAEVRYKGTKTVVVTPDFSEAAKFADLWLDPKQG-TDAAMAMAMGHVILKEFHA----D -NPEPYFRDYCQQYSDLPFLVRL-----VKQGEHYVPERFVR---------ASDFADG-QG -QDNNPEWKTLGFDELTDELVVPNGSIGFRW---------GEDGRWNLEQKD--A------ --------RSGVAAKLRLSLL------EAPSEAPGPKSERSTQVANVAFPYFGGRH----- -----------------HEFFESSPQDEIQVRNVPARTLALK-DGE----YLVATV----- ----FDLMLAH-YGIDRGL---------GGVAASSYDDDVPYTPAWQERITGVSRDKVIAV -ARGF------ADNAAKTRGRSMVIIGTGVNQWFNND-MTYRAVINMLILCGTVGRSGG-G ---WAHYVGQEKLRPQP---GWQTLAFALDWSRPPRLMNGTSFWYAHTDQWRYEKVQASEL -------LSPTREQGDWDVSLIDYNVRSERMGWLPS-----APQLE-KNPLRLGREIHEQK -LDAP-----TAVAHQL-----ET---------------RTLRLSCEDPDNPR-NFPRNLF -VWRSNLLGS---SSKGHEYFLKHLVGAKHGVLG--ADLKELGERLPTEVDFHDEAPEGKL -DLLVTIDFRMSSNCMYSDIVLPTATW--YEKNDLSTTDMH-PFIHP----L-TGAVDPLW -ECKSDWEIFRGFAEKFSEVCEGHLGTE-YDVVLQPLQHDAPGELGQAL----GVVDWKKG -ECRAIPGKTMPNVQLVERDY--PATYKRFVSLGPLVNSLGMSTKGLKWDATEEVELL--- ------KEKNGEVAEAGVGHGRPRIQTDLHACETILALSPETNGRVAVKAWKALEVR---- ------TGRQHAHLAEGRA----A-ERITFD-DVVAQPRKVITSPTWSGAESEKVTYSAGY -INVEEQVPWRTLT------GRQQTYQDHPWMRAFGEHFPSYKPPIDTK--T--VGTLLR- -------------------------SQENGNPQLVLNF-------------------LTPH -QKWGIHSSFTDTQMMLTLSR---------------GGPNIWVSEQDARRLGISDNDWI-- ----------------EAYNSNGALVARAVVSQRIKAGCAFMYHSQD-------------- ---KTVNAP-GTETTGTR-GIHNSIS---RIVVKPTHMIGGYAH---------QSYGFNYY -GTV-GANRDDFVVIRKVR-----------------NLDFMDGTPVRILAPAVSVGGAE-- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001351_7 rank: A; ddz:DSYM_27970 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLKF--FERVQS--TFS-GGHGIVTNEDR------KW-EDAYR -NRWRH------DKIVRSTHG-VNCTGGCSWKIFVKNGLVAFEMQQTDYPRTR-----DDL -PNHEPRGCQRGASFSWYLYSPHRIKHPLVRGRLLD----------LYRAERKSGKDPVEA -WEAIQADPAKRIQYTAVRGLGGFVRTNWDEVTEIAAAANVYTIKKW----GPDRI-YGFS -PIPAMSMLS------YAAGSRYLSL----------------------------------- ----IGGACGSFYDWYCDLPAASPQTWGEQTDVPEAADWYNSTYLIICGANLPMTRTPDAH -FATEVRYKGAKVVSMAPDYAEFVKFADLWMPVKQG-TDSAAFLAMGHVALKEFHV----K -RQDPYFQEYIRKYTDLPMLVMLR-----KTDDGYASDRTLR---------ASDFTGN-LG -ESNNPEWKTIVYDEKTKSYVAPNGSVGFRW---------GEEGKWNLLPKNAANQEEILA -ELTCIDSRDDV----ASVGF----------------------------PHFNAGE----- --------------------------PGLLYRNVPVRKLKLA-SGEDVLVSSV-------- ----YDLQVAQ-YGIDRGL-------GGGNVTDSYEDDKVAYTPAWAEKVTGVKRADLIRT -GREF------AENASKTKGKSMVIMGAAINHWYHND-LSYRAIMNLLHMCGCVGQSGG-G ---WAHYVGQEKLRPQA---GWAPIAFATDWHRPPRHMNSTTFWYFQTDQWRYEKVSADGL -------LADNAKSKYKGYQLADYNVVSQRLGWLPS-----APHFN-KNPIDIVTEAEKAG -ATD------EASIAKHMVEQLKS---------------GKLYFASEDVDAPE-NFVRNLF -VWRSNLLGC---SAKGHEYFLKHLIGAQNGVLQ-----EGVEGRACKEIKWHENGPTAKL -DLMVDINFRLNSTGAYSDIILPTATW--YEKHDLNTTDMH-PFVHP----L-SEAVSPGW -ESKSDWQIFQNIAKAFSKLAEKHLGTK-KDVVALPMQHDSPFELAQAM----GVKDWKKG -ECEPIPGKTLPLLKVVSRDY--PNTLKKFQAIGPLLNKLGNNVKGIDWNTDQELNEL--- ------KSLNGEILEDGISKGMPSIAADIAACDAVLRMAPETNGEVAHKSWSALSKK---- ------TGIDHHHLYAGRH----E-DKITFR-DIQAQPRKIITAPTWSGIESETVSYTAGY -TNIHEHIPFRTLT------GRAQFYQDHEWMLDFGEGFCAFRPGLDMKAIEATPKSVLA- ------------------------------KPHLVLNW-------------------ITPH -SKWGIHSSYQDNLRMLNLFR---------------GGPYFWIAEDDAKSIGLEDNDWV-- ----------------EAVNGNGATVARVVVSQRVPRGMALMYHAQE-------------- ---KIVNVP-GSPTTGKRGGILNSVT---RVVVKPTNMVGGYAQ---------LSYGFNYY -GTV-GTQRDEFVVVHKIE-----DKDVDW-----LERPLTPER--EGKLNPPGVGPR--- ----- ->NASQAN2011_286_B_bin.1_k121_764018_13 rank: A; sdf:ACG33_10925 nitrate reductase alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ---------------MSNLLNR--LNFLKPAAVPFSDGHGATRDDDR------GW-EDAYR -QRWQY------DKIVRSTHG-VNCTGSCSWKVYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRVKYPLMRSALLK---------LWRE--ARKTLAPVDA -WGSIVQDQTKAKSYKSKRGMGGFVRVDWDEANELIAASNLYTTKTF----GPDRV-IGFS -PIPAMSMVS------YAAGARYLSL----------------------------------- ----LGGACLSFYDWYCDLPPASPQVWGEQTDVPESADWYNSRYIIAWGSNVPQTRTPDAH -FFTEARYNGTKTVSITPDYSEVAKLTDHWLHPKQG-TDAALAFAFGHVILREFHL----D -NPSEYFTDYCRQYSDMPMLVRLDP----RDDGSYATSRYLR---------ASDLDGA-LG -EANNPEWKTLAFDENSGGLVVPHGSVGFRW---------GEKGRWNIEERD--------- --------SQGRDTRLVLSLK------D-----------AHDGFVNVCFPYFGGVE----- -----------------HEGWTSSPREDILKRHIPTRKIMQA-DGSEVLVASV-------- ----YDLLLAQ-YGLDRGF--------GGEHVAGSFDDDVPGTPAWQERITGVPRAEVIEI -AREF------ARTADKTRGRSMIIVGAAMNHWYHND-MNYRGLINMLVMCGCIGQTGG-G ---WAHYVGQEKLRPQS---GWAPLAFGTDWVKPPRQMNGTSFFYFNSDQWRYEKLDVSEI -------ISPLADPKKYSGSLVDFNLRAVRMGWLPS-----APQLN-MNPLAFVRDAEAKG -LDPV-----KHAVDQF-----KS---------------GGLDFAYADPDAPE-NFPRNMF -IWRSNLFGS---SGKGHEYMLKHLLGTRHGLQG--KDLGQRGAVKPQDVKWRDEATEGKL -DLVVTLDFRMCTTALYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWDIFKGIARTVSALAPGVLGVE-KDLVLTPVLHDTPNELAMPF----GVTDWKKG -ECEAIPGKTMPSMTVVERDY--PNLYKKFTSLGPLLDKQGNGGKGMSWDTQDEVDFL--- ------TQLNHPVLAEGISKGRPQIESAIDACEVILHLAPETNGHVAVKAWESLGTF---- ------TGRDHTHLAVGKE----H-EAIRFR-DVQAQPRKIISSPIWSGLEDEHVSYNAGY -TNVHELIPWRTLT------GRQQFYMDHEWMLAFGEGFMGYRPPVNTKTIA--P--MLG- -------------------------AKPNGNKEIVLNW-------------------ITPH -QKWGIHSTYSDNLIMQTLSR---------------GGPIVWLSEDDAKRAGIEDNDWI-- ----------------ELFNVNGAIAARAVVSQRVMSGMAMMYHAQE-------------- ---RIINTP-GAEITGTRGGIHNSVT---RVVVKPTHMIGGYAQ---------FSYGFNYY -GTT-GTNRDEFVIVRKMD-------KVEWHDGEPVPNNVEVAR----------------- ----- ->NASQAN2011_286_F_bin.29_scaffold_54_27 rank: A; sdf:ACG33_10925 nitrate reductase alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ---------------MSNLLNR--LNFLKPAAVPFSDGHGATRDDDR------GW-EDAYR -QRWQY------DKIVRSTHG-VNCTGSCSWKVYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRVKYPLMRSALLK---------LWRE--ARKTLAPVDA -WGSIVQDQTKAKSYKSKRGMGGFVRVDWDEANELIAASNLYTTKTF----GPDRV-IGFS -PIPAMSMVS------YAAGARYLSL----------------------------------- ----LGGACLSFYDWYCDLPPASPQVWGEQTDVPESADWYNSRYIIAWGSNVPQTRTPDAH -FFTEARYNGTKTVSITPDYSEVAKLTDHWLHPKQG-TDAALAFAFGHVILREFHL----D -NPSEYFTDYCRQYSDMPMLVRLDP----RDDGSYATSRYLR---------ASDLDGA-LG -EANNPEWKTLAFDENSGGLVVPHGSVGFRW---------GEKGRWNIEERD--------- --------SQGRDTRLVLSLK------D--------AHDGFVNVCF---PYFGGVE----- -----------------HEGWTSSPREDILKRHIPTRKIMQA-DGSEVLVASV-------- ----YDLLLAQ-YGLDRGF--------GGEHVAGSFDDDVPGTPAWQERITGVPRAEVIEI -AREF------ARTADKTRGRSMIIVGAAMNHWYHND-MNYRGLINMLVMCGCIGQTGG-G ---WAHYVGQEKLRPQS---GWAPLAFGTDWVKPPRQMNGTSFFYFNSDQWRYEKLDVSEI -------ISPLADPKKYSGSLVDFNLRAVRMGWLPS-----APQLN-MNPLAFVRDAEAKG -LDPV-----KHAVDQF-----KS---------------GGLDFAYADPDAPE-NFPRNMF -IWRSNLFGS---SGKGHEYMLKHLLGTRHGLQG--KDLGQRGAVKPQDVKWRDEATEGKL -DLVVTLDFRMCTTALYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWDIFKGIARTVSALAPGVLGVE-KDLVLTPVLHDTPNELAMPF----GVTDWKKG -ECEAIPGKTMPSMTVVERDY--PNLYKKFTSLGPLLDKQGNGGKGMSWDTQDEVDFL--- ------TQLNHPVLAEGISKGRPQIESAIDACEVILHLAPETNGHVAVKAWESLGTF---- ------TGRDHTHLAVGKE----H-EAIRFR-DVQAQPRKIISSPIWSGLEDEHVSYNAGY -TNVHELIPWRTLT------GRQQFYMDHEWMLAFGEGFMGYRPPVNTKTIA--P--MLG- -------------------------AKPNGNKEIVLNW-------------------ITPH -QKWGIHSTYSDNLIMQTLSR---------------GGPIVWLSEDDAKRAGIEDNDWI-- ----------------ELFNVNGAIAARAVVSQRVMSGMAMMYHAQE-------------- ---RIINTP-GAEITGTRGGIHNSVT---RVVVKPTHMIGGYAQ---------FSYGFNYY -GTT-GTNRDEFVIVRKMD-------KVEWHDGEPVPNNVEVAR----------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_201_6 rank: A; thes:FHQ07_07000 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSY--------FLDRLNF--FKPAPE--PFA-DGHGAARREDR------SW-EDSYR -RRWQY------DKIVRSTHG-VNCTGSCSWKVYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRVKYPLIRAALLK---------LWREARKS--KSPVEA -WASIVSDPVKAKSYKQKRGMGGFVRSTWDEVNEIIAASNLYTVKEF----GPDRV-VGFS -PIPAMSMVS------YAAGARYLSL----------------------------------- ----LGGGCLSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSRYIIAWGSNVPQTRTPDAH -FFTEARYNGTKTVAITPDYSEVAKLTDHWLHPKQG-TDAALAFAFGHVILREFHV----D -QPSQYFTDYCRQYSDMPMLVRLER----RADGRLVPERYLR---------AADLGGL--G -ETNNPEWKTLAIDDNSGDITVPNGSVGFRW---------GEKGKWNIEEKD--------- --------SAGRETRLRLSLK------D--------HADGVESVSF---PYFGGIE----- -----------------NEYWTESKFSDVLERNVPVKRLNLA-DGKEWVVASV-------- ----YDLLLAQ-YGVDRGL--------GGGNVASSYDDNVPGTPAWQEKITGVPRAEVIQI -AREF------ARTADKTHGRSMVIVGAAMNHWFHND-MNYRGLINMLVMCGCVGQTGG-G ---WAHYVGQEKLRPQS---GWAPIAFGTDWSKPPRQMNGTSFFYFNSSQYRYEKLGVEEI -------LSPLADKSKYSGSLADYNLRAVRMGWLPS-----LPQLN-TNPMKLVREAEAAG -VAPV-----DYAVGKL-----KD---------------GSLDFAFADPDAPE-NYPRNLF -IWRSNLLGS---SGKGHEYMLKHLLGTRHGLQG--KDLGERGAAKPEEIKWRDEAPEGKL -DLLVTLDFRMCTTALYSDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWEIFKGIARTVSQLAPGVLGIE-KDLVLVPTLHDTPNEIAMPY----GVTDWKKG -ECDLIPGKTAPSMVVVERDY--PNLYKKFTSIGPLLDTQGNGGKGMNWDTTHEIEFL--- ------GKLNHEVLEAGVSHGRPQLETAIDCAEAIMHLAPETNGHVAVKAWASLETF---- ------TGREHQHLAVGKE----H-EAIRFR-DIQAQPRKIISSPIWSGLEDENVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHEWMRDFGEGFMQYRPPVDTKTIK--P--IIG- -------------------------KKPNGNREIVLNW-------------------ITPH -QKWGIHSTYSDNLIMQTLSR---------------GGPIVWLSEDDAKSAGIEDNDWI-- ----------------ELFNVNGAIAARAVVSQRMMNGIAMMYHAQE-------------- ---RILNTP-GSEITGTRGGIHNSVT---RVVVKPTHMIGGYAQ---------LAYGFNYY -GTV-GTNRDELVVVRKMN-------KVDW---LDGEPVPATKEAAR-------------- ----- ->NarG_Escherichia_coli_NP_415742 -----------------------------------------------SK------------ ---------------FLDRFRY--FKQKGE--TFA-DGHGQLLNTNR------DW-EDGYR -QRWQH------DKIVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRLKYPMMRKRLMK---------MWREAKALH-SDPVEA -WASIIEDADKAKSFKQARGRGGFVRSSWQEVNELIAASNVYTIKNY----GPDRV-AGFS -PIPAMSMVS------YASGARYLSL----------------------------------- ----IGGTCLSFYDWYCDLPPASPQTWGEQTDVPESADWYNSSYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAVTPDYAEIAKLCDLWLAPKQG-TDAAMALAMGHVMLREFHL----D -NPSQYFTDYVRRYTDMPMLVMLE-----ERDGYYAAGRMLR---------AADLVDA-LG -QENNPEWKTVAFN-TNGEMVAPNGSIGFRW---------GEKGKWNLEQRD--GKT---- --------GEETELQLSLLGS------Q----------DEIAEVGF---PYFGGDG----- -----------------TEHFNKVELENVLLHKLPVKRLQLA-DGSTALVTTVYDL----- -------TLAN-YGLERGL--------NDVNCATSYDDVKAYTPAWAEQITGVSRSQIIRI -AREF------ADNADKTHGRSMIIVGAGLNHWYHLD-MNYRGLINMLIFCGCVGQSGG-G ---WAHYVGQEKLRPQT---GWQPLAFALDWQRPARHMNSTSYFYNHSSQWRYETVTAEEL -------LSPMADKSRYTGHLIDFNVRAERMGWLPS-----APQLG-TNPLTIAGEAEKAG -MNPV-----DYTVKSL-----KE---------------GSIRFAAEQPENGK-NHPRNLF -IWRSNLLGS---SGKGHEFMLKYLLGT-EHGIQGKDLG-QQGGVKPEEVDWQDNGLEGKL -DLVVTLDFRLSSTCLYSDIILPTATW--YEKDDMNTSDMH-PFIHP----L-SAAVDPAW -EAKSDWEIYKAIAKKFSEVCVGHLGKE-TDIVTLPIQHDSAAELAQPL----DVKDWKKG -ECDLIPGKTAPHIMVVERDY--PATYERFTSIGPLMEKIGNGGKGIAWNTQSEMDLL--- -------RKLNYTKAEGPAKGQPMLNTAIDAAEMILTLAPETNGQVAVKAWAALSEF---- ------TGRDHTHLALNKE----D-EKIRFR-DIQAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHELIPWRTLS------GRQQLYQDHQWMRDFGESLLVYRPPIDTRS----VKEVIG- -------------------------QKSNGNQEKALNF-------------------LTPH -QKWGIHSTYSDNLLMLTLGR---------------GGPVVWLSEADAKDLGIADNDWI-- ----------------EVFNSNGALTARAVVSQRVPAGMTMMYHAQE-------------- ---RIVNLP-GSEITQQRGGIHNSVT---RITPKPTHMIGGYAH---------LAYGFNYY -GTV-GSNRDEFVVVRKMK-------NIDW---LDGE---------GNDQVQESVK----- ----- ->NarG_Halomonas_maura_gb_AAT47523 ------------------------------------------------------------- ----MSH--------FIDRLNF--FRKARE--PFA-NDHGEVRDESR------GW-EDGYR -QRWQH------DKVVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRLKHPLVRKPLLK---------LWREALEEK-GDPVDA -WASIVEDPAKTKQYKRARGMGGFVRADWNELNELIAASNVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNSGYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVSVTPDYAEVSKLTDEWLSAKQG-TDAALAMAMGHVILKEFHL----D -RPSAYFTDYVRRYTDMPCLVELEA----REDGSYVPGKQLR---------ASDFEAS-LG -QDNNPEWKTVAWDETRDQLVVPRGSIGFRW---------GEEGKWNLEPRD--------- --------AEGAEIKTRLSLA------E--------AHDDVARVAF---PYFGGIA----- -------------HEHFDHVKSGGASDELLFHSLPAKRLTLA-DGREILAVTVFDL----- -------MCAN-YGIDRGF-RSQEGKEGEDDGATAYDQVKPYTPAWQEKITGVPAEQCLRI -AREF------ADNADKTHGRSMIIVGAGMNHWYHMD-MNYRGLINMLVMCGCIGQSGG-G ---WSHYVGQEKLRPQT---GWLPLAFGLDWQRPPRHMNSTSFFYNHSSQWRYXKLEIKEI -------LSPLAKPADYSGSLIDFNVRSERMGWLPS-----APQLA-TNPLSLAGKAAEAG -QSTA-----DYVVDQL-----KA---------------GGLRFAAEDPDDPQ-NFPRNMF -IWRSNLLGS---SGKGHEYLLKYLLGT-RHGIQGKDLG-EDGGQKPEEVVWHEAAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-TAATDPAW -ESRSDWDIYKGIARAFSKACVGHLGEE-TDLVTLPLQHDSPAELAQPE-----VKDWKRG -ECEPIPGKTMPALVEVKRDY--PATYERFTSVGPLLDSLGNGGKGIGWKTEKEVELL--- -------GKLNYVKTEGPAKGRPRIESAIDAAEVILTLAPETNGQVSVKAWEALSKI---- ------TGRDHRHLAEPKE----E-EKIRFR-DVVAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHELIPWRTVS------GRQQFYQDHAWMRAFGESLLVYRPPIDTKAAV--SL----- ----------ADDKG-------------NGNPEIALNW-------------------ITPH -QKWGIHSTYSDNLLMQTLSR---------------GGPIVWLSKDDARSIGVEDNDWI-- ----------------ELYNANGAIAARAVVSQRVKNGMAMMYHAQE-------------- ---RILNMP-GSEVTGTRGGIHNSVT---RVCPKPTHMIGGYAQ---------LAYSFNYY -GTV-GSNRDEFVIVRKMK-------KIDW---LDGE---------GNDYEQEAVK----- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0001905_7 rank: C; this:HZT40_10960 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLTF--FKQRKT--PFA-QGHGAVTHEKR------DW-EDGYR -QRWQH------DKIVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASFSWYIYSANRLKYPLIRKPLME---------LWRSAKARH-TDPVVA -WESIVENPLSTNDYKTKRGLGGFIRSSWEEVNELIAAANVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGTCMSFYDWYCDLPPASPMIWGEQTDVPESADWYNSSYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAITPDYAEVAKHADQWLNPKQG-TDAALALAFGHVILKEFHL----D -KPSTYFTDYVRRYTDWPNLVLLEK----RDDGSYQAGRFAR---------ASDFVEG-LG -ESNNPDWKTVAIDEATGEIIAPNGSIGYRW---------GENSKWNIQQKHG-------- --------TDQQEVTLALSLI---------------------------------------- ------------------------------------------------------------- ----------------------------------------------------KQHDQIVEL -CLPY--------------------FGGVPSDYFKGN------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------VLKDVL----- ----------------------------RYQLPARQVTLAD-------------------- ------------------------------------------------------------- ----------------GTTGL---------------------------------------- --------------------------------LVTVYDLNMAN------------------ -----------------------Y------------------------------------- --------------------GISRGLGADDSAQDFNDA---------TAPYT--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------------PAWQEAI------------------------- ------------------------------------------------------------- ----- ->king_2019_sw_WHONDRS-S19S_0016_B_bin.5_k121_1281127_1 rank: A; gpb:HDN1F_13240 narG; Nitrate reductase, alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLQF--FNKVKS--TFA-DGHGAVVNEDR------GW-ENAYR -SRWQY------DNIVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCQRGASYSWYLYSANRLKYPMMRKPLLE---------LWRE--ARKSLSPVDA -WESIVENPVKSKAYKTKRGLGGFIRVDWEEANELVAAANIYTAKKY----GPDRI-NGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGTCLSFYDWYCDLPPSSPQTWGEQTDVPESADWYNSTFLMLWGSNVPQTRTPDAH -FYTEVRYKGAKSVVITPDYSEAAKFADLWLAPKQG-TDAALAMAFGHVVLKELHL----D -NPSEYFTEYCRKTTDMPHLVMLKT-----RGNAFVADRFLR---------ASDLSDN-LQ -QSNNPEWKTLVINENTNEMVVPNGSIGFRW---------GEDGKWNIQATDS-------- --------ADGSDIKARLSLI------E-----------NADQVVSVEFPYFGNLN----- -----------------HPHFTHTEHAEILERNVPARRIQLA-DGSDAYVVTVFDL----- -------LVAN-YGIDRGL--------GGENVAKSFDDDQPYTPAWQERITGVKREHVITV -ARQF------AENAHKTHGKSMVILGAGLNHWYHMD-MNYRGIINLLMMCGCIGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWHRPPRHMNGTSFFYNHTSQWRHEKLDVREI -------LSPLADKTAWSGSLLDYNVRAERMGWLPS-----APQLN-VNPLELTKAAAAAG -QSPV-----DYAVENL-----KS---------------GKLAFACEDPDNPV-NFPRNLF -VWRSNLLGS---SGKGHEYFLKYLLGTTHGVQG--KDLGEMGAPKPEEVVWHEQGAEGKL -DLLVTLDFRMSTTCMYSDVVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -ESRSDWDIYKGIARKFSELSVGHLGVE-KDLVLVPTLHDTPSELGQAV----GVKDWKKG -ECEPIPNKTLPNMVVVERDY--PNTYKKFTALGPLLDKLGNGGKGISWNTQSEVEQL--- ------RDLNYRVTEEGVSKGLPRIESDIDACEVVLMLAPETNGQVAMKAWAALSKI---- ------TGRDHTHLALPRE----D-DKIRYR-DVQAQPRKIISSPTWSGLESEHVSYNAGY -TNVHEMIPWRTLT------GRQQFYQDHLWMLGFGESLCVYKPPIDTKTIA--P--LLN- -------------------------QRSNGNGEVVLNF-------------------ITPH -QKWGIHSTYTDNLLMLTLSR---------------GGPCVWMSETDAKKVGIEDNDWI-- ----------------EAFNLNGALVARAVVSQRVPEGMVMMYHAQE-------------- ---KIVNVP-ASEITKTRGGIHNSVT---RTCPKPTHMIGAYAQ---------QSYGFNYY -GTV-GSNRDEFVIVRKLS-------KVDW---LDTPVAQA-------------------- ----- ->NarG_Pseudomonas_fluorescens_gb_AEV63780 ------------------------------------------------------------- ----MSH--------LLDQLRF--FNRKQG--EFS-DGHGETRKESR------DW-ENVYR -SRWQY------DKIVRSTHG-VNCTGSCSWKIYVKNGLITWETQQTDYPRTR-----NDL -PNHEPRGCPRGASYSWYIYSANRLKYPKIRKPLLK---------LWRE--ARQTLPPVEA -WASIVEDKAKADSYKSKRGMGGFIRSNWEEVNEIIAAANVYTVKEH----GPDRV-VGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPASPMVWGEQTDVPESADWYNSNYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAITPDYSEVAKLTDLWLNPKQG-TDAALAQAFNHVIFKEFHL----D -KPSAYFTEYAKRYTDLPVLVMLKPMLGAAPGAGYQPDRFLR---------ASDLTDN-LG -QDNNPEWKTIALD-AAGELVSPQGSIGYRW---------GEKGKWNILPREG-------- --------GEGREIDLKLSLI-------------------GGDVAEVAFPYFAGEA----- -----------------QEYFQHVAGDAVQFRRVPVHSVVLA-DGSVAKVATVFDL----- -------SAAN-LAIDRGL-------GGANVAKDYNDASVPGTPAWQEQITGVSREKAIQI -AREF------ADNADKTRGRSMIIVGAAMNHWYHMD-MNYRGLINMLMLCGCVGQTGG-G ---WAHYVGQEKLRPQC---GWLPLAFGLDWNRPPRQMNGTSFFYGHSSQWRHEKMSMHDV -------LSPLADKSQFPEHALDYNIRAERAGWLPS-----APQLN-TNPLHICRDAAAAG -MEPK-----DYVVKSL-----QD---------------GSLRFACEQPDSPV-NFPRNMF -IWRSNLLGS---SGKGHEYMLKYLLGTKNGVMN--EDIGHSTECKPTEAEWVDEGAIGKL -DLVTTLDFRMSSTCVYSDIVLPTATW--YEKDDMNTSDMH-PFIHP----L-SAAIDPAW -ESRSDWEIYKGIAKAFSAMSVGHLGVE-KDLVTVPLMHDSVGELAQPF----GGTDWKSA -GVAPVPGKNAPNLQVVERDY--PNIYKQFTSLGPMLEKLGNGGKGINWNTDTEVKFL--- ------GELNHKEVEAGISQGRPKIDSAIDAAEVILSLAPETNGHVAVKAWAALSEF---- ------TGIDHSHLAISKE----H-EAIRFR-DIQAQPRKIISSPTWSGLEDDHVSYNAGY -TNVHESIPWRTIT------GRQQFYQDHPWMQAFGEQLMSYRPPVNTRTIA----GVKG- -------------------------KRSNGETEIVLNW-------------------ITPH -QKWGIHSTYSDNLLMLTLSR---------------GGPIVWLSEIDAKRAGIEDNDWI-- ----------------ECFNVNGALTARAVVSQRVKEGMVMMYHAQE-------------- ---RIVNVP-GSETTKTRGGHHNSVT---RVVLKPTHMIGGYAQ---------QAYGFNYY -GTV-GCNRDEFVVVRKMV-------KVDW---LDGSSGDDLPRPLPTDIEEN-------- ----- ->NarG_Pseudomonas_stutzeri_gb_AAZ43099 ------------------------------------------------------------- ----MSH--------LLDQLRF--FNRKQG--EFA-DGHGETRIESR------DW-ENVYR -SRWQY------DKIVRSTHG-VNCTGSCSWKIYVKNGLITWETQQTDYPRTR-----NDL -PNHEPRGCPRGASYSWYIYSANRLKYPKVRKPLLK---------LWREARRN--MTPVDA -WASIVEDKAKAESYKSKRGMGGFIRSSWDEVNEIIAAANVYTVKQY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPASPQIWGEQTDVPESADWYNSNYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAITPDYAEVAKLTDLWLNPKQG-TDAALAQAFAHVIFKEFHL----E -KPSEYFRDYAKRYTDLPVLVRLN-----EKDGSYIADRFLR---------ASDLADN-LG -QENNPEWKTIAVDGSTGELVSPLGSIGYRW---------GEKGKWNIEARE--G------ --------KDGRDVDLSLTQI------E---------GGETAEVAF---PYFGGIL----- -----------------HEHFQHAEGESIQLRRVPVRTITLA-DGSTTKVATVFDL----- -------MAAN-LGIDRGL-------GGGNVASSYDDASVPGTPAWQEVITGVSREKAIQI -AREF------ADNADKTHGRSMIIVGAAMNHWYHMD-MNYRGLINMLMLCGCVGQTGG-G ---WAHYVGQEKLRPQC---GWLPLAFGLDWSRPPRQMNGTSFFYNHSSQWRHEKMSIHEV -------LSPLADKSQFPEHMLDYNIRAERAGWLPS-----APQLN-RNPLQICRDAEAAG -MSPV-----DYVTQSL-----KD---------------GSLKFACEQPDNPD-NFPRNMF -VWRSNLLGS---SGKGHEYMLKYLLGTKNGVMN-EDLGKRADGFKPTEAEWQDEGAIGKL -DLVTTLDFRMSSTCVYSDIVLPTATW--YEKDDMNTSDMH-PFIHP----L-SAAIDPAW -EAKSDWEIYKGIAKAFSKMAEGQLGVE-KDLVTVPLLHDSPGELAQPF----GGTDWKTA -GVDPQPGKNCPNMAVVERDY--PATYKKFTSLGPLLDKLGNGGKGINWNTQDEVDFL--- ------GELNYKVRDEGVSQGRPQIESAIDAAEVILSLAPETNGHVAVKAWAALSEF---- ------TGRDHSHLALPKE----H-EAIRFR-DIQAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHEYIPWRTIT------GRQQFFQDHPWMQAFGEQLMSYRPPINTR------------ -TIDYVK-------GKKSNGNP----------EIVLNW-------------------ITPH -QKWGIHSTYSDNLIMLTLSR---------------GGPIVWMSEVDAKKAGIEDNDWI-- ----------------ECFNANGALTARAVVSQRVMEGMVMMYHAQE-------------- ---RIVNVP-GAESTKTRGGHHNSVT---RVVLKPTHMIGGYAQ---------QAYGFNYY -GTV-GCNRDEFVVVRKMA-------KVDW---LDGPNGNDLPQPLPQDI----------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_1186915_16 rank: A; ocm:CBP12_03810 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------ETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYIYSANRVKYPKVRKALLK---------LWRE--ARKNLKPVEA -WASIVEDPVKAQSYKSKRGLGGFVRSSWDEVQELIAAANVYTTKTY----GPDRV-VGFS -PIPAMSMIS------YASGARYLSL----------------------------------- ----MGGACLSFYDWYCDLPPSSPMVWGEQTDVPESADWYNSNYIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAITPDYSEVAKLTDLWLNPKQG-TDAALAQAFNHVIFKEFHL----E -KPSEYFTDYVRRTTDFPMLVLLD-----EHGEGYKTGRFLR---------ASDLTGQ-LG -QDNNPEWKTIALDELSGELVSPLGAIGYRW---------GEKGKWNIEAREG-------- --------SKGADTKLKLSLI------D------------EGQVAEVAFPYFGGDL----- -----------------HDHFQHVEGDNLQYRRIPVREVQLA-DGRSAKVATVFDI----- --------TAGGLAIDRGL-------GGKNVASSYDDASIPGTPAWQEQITGVTREKAIQI -AREF------ADNADKTKGRSMIIVGAAMNHWYHMD-MNYRGLINMLMMCGCVGQTGG-G ---WAHYVGQEKLRPQT---GWTPVAFGLDWHRPPRHMNGTSFFYNHSSQWRYEKMNMHDI -------LSPTANKAEFPEHALDYNIRAERAGWLPS-----APQLN-RNPLQICRDAKAAG -LSPK-----DYAVKAL-----QE---------------GSLRFSCEQPDNPV-NFPRNMF -VWRSNLLGS---SGKGHEYMLKHLLGAEKHGVI---GDETAAGFTPKDVDFSQEGARGKL -DLVTTLDFRMSSTCVYSDIVLPTATW--YEKDDMNTSDMH-PFIHP----L-SAAIDPAW -EARSDWEIFKGIAKKFSELSVGHLGVE-QDLVTIPMQHDSVGELAQPF----GGLDWKTT -GEPLVPGKNAPNMVVVERDY--PNTYKKFTSLGPLLNTQGNGGKGISWNTDDEVEFL--- ------GDLNHRVLDEGVSEGRPQMLSAIDAAECVLSLAPETNGHVAVKAWAALSEF---- ------TGRDHSHLAVGKE----H-ESIRFR-DIQAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHELIPWRTIT------GRQQFYQDHPWMQAFGEQLMSYRPPVSTRSIE----KVQG- -------------------------KMSNGNPEIALNW-------------------ITPH -QKWGIHSTYTDNLLMLTLSR---------------GGPIVWMSEVDAQKVGIEDNDWV-- ----------------ECFNANGALTARAVVSQRVKEGMIMMYHAQE-------------- ---RIVNVP-GAESTKTRGGHHNSVT---RVVLKPTHMIGGYAQ---------QAYGFNYY -GTV-GCNRDEFVVVRKMN-------KVDW--LEGSDTDDLPQPLPQNI------------ ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.104_k121_2341297_11 rank: C; pbm:CL52_03700 narZ; nitrate reductase; K00370 (db=kegg) ------------------------------------------------------------- ----MSR--------LLDQLRF--FKRKQD--EFA-DGHGETRIENR------EW-ENGYR -ARWQY------DKIVRSTHG-VNCTGSCSWKIYVKNGLITWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYIYSANRLKYPKVRKPLLK---------LWRE------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0000931_1 rank: A; reu:Reut_B5002 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLRF--LSRTKE--TFS-DGHGAVVDEDR------SW-ENAYR -GRWQH------DKIVRSTHG-VNCTGSCSWKVYVKNGLITWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYVYSAQRVKYPLVRGRLME---------MWRE--ARQTMSPTDA -WESISQDPVKAKRYKSVRGQGGFVRASWDDVSEIIAAANAFTIKEF----GPDRV-LGFS -PIPAMSMVS------YAAGARYLSL----------------------------------- ----IGGACLSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSTYLMVWGSNVPQTRTPDAH -FYTEVRYKGTKTVAVSSDFGEMVKFGDIWLAPKQG-TDAALAMAMGHVILKEWHT----S -AQSDYFTRYVKQYTDLPMLVILK----LGKSGQLVPDYFLR---------ASHLSLA--E -QANNPEWKTLLIDCASGELIAPNGSIGFRW-----GESGDKVGRWNLELKDGGSARAIDP -CLS----LIDSHDDIVEVGF----------------------------DYYGGKD----- -------------------------ADDVLLRRVPAKRVKLA-DGSEALVTTVFDL----- -------TMAN-YGVDRGL--------GGGNVAMSYDDDVPYTPAWQERHTGVKRNLVIQV -AREF------AQNAHDTQGKSMVIVGAALNHWYHND-MIYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTPLAFAGDWVRPPRHMNGTSFFYNHTSQWRHEKLALDEI ------LAPTADAGPYSKLALLDLNAKAERLGWLPS-----APQLE-TNPLDIVDAADSKN -MDPV-----KYAVEEI-----KA---------------GRLNFSCDEPENPK-NFPRNLF -VWRSNILGS---SGKGHEYFLKYLLGTQNALFG------DERDGIKPGEVKAGEAVEGKL -DLLTVLDFRMSTTCLYGDIVLPSATW--YEKDDLNTSDMH-PFIHP----L-SEAVQPLW -QSKSDWEIYKTIAKKFSEIAGPYLGTR-KDLVLTPLLHDTPGELGQPF----EPKDWKHG -ECEPIPGKTMPQMTVVERNY--GDVYKKFTSIGPLLEKSGNGGKGIGWNTEHEVKEL--- ------AALNKLVTEPGVSQGRPKLETAIDAAEMILTLAPETNGHVAVKAWDALGKI---- ------TGRDHKHLAEGRD----H-DKIRFR-DVQAQPRKIISSPTWSGLESEEVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHRWMLDFGEGLCIYKPAINTRTIE--P--MLG- -------------------------KHANGNAELVLNW-------------------ITPH -QKWGIHSTYTDNLRMLTLSR---------------GGPHVWVSEIE-------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.62_Ga0451753_0004490_1 rank: C; cuh:BJN34_33750 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------K--------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------HAN------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------------GNEELVLN-------------- ------------------------------------------------------------- ---------------------------------------------------W--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------------------------------ITPH -QKWGIHSTYTDNLRMLTLSR---------------GGPHVWVSEIEAKQAGIRDNDWV-- ----------------EVFNVNGTLTARVVVSQRVPVGMCLMYHAQE-------------- ---KIVNVP-GAETSGMRGGIHNSVT---RTVTKPTHMIGGYAQ---------LAYGFNYY -GTV-GSNRDEYVIVRKMK-------KVDW---LEGALKEEGEQA---------------- ----- ->littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_6 rank: A; aql:BXU06_02425 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- -------------------------MAACR------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------DWYCDLPPASPQIWGEQTDVAESADWYNSNYLMVWGSNIPMTRTPDAH -FYTEVRYKGTKTVAVSSDFGEMAKFGDIWLAPKQG-TDAALAMAMGHVIFKEFHL----D -RPSDYFTGYIRQYTDMPMLVMLKQ----DAAGRYLPDYFLR---------ASHLAGN-AD -QAHNPEWKTLVLDETSGNLAVPNGSAGFRW---------DQSGKWNLEEKA--G------ --------INSQPVKAQLSLI------A--------QSDEVVEVGF---PYFGAEH----- --------------------------DELITRRVPVRHIVLA-DGSTARVATVFDL----- -------MAAN-YGIDRGL--------GGGNVACSYLDDVPYTPAWQHKHTGVKPEMVIQV -AREF------AQNADQTHGRSMVIVGAALNHWYHMD-MTYRGIINMLMLCGCIGQSGG-G ---WCHYVGQEKLRPQT---GWAPLAFAGDWNRPARQMNGTSFFYAHTSQWRHEKLGVNEI -------LSPTADGKMANMALIDYNAKAERMGWLPS-----APQLT-TNPLDVTRHAAAAG -QDPI-----TYAVEQL-----KS---------------GQLDMACNDPDNPK-NFPRNLF -VWRSNILGS---SGKGHEYFLKYLLGTQNAVMN-----SEEGCVKPSEITVRPAA-EGKL -DLLVVLDFRMSTTCLYGDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-SEAVQPLW -QAKSDWEIYKGFAKAISEVGGEYLGVQ-QDLVLTPLMHDTPEELGQPF----DPRDWKKG -ECEPIPGKTMPKMTVVERDY--RKIHDKFTSIGPLLEKVGNGGKGIGWQTGHEVDVL--- -------RGLNKTVASGVAAGQPRLDTAIDAAEMILTLAPETNGHVAVKAWAALSKI---- ------TGRDHTHLALPRE----H-DSIRFR-DVQAQPRKIISSPTWSGLESEEVSYNAGY -TNVHEYIPWRTLT------GRQQFYQDHLWMRAFGEGLCLYKPHVDLK--T--TAAILG- -------------------------KKPNGHHEIVLNW-------------------ITPH -QKWGIHSTYSDNLRMLTLSR---------------GGPHVWVSEIDAKKAGIVDNDWI-- ----------------EVFNVNGTLTARAVVSQRVPEGMSLMYHAQE-------------- ---KIINVP-GAETSGKRGGIHNSVT---RTVVKPTHMIGGYVQ---------LAWGFNYY -GTV-GSNRDEFVIVRKMK-------NVDW---LDQPLSEHA------------------- ----- ->littlewolfcreek_2019_sw_WHONDRS-S19S_0078_B_bin.9_k121_678409_7 rank: C; aql:BXU06_02425 nitrate reductase subunit alpha; K00370 (db=kegg) -MEYARLVTHLAESENSRACFFLAPLLSNYPTLPPLPPPRSPSDQWAVCLRLLTIGGIGTG -LSGPANPLEARMSHFLDRLNF--LGKVKS--TFS-DGHGAVVKEDR------KW-EDGYR -QRWQH------DKIVRSTHG-VNCTGSCSWKVYVKNGLITWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYVYSAQRVKYPMVRGVLMQ---------HWRE--LRKKLGPIEA -WQRISQTPEIATQYKTQRGQGGFVRASWDEVNEIIAASNAFTIKNY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------I---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------G ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----GVPRLVL------------------------------------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.15_k121_1272084_2 rank: A; chrm:FYK34_01610 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLKF--MSKVKA--TFS-NGHGAVVKEDR------QW-EDAYR -QRWQH------DKIVRSTHG-VNCTGSCSWKVYVKNGLITWETQQTDYPRTR-----ADL -PNHEPRGCPRGASYSWYVYSAQRVKYPMVRGKLMQ---------MWREARKS--MGAIDA -WESISQNPEKAKEYKSRRGQGGFVRASWDEVNEMVAAANAYTIKNY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVPLSFYDWYCDLPPASPQIWGEQTDVAESADWYNSTYLMVWGSNVPMTRTPDAH -FYTEVRYKGTKTVAVSSDFGEMAKFGDIWLAPKQG-TDAALAMAMGHVIFKEFHL----D -KQSSYFTDYIRRLTDMPMLVRLK-----EEGGRYLPEYFLR---------ASHLEGG-LG -EDNNPDWKTLLIDENTGDIVAPNGSIGFRW-----GQPEGKTGKWNLEHRDGAT------ --------AREIQGQLTLLGQ------Q----------DEVVGVGF---PYFGAEH----- --------------------------DELLTRNVPAKRITLA-DGSTALVATVFDL----- --------MAANYGIDRGL--------GGGNVASSYMDDVPYTPAWQQKHTGVKPEMVIQV -AREF------AQNADQTQGKSMVIVGAALNHWYHMD-MTYRGIINMLMLCGCIGQSGG-G ---WAHYVGQEKLRPQS---GWAPLAFGADWNRPARQMNGTSFFYAHTSQWRHEKLGVNEI -------LCPTADGSMANMSLIDYNAKAERMGWLPS-----APQLS-TNPLDITRQAEAAG -QDPV-----AYTVQGL-----KD---------------GTLDMSCNDPDNPK-NFPRNLF -VWRSNILGS---SGKGHEYFLKYLLGTQNALMS-----DEANCITPTEITVRPAA-EGKL -DLLVVLDFRMSTTCLYGDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-SEAVQPLW -QSKTDWEIYKGFAKAISEVGGDYLGVQ-KDLVLTPLMHDTPQELGQAF----DPRDWKKG -ECEPIPGKTMPAMTVVERDY--KAIYQKFTSIGPLMEKAGNGGKGMAWKTGHEIEKL--- -------RAMNKVVQDGVAKGQPRLDTAIDAAEMILTLAPETNGHVAVKAWESLSKI---- ------TGRDHTHLAIPRE----H-DHITFR-DIQAQPRKIISSPIWSGLESEEVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHQWMRAFGEGLCLYKPPVDLKT----------- -TAAVHR------------------HKPNGNTEILLNF-------------------LTPH -QKWGIHSTYSDNLRMLTLSR---------------GGPHVWISEKDAQEAGIVDNDWI-- ----------------EVFNVNGTLTARAVVSQRIPKGMTLMYHAQE-------------- ---KIVNVP-GAEMSGKRGGIHNSVT---RAVTKPTHMIGGYAQ---------YSYGFNYY -GTV-GANRDEFVVVRKMK-------NVDW---MDQPK----------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_3271_6 rank: C; fpho:SHINM1_007130 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------T -ASHQAMMNSRS-----------------------------------------------NG -NPEIA------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------------LN------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------F------------------------------------- ------------------------------------------------------------- ---------------------------------------------------------ITPH -QKWGIHSTYTDNLIMLTLSR---------------GGPCVWVSEVDATKIGLVDNDWV-- ----------------EAFNANGALCARVIVSQRVPEGMMMMYHAQE-------------- ---KIVNVP-GSEIMNTRGGIHNSVT---RAVVKPTHMIGGYAQ---------LSYGFNYY -GTV-GSNRDEFVILRKMN-------KVDWMDDEASPAGENS------------------- ----- ->nebranchanacostia_2019_sw_WHONDRS-S19S_0081_B_bin.6_k121_1546998_5 rank: A; fpho:SHINM1_007130 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FIDRLKF--LSADKE--HFS-DGHGQTTTENR------AW-EDAYR -KRWQH------DKIVRSTHG-TNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDM -PNHEPRGCARGASYSWYLYSANRVKHPMVRSSLLK---------AWRK--HRQTLSPVAA -WEAVVSDPKTVRRYQSERGKGGFLRTSWDEVNDMVAAANIYTAKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQTWGEQTDVPESADWYNSTYIMMWGSNVPQTRTPDAH -FMAEVRYKGAKVVSVFPDYSEGAKFGDMWLHPKQG-TDAALAMAMGHVILKEFHV----A -GKSEYFDNYCRQYTDMPNLVCL-----VEKDGAYVPDRYVR---------AADLVGA-LG -EANNPDWKTLVIDEASDALTVPVGSIGFRWGQEKDGAPTADKGKWNLKEET--------- --------SDGRQIKPRLSLV------K--------HHDAVVEAAF---PYFGNIA----- -----------------HEHFNSTSHSDVLKRRVPVRKIQTA-QGE----MLVATV----- ----YDLYVAN-YGVDQGL--------GGDNVASSYDDDIPYTPAWQEKITGVPRDQVTQV -AREF------AQNAHDTHGKSMVIIGAAMNHWYHMD-MNYRSIMNMLIMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWNRPPRHMNSTSFFYAHTDQWRYETLRVADL -------LSPLADKGKFSGSLIDFNARSERMGWLPS-----APQLE-RNPLELSREAIAKG -LDPK-----EYVVNQL-----KS---------------GELKFSCEDPDNPK-NFPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTTNGVQG--KDLGHTGEVKPQDVVWHDEAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWEIYKGFAKRFSELS---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------DGYLGVEKDIVAVPIL--HDTAGE- ------------------------------------------------------------- -----IAQPYDTKDWKK-------------------GECEA-IPGKTMPNFVVVERNYSEI -H--------------EKFTSLGPLLDK--------------------------------- -------------------------------------------------------LGNGGK -GIN-------------------------W---NT-------------------------- ----- ->lecontecreek_2019_sw_WHONDRS-S19S_0018_A_bin.2_Ga0451754_0000231_3 rank: A; fpho:SHINM1_007130 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FIDRLKF--LSADKE--HFS-DGHGQTTTENR------SW-EDAYR -KRWQH------DKIVRSTHG-TNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDM -PNHEPRGCARGASYSWYLYSANRVKHPMVRSSLLK---------AWRK--QRQTLSPVAA -WEAVVSDPKTVRRYQSERGKGGFLRTSWDEVNDMVAAANIYTAKKH----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPASPQTWGEQTDVPESADWYNSSYIMMWGSNVPQTRTPDAH -FMAEVRYKGAKVVSVFPDYSEGAKFGDMWLHPKQG-TDAALAMAMGHVILKEFHV----A -GKSEYFDNYCRQYTDMPNLVCM-----VEKDGAYVPDRYVR---------AADLIGA-LG -EANNPDWKTLVIDEESDALTVPVGSIGFRWGQDKDGAPTADKGKWNLKEET--------- --------TDGRKIKPRLSLV------Q--------KHDAVVEAAF---PYFGNIE----- -----------------HEHFNNTSHSDVLKRRVPVRKIQTA-QGE----MLVATV----- ----YDLYVAN-YGVDQGL--------GGDNVAGSFDDDVPYTPAWQEKITGVPRDQVTQV -AREF------AQNAHDTHGKSMVIIGAAMNHWYHMD-MNYRSIMNMLIMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWSRPPRHMNGTSFFYAHTDQWRYETLRVADL -------LSPLADKNKFSGSLIDFNARSERMGWLPS-----APQLE-RNPLDLTREAIAKG -VDPK-----EYVVNQL-----KS---------------GELKFSCDDPDNPK-NFPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTTNGVQG--KDLGQTGDVKPQEVVWRDEAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -EARSDWEIYKGFAKRYSELSDGYLGVE-KDLVAVPILHDTAGEMAQPY----DAKDWKKG -ECEAIPGKTMPNFVVVERNY--SEIYEKFTSLGPLLDKLGNGGKGINWNTDHEIKLL--- ------GELNYKVRNEGVAHGRPNIDTDIDATEVVLTLAPETNGEVAVKAWAALSEF---- ------TGIDHRHLALTRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESEHVSYNAGY -TNVHELIPWRTLT------GRQQLYQDHEWMRAFGEGFCSYKPPVDLRSHQ--Q--VMN- -------------------------AKPNGNKEIALNF-------------------ITPH -QKWGIHSTYTDNLIMLTLSR---------------GGPIVWLSEVDAQKVGIEDNDWI-- ----------------EAFNSNGALCARAVVSQRVPEGMVMMYHAQE-------------- ---KIVNVP-GSEITQTRGGIHNSVT---RAVLKPTHMIGGYAQ---------LSYGFNYY -GTV-GSNRDEFVVVRKMN-------KVDW---MDGPAQPAMEA----------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.14_scaffold_493_9 rank: A; fpho:SHINM1_007130 narG; respiratory nitrate reductase subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FIDRLKF----FVTPTEGFA-DKHGATVDEDR------TW-EDGYR -KRWQH------DKIVRSTHG-TNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDM -PNHEPRGCQRGASYSWYLYSANRVKYPMVRSPLLK---------LWRE--KRKMLAPVDA -WKAITDDHNAVRSYQSQRGLGGFLRTTWDEVNEMIAAANVHTIKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCTSFYDWYCDLPPSSPQMWGEQTDVPESADWYNSTYIMMWGSNVPQTRTPDAH -FMTEVRYRGTKVVSVFPDYAEGSKFGDLWLHPKQG-TDAALALAMGHVIVNEFHV----K -NKSDYFDQYCRQYTDMPNLVKL-----VKQGDYYVPDRLVR---------CSDFTDN-LG -QDNNPDWKTVVIDENTNMLTVPVGSIGFRW----GQKEGEDLGKWNLQEKN--------- --------AAGADIRPRLSLI-----------------GGHDGVVLVASPYFGNQQ----- -----------------HDHFQHTDHANILPHNIAVRKLQSR-DGE----ILVASV----- ----YDLFVAN-YGVDQGL--------GGPNVASSYDDDIPYTPAWQEKITGVKRHLVIQV -AREF------ADNADKTHGKSMVIVGASLNHWYHMD-MNYRSVINMLVMCGCIGQSGG-G ---WAHYVGQEKLRPQI---GWAALAFATDWHRPPRQMNGTSFFYAHTDQWRYETLSVKKI -------LSPLADPKKFSGSLIDFNVRSERMGWLPS-----APQLQ-TNPLQVCRDAQKAG -MSAK-----EYAVAQL-----KS---------------GKLRFSCEDTDHPD-NYPRNMF -IWRSNLLGS---SGKGHEYFLKHLLGTTHGVQG--KDLGQSGGQKPEEVVWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----F-SAAVDPAW -MARSDWEIYKGIAKKFSELTEGHLGVE-QDLVTVPIMHDTPDELGQAF----EPKDWKRG -ECEAVPGKTMPNFVLVERDY--PNTYKKFTALGPLMDKLGNGGKGINWNTQHEVKHL--- ------GELNYLVSEEGVTKGRPKIETDIDATEVILMLAPETNGEVAVKAWDALSKF---- ------TGIDHTHLAKTRE----D-EKIRYR-DIQAQPRKIISAPTWSGIESEHVSYNAGY -TNVHELIPWRTIT------GRQQLYQDHHWMRAFGEALCVYKPPIDTASHQ----AMMN- -------------------------SRSNGNPEIALNF-------------------ITPH -QKWGIHS----------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->logan1_2019_sw_WHONDRS-S19S_0097_B_bin.20_k121_1372227_2 rank: A; aep:AMC99_00129 Respiratory nitrate reductase alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------F-GNLEH -DHFQG----------------------------------------TDHPSVLK----RRV -PVREVQL-KDGKAFVATVFDLFCANYGL-------------------------------- -----------------DRGLGG-----------------EHVARDY-------------- ------------------------------------------------------------- ----------------GAMEPYTPAWA---------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------E--------------------------------- ------------------------------------------------------------- ------------------------------------------------KITGVPADQIITI -AREF------ASNAEVTKGKSMVILGAGLNHWYHMD-MNYRGIINLLVMCGCVGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWNRPPRHMNSTSFFYAHTDQWRYETLGVEEI -------LSPTAPEGDWDASLIDYNARAERMGWLPS-----APQLK-TNPLEVGKAIKASG -KDAK-----DYVAEAL-----QS---------------GALEMSCFDPDDPA-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTAHGVQG--KDLGETGAQKPKEVKWHEEAPKGKL -DLLVTLDFRMSTTCVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-SAAVDPVW -ESRSDWDIYKGIAKKFSEIAPEVLGVE-HDVVLTPIQHDSPNEIAQAY----DVADWGHG -QVEAIPGKTMANVALVERNY--AELYQKFTALGPLMEKLGNGGKGIGWNTDHEVEGL--- ------RKLNGTVAADGPAKGMAQIETAIDAAEVILMLAPETNGEVAVKAWADLGKK---- ------TGLDHTHLALPKE----D-EKIRFR-DIQAQPRKIISSPTWSGIESEHVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHKWMRAFGEGLCVYRPPIDTKAVK--PML---- -------------------------DEAKDAPHVILNF-------------------ITPH -QKWGIHSTYTDNLLMLTLSR---------------GGPIVWMSEVDAAKAGLVDNDWV-- ----------------ETFNSNGALVARVVVSQRMKEGTLFMYHAQE-------------- ---KITNVP-GSPLTGQRGGIHNSVT---RAVLKPTHMIGGYVQ---------LAYGFNYY -GTV-GSNRDEYVIVRKLS-------KVDW---LEGALS-------EGETAA--------- ----- ->lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.6_k121_1211148_1 rank: A; emv:HQR01_12825 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLTF--FRHKKE--QFS-DGHGVTTAEAR------DW-EDSYR -KRWQH------DKIVRSTHG-VNCTGSCSWKIYVKGGIITWETQQTDYPRTR-----PEL -PNHEPRGCPRGASYSWYIYSAQRLKYPLIRKRLIK---------LWRA--ARKDLPPVAA -WASIQADPVKRKSYTAIRGHGGFVRSTWDEVNEIIAAANAYTAKKW----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNSGFLMLWGSNVPQTRTPDAH -FMTEARYRGAKVAVVSPDYAEATKFADLWLNPKQG-TDAALAMAMGHVILREFHL----D -RQVPYFEDYCRRYSDMPMLVRL-----IEQDGRLVPERLLR---------ASDFKGD-LG -EKNHPEWKSVAIDEARDEVVAPTGSAGFRW---------GDKGKWNLEEKD--------- --------GKGAEVKLRMTAI---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------LDKDH---------------------------------------- ------------------------------------------------------------- -----------------------------------DEVVEVA------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_F_bin.6_scaffold_35_30 rank: A; aep:AMC99_00129 Respiratory nitrate reductase alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLTF--FRQKKE--PFS-EGHGVTTAEAR------DW-EDGYR -QRWQH------DKVVRSTHG-VNCTGSCSWKIYVKGGIITWETQQTDYPRTR-----PEL -PNHEPRGCPRGASYSWYIYSAQRLKYPLIRKRLVK---------LWRA--ARKDLPPVAA -WASIQADPVKRKSYTAIRGHGGFVRSTWDEVNEIIAAANAYTAKNY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNSGFLMLWGSNVPQTRTPDAH -FMTEARYRGAKVAVVSPDYAEATKFADLWLNPKQG-TDAALALAMGHVILREFHL----D -RQVPYFEDYCRKYSDMPMLVRL-----VEQDGRLVPERLLR---------ASDFAGG-LG -ETNNPEWKCVAIDETSDEVVAPSGSVGFRW---------GEQGKWNLKEED--------- --------GRGEAVKLRMTAILDKDHDE---------------VVEVAFPYFGNRE----- -----------------HDHFQGTDHPDVLMKRVPVREMQLA-EGRAYVATV--------- ----FDLLCAN-YGLDRGL--------GGQHVARDYADGAPYTPAWAEKITGIPADAIVTT -AREF------AANAEATNGKSMVILGAGVNHWYHMD-MTYRGIINLLVMCGCVGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWNRPPRQMNSTSFFYAHTDQWRYETLGVGEI -------LSPTAPKGDWDASLIDYNVRAERMGWLPS-----APQLK-TNPLEVGRAARASG -LEPK-----DYIAQAL-----KG---------------GDLELSCMDPDDPA-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTAHGVQG--KDLGEMGGQKPREVKWHEEAPQGKL -DLLVTLDFRMSTTCVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-SAAVDPVW -ESKSDWEIYKGIAKTFSEVAPEVLGVE-QDLVLTPIQHDTANEIAQPF----DVADWGHG -EIEAIPGRTMATVALVERDY--PNLYNRFTALGPLMDKLGNGGKGIGWNTAAEVENL--- ------RRLNGVQDAGSPAAGMAKIETAIDAAEVLLMLAPETNGEVAVKAWDALSQF---- ------TGINHRHLALPKE----E-EKIRFR-DIQAQPRKIISSPTWSGLESEHVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHKWMRAFGEALCVYRPPIDTKAVK--PML---- -------------------------DQAEGRPHVVLNF-------------------ITPH -QKWGIHSTYTDNQLMLTLSR---------------GGPIVWMSEVDAAKAGLVDNDWV-- ----------------ETFNTNGALVARVVVSQRMKEGTLFMYHAQE-------------- ---KIVNVP-GSPLTGQRGGIHNSVT---RAILKPTHMIGGYVQ---------QAYGFNYY -GTV-GSNRDEYVIVRKLE-------KVDW------LEGALPEG--ENAA----------- ----- ->lewisrun_2019_sw_WHONDRS-S19S_0014_F_bin.22_scaffold_791_5 rank: A; aep:AMC99_00129 Respiratory nitrate reductase alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLTF--FRQKSE--TFS-DGHGLTTGEDR------HW-EDGYR -KRWQH------DKIVRSTHG-VNCTGSCSWKIYVKGGIITWETQQTDYPRTR-----PEL -PNHEPRGCPRGASYSWYIYSAQRLKYPLIRKRLVK---------LWREARRT--LPPVAA -WASIQADPVKRKSYTAIRGHGGFVRSTWDEVNEIIAAANAYTAKTY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNAGFLMMWGSNVPQTRTPDAH -FMTEARYRGTKVAVVSPDYAEATKFADLWLNPKQG-TDAALALAMGHVILREFHL----D -RQVPYFEDYCRRYSDMPMLVRL-----VEQDGRLVPERLLR---------ASDVKGG-LG -EGNNPEWKCVAIDEASDELVVPSGSAGFRW---------GEKGKWNLEEKD--------- --------GQGREVKLRMTAILDKDHDE---------------VVEVAFPYFGNRE----- -----------------HDHFEGTDHPDVLMKRVPVRQLDLT-EGR----AYVATV----- ----FDLLCAN-YGLDRGL--------GGEHVARDYAAMSPYTPAWGEKITGVPADAIITA -AREF------AANAEATNGKSMVILGAGLNHWYHMD-MNYRGIINLLVMCGCIGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWNRPPRQMNSTSFFYAHTDQWRYETLGVSEI -------LSPTAPKGDWDASLIDYNVRAERMGWLPS-----APQLK-TNPLEVGRAAKASG -MEPK-----DYVAQAL-----KG---------------GDLELSCLDPDDPA-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTAHGVQG--KDLGEMGGQKPQEVKWHDEAPQGKL -DLLVTLDFRMSTTCVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-SAAVDPVW -ESRSDWEIYKGIAKTFSEVAPEVLGVE-QDLVLTPIQHDTANEIAQPF----DVADWGKG -EVEPIPGKTMATVAVVERDY--PNLYKRFTALGPLMDKLGNGGKGIGWNTVTEVDNL--- ------RKLNGTVGDDGPTKGMARIDTAIDAAEVLLMLAPETNGEVAVKAWDALSQF---- ------TGRDHKHLALPKE----E-EKIRFR-DIQAQPRKIISSPTWSGLESEHVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHKWMRAFGEALCVYRPPIDTKAVK--PML---- -------------------------DQAEGRPHVVLNF-------------------ITPH -QKWGIHSTYTDNLLMLTLSR---------------GGPIVWMSEVDAAKAGLVDNDWV-- ----------------ETFNSNGALVARVVVSQRMKEGTLFMYHAQE-------------- ---KIVNVP-GSPLTGQRGGIHNSVT---RAILKPTHMIGGYVQ---------QAYGFNYY -GTV-GSNRDEYVIVRKLE-------KVDW---LEGALS-------EGENAA--------- ----- ->NASQAN2015_010_A_bin.16_Ga0466474_000034_25 rank: A; oca:OCAR_5043 nitrate reductase, alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLLF--FKKKVD--TFS-GTHGVVTNEDR------SW-ESSYR -SRWQH------DKIVRSTHG-VNCTGSCSWKIYVKNGLVTWETQQTDYPRTR-----PDL -PNHEPRGCPRGASYSWYLYSANRLKFPMIRGRLVR---------LWRE--ARLSLDPVDA -WASIVEDPLKSAEYKSKRGLGGLVRANWDEVNEIIAAANIYTAKTF----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVSMSFYDWYCDLPPASPQTWGEQTDVPESADWYNAGFLMLWGSNVPQTRTPDAH -FMTEARYKGAKVVVVSPDYSEASKFADLWLHPKQG-TDAALAMAIGHVILKEFHV----E -GQSPYFNGYVRENTDLPFLVMLK-----EQDGYYVQDRFLR---------ASDFSGS-LG -QDNNPDWKTVAYDELNGQIVPPCGSIGFRW---------GESGQWNIEQKT--------- --------SDNQAVKLRLSLI------D-----------IKDEVASVGFPYFGGSE----- -----------------HPHFTHSAHDAIQKRNVPVKKIILA-DGTEVLATTVFDL----- -------LVAN-YGIDRGL--------GGGNVAASYDEDVPYTPAWQEKITGVSRSNVIAV -AREF------AINAEKTKGRSMVILGAGINHWYHMD-MNYRGIMNMLMLCGCVGQSGG-G ---WAHYVGQEKLRPQT---GWLPLAFGLDWKRPPRQMNSTSFFYNHTSQWRYETLKVSEI -------LSPTAKPEDWQGSLIDFNVKSERMGWLPS-----APQLQ-TNPLQVVRDAKAAG -IAPA-----DYVVAGL-----KN---------------GSLKMSCEDPDNPL-NFPRNMF -VWRSNLLGS---SGKGHEYFLKYLLGTQHGIQG---KDLGDDGDKPSEVVWHEKAAEGKL -DLLVTLDFRMSTTCLYSDIILPTATW--YEKNDLNTSDMH-PFIHP----L-SKAVDPAW -ESRSDWDIYKGIAKKFSELTIGHLGLE-QDIVTVPVLHDTPGELAQPF----EVKDWKKG -ECEPVPGKTMPSLVVVERDY--PNTYKMFTSLGPLLSKIGNGGKGIAWNTETEVKQL--- ------GELNYLVTEEGISKGLPRIASDIDATEVILMLAPETNGHVAVKAWEALSKI---- ------TGRDHTHLAKPRE----D-DKIRFR-DVQAQPRKIISSPTWSGLESEQVCYNACY -TNVHERIPWRTLT------GRQQFYQDHSWMRAFGETLCVYKPPVDTRSIT--P--ILG- -------------------------QKPNGNDELVLNF-------------------LTPH -QKWGIHSTYTDNLLMLTLSR---------------GGPIVWMGEIDAAKVGIKDNDWI-- ----------------EAFNVNGALVARAVVSQRVPEGMCMMYHAQE-------------- ---KIVNMP-GAETTGGRGGIHNSVT---RATLKPTHMIGGYAQ---------LSYGFNYY -GTV-GSNRDEFVIIRKMS-------KVDW---LEEPKPEQA------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_A_bin.8_Ga0451740_0000093_1 rank: A; tun:J9260_09180 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- --------------NMLAMCG---CVGQSG------------------------------- -----------------------------------------------------------GG -WAHYV---------------------------------------------GQEKL----- ------------------------------------------------------------- --------------------------------------------------------RPQTG -WL------------------PLAFALDWSRPPRQM-NSTSFFY----------------- ------------------------------------------------------------- ------------------------------------------------------------- --------SHSNQWRYEKLEL---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------KEILSPL -ANPA------------------RHSGSLIDYNVRSE------------------------ ------------------------------------------------------------- -----------------------------RMGWLPS-----APQLN-TNPLRIAKAAQAAG -MSPA-----EYTVAAL-----KA---------------GKIAFAAEDPDNPQ-NFPRNLF -VWRSNLLGS---SGKGHEYMLKYLLGTQHGVQS--KDLGVMGGAKPEEVKWHDTAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKDDLNTSDMH-PFIHP----L-TAAVDPAW -EARSDWEIYKGIAKAFSKVCEGHLGVE-TDLVTLPLLHDAPAELGQAM----GVKDWKKG -ECELIPGKTAPALVAVERHY--PDTYARFTAIGPLLEKLGNGGKGISWNTETEVAFL--- -------GQLNHQQTTGINEGRPCLNSAIDAAEMILSLAPETNGQVAVKAWQALSKI---- ------TGIDHSHLAIHKE----D-EKIRFR-DVVAQPRKIISSPTWSGLEDEHVSYNAGY -TNVHELIPWRTLT------GRQQFYLDHDWMRDFGESMLVYRPPINTKTIK--P--LLN- -------------------------QRSNGNPELALNW-------------------ITPH -QKWGIHSTYTDNLIMLTLSR---------------GGPIVWMSETDAKTLGIQDNDWI-- ----------------DLFNANGAIAARAVVSQRVMPGMVMMYHAQE-------------- ---KIVNVP-GSVITGHRGGIHNSVT---RVCPKPTHMIGGYAQ---------QAYGFNYY -GTV-GSNRDEFVIVRKMT-------QVEW---LDNE---------GNDYAQEAVQ----- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_1345490_1 rank: C; ops:A8A54_10745 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLN---FLARKNADTFS-DGHGVTTTENR------DW-EDAYR -KRWQH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYMYSANRVKHPLIRSRLLK---------LWRK------------ ------------------------------------------------------------- --------------------ERTIK------------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------------TPIGAWAAIQEN--------- --------PEKRADYMKMRGL---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------G ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.47_k121_924190_1 rank: A; ops:A8A54_10745 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------FLARKNAGTFS-DGHGVTTTESR------DW-EDAYR -KRWQH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYMYSANRVKHPLVRSRLLK---------LWRK--ERTIKTPIGA -WAAIQENPEKRADYMKMRGLGGFVRATWEEVNEIIAAANAYTVKTY----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGVCLSFYDWYCDLPPASPMTWGEQTDVPESADWYNAGFLILWGSNVPQTRTPDAH -FYTEVRYKGAKSVVVSPDYSEAAKFSDLWLHPKQG-TDAALAMAMGHVILREFHL----D -RQADYFEDYCRRYTDMPMLVKLTG----KDGHFIPD-RFVR---------ASDFTGA-LD -ETNNPEWKTVAVDAKTKQFVSPGGSIGYRW---------GEQGKWNLEAKDGKGADVDLA -MSFI---LDGEHDTIANVGF----------------------------PYFGNRE----- -----------------HDYFEGTDHDSVLVRKVPARKVKLA-DGEALVATV--------- ----FDLFVAN-YGLDRGL--------NDPNSAKSYQENLPYTPAWAEKITGVPRDQIIAV -AREF------ASNAEKTNGRSMVILGAGLNHWYHMD-MNYRGIINMLVMCGCVGQSGG-G ---WSHYVGQEKLRPQT---GWTALAFALDWNRPPRHMNGTSFFYAHTDQWRYETLKVDEI -------LSPTAPEGPWDASLIDYNIRAERMGWLPS-----APQLK-TNPLEVSKQAAAAG -KEAK-----DFVAEQL-----KA---------------GALSMSCEDPDDKA-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTKHGVLG--KDLGEEGRQISKEAVWHDEAPEGKL -DLLVTLDFRMSTTCVYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SSAADPAW -DARSDWEIFKGIARKFSEVAPEVLGVE-KDVVLVPTLHDTAGELAQPI----DVKDWKKG -EIEPIPGRTMPTVAVVERDY--PNLYKKFTSVGTLLDTVGNGGKGIAWNTEHEVDLL--- ------ARLNGVVQEEGVTRGRPRIESDIDATEVILSLAPETNGEVAVKAWEALSKF---- ------TGRDHTHLAIPKE----D-EKIRFR-DVVAQPRKIISSPTWSGLESEKVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHLWMRAFGEGFCVYRPPIDTKT----------- -VNPAIR------------------SKADGKPHLVLNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGPVVWISEPDAKRAGIVDNDWV-- ----------------EVYNTNGAIVARAVVSQRMKDGTVFMYHAQE-------------- ---KIVNTP-GSPITGQRGGIHNSVT---RVITKPTHMIGGYAH---------QSYGFNYY -GTV-GANRDEFVVVRKLE-------TVDW---LEGPHTESVAY--NKEAAE--------- ----- ->lecontecreek_2019_sw_WHONDRS-S19S_0018_F_bin.2_scaffold_1_206 rank: A; bprc:D521_0425 Respiratory nitrate reductase, alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLKF--LSADKE--EFS-DGHGVTVGEDR------TW-EDAYR -SRWQH------DKIVRSTHG-TNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYMYSANRVKYPMIRGRLLK---------QWREAKSVA-KSPVDA -WANLVENTAKRKEWMELRGKGGFVRSSWDEVNEIIAAANVYTIKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADIWMHPKQG-TDAAIAMAMGHVILKEFYF----N -KRTEYFDDYVRRYTDMPNLVMLEEKVLDDGRKVLVPGRYAR---------SSDFDGK-LG -QTNGADWKTVAFD-TAGKPVVPNGSIGFRW----GPEGRKDQGKWNLESKE--A------ --------NYGNDVKLKLSLMEDQSIHD------------VVPVGF---PYFGGID----- -----------------TPYFDANKQSDVLVQNIPAKKIILT-ENGVEKEVFVATV----- ----FDLLAGN-YGIDRGL---------GGECAKSYDDNVPYTPAWQESITGVKREQVIAV -ARQF------AENAEKTKGKSMVIIGAAMNHWYHCD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTPLAFALDWIRPPRQQNSTSFFYAHTDQWRYEKLGMEEV -------LSPLANKEEYTGSMIDFNVRAERMGWLPS-----APQLK-TNPLEVVKEALAAG -KDPK-----KYVVDGL-----KS---------------GTLQMSCEDPDHPS-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGADEARPSEVEWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -EARSDWDIYKGFAKKFSEVCVGHLGVE-KEIVMTPLMHDTPAELAQAF----DVQEWKKG -ECDLIPGKTAPQIAVVERDY--PNTYNRFTALGPLMDKVGNGGKGIAWDTKVEVEQL--- -------RELNGRVEHGEMKGMAKISTDIDAAEVVLMLAPETNGHVAVKAWDALSKI---- ------TGLEHAHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNACY -TNVHEYIPWRTLT------GRQQFYQDHKWMRAFGEGFVSYRPPVDLKTII--------- -----------EVKGIKPNGNK----------EIVLNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGPVVWLSEDDAVKAGIVDNDWV-- ----------------ELYNANGAIAARAVVSQRVNPGMVMMYHAQE-------------- ---KIINTP-GSEITGMRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVTVRKMR-------NIDW---LDTENANSVQA----------------- ----- ->whiteclaycreek2_2019_sw_WHONDRS-S19S_0038_B_bin.50_k121_1710496_1 rank: A; pde:Pden_4236 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLNF--LKSTRK-DTFA-DGHGQTTIENR------DW-EDTYR -SRWRH------DKIVRSTHG-VNCTGSCSWKIYVKNGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYLYSANRVKTPLVRGRLMR---------RWRDLRRT--LGPIEA -WTAIQSDPAARADYVKARGRGGFVRASWDEVTEIVAAANAYTAKTW----GPDRV-FGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPMTWGEQTDVPESADWYNAGFLILWGSNVPQTRTPDAH -FYTEARYRGTKSAVVSPDYSEAAKFGDIWLNAKQG-TDAALAIAMGHVILREFHL----D -RQVDYFEDYTRRYSDFPMLVKLEP-----KGDRFVPGRMLR---------AADIDGA-LG -ETNNPDWKTVAIDDASGRLVAPNGSIGHRW---------GEQGTWNLEEKA--------- ---------GAESVRLRTTLI------------LDGQNDGTAGVDF---PYFGGSA----- -----------------TNGWQACDTPDVLTRAIPVRKVALK-DGE----AMVATV----- ----FDLLCAN-YGLDRGL--------GGDWVARDYGSDMPGTPAWAERITGVPADRIIQV -AREF------AANAEKTGGKSMIIIGAAMNHWYHMD-MNYRGVINMLVMCGCVGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWGRPPRHMNSTSAWYAHTDQWRYETVRSDEI ------LSPTAPAGDWSSLSLIDYNIRAERMGWLPS-----APQLR-TNPLQVAAAAKAEG -TEVR-----DYVAREL-----KA---------------GRLEMSCEDPDAPE-NWPRNLF -VWRSNLLGS---SGKGHEYFLKHLLGTDHGVLG--KDLGEEGRRKPVEARWHDKAPEGKL -DLLTCIDFRMSTTAVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-QAAVDPAY -ESKTDWEIFKAIAAKLSEIVPGYLGVE-TDVVQLPLQHDSPGEVAQPR-----VADWKQG -QCDLIPGKTAPAFIAVERDY--PNLYRRFTALGPLMEKAGNGGKGIAWDTKHEVAHL--- ------RALNGTVTDEGPTKGMARIDTAIDAAEVILMLAPETNGEVAVKAWEALSKA---- ------TGREHKHLALPKE----D-EKNRFR-DIAAQPRKIISSPTWSGIESESVCYNAGW -TNVHELIPWRTLT------GRQQLYQDHEWMLAFGEFFLAWRPPVDLKTIT--APATGA- -----------------LGANE---------KHVVLNF-------------------ITPH -QKWGIHSTYSDNLLMLTL------------------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.46_k121_495423_17 rank: A; acis:CBP35_16735 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLSY--FSQPRE--TFS-QGHGQTNGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLK---------HWRA-ALLLAKSPVDA -WANIVENESAKREWQKQRGLGGFVRSTWDEVNQMIAAANVYTIKKH----GPDRI-IGFS -PIPAMSMIS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSSFIIAWGSNVPQTRTPDAH -FLTEVRYKGTKVVSITPDYSEVAKLGDLWMHPKQG-TDAAVAMAMGHVILKEFYFKDGGK -GRSTYFDDYARRYTDLPLLVVLKEKTLPDGRTVMVPDRYVR---------ASDFPGQ-LD -QSNNPDWKTVGYD-ELGQVTLPNGSIGFRW----GADGRADEGLWNLENKE--A------ --------RTGNTVKLKLSVI------E--------DGEQAYDVADVAFPYFGGVQ----- ----------------TPNFTANEQGGDVMVRRVPVSHLELA-GHEAQGRVMVATV----- ----FDLLAGN-YGIDRGL--------PGEEPGGSYDADRPYTPAWQESITGVPREQIIAV -ARQF------ADNADKTHGKSMVIIGAAMNHWYHCD-MNYRGIMNMLMLCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWIRPPRQMNSTSFFYAHTDQWRYEKLGMEEI -------LSPLADKKSYSGSMIDYNVRAERMGWLPS-----APQLK-TSPLQVAKDAAAKG -MDAK-----DYVVQSL-----KD---------------GSLQMSCEDPDHPD-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTTHGVQG---KDLGRDEAKPEEVQWHANAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QAKSDWEIYKGFAKAVSEVSVGHLGVE-KDVVLTPIMHDTAGEMAQPY----GVRDWKKG -DCELIPGKTAPQVTVVERDY--PNLYKRFTALGPLMDKAGNGGKGIGWNTQTEVGQL--- ------GDLNGRVKEEGVTQGMPRIVSDIDATEVVLMLAPETNGHVACKAWEALGKQ---- ------TGRDHVHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYQDHPWMRDFGEGFVSYRPPVHLKALH----EVEG- -------------------------KKPNGNREIALNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGSVVWLSEDDAASAGIVDNDWV-- ----------------ELFNANGAIAARAVVSQRVNPGMVMMYHSQE-------------- ---KIINTP-GSEITGTRGGIHNSVT---RIVLKPTHMIGGYAQ---------YSYGFNYY -GTI-GTNRDEFVLVRKMD-------RVDWLDDEVSDTGAHA------------------- ----- ->lewisrun_2019_sw_WHONDRS-S19S_0014_B_bin.30_k121_510322_1 rank: A; hyb:Q5W_04195 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------QG------------------------------------------- ------------------------------------------------------------- -------------------------------------TDAALAMAMGHVVLKEFYFPAN-G -QRSSYFDDYARRYTDLPMLVMLKEQTLPDGSTTLVPDRYLR---------ASDFNGK-LG -QANNPDWKTVAFD-TTGKAVLPNGSIGFRW----GDQGREDAGKWNLESKE--A------ --------RDNGDVKLKLSVL------E-----DGAQDHQVVDVGF---PYFGGQQ----- ----------------TPNFPANAAVGDVNQAKVPAVRLRLG-KAGEERYALVATV----- ----FDLQVAQ-YGIDRGL----------GSGAKNYDDNAPYTPAWQETITGVPRQQVITV -ARQF------ADNADKTHGKSMVIIGAAMNHWYHAD-MNYRGVINLLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWLRPPRQQNSTSFFYAHTDQWRYEKLDVSEI -------VSPLADKAKFGGSMIDYNVRAERMGWLPS-----APQLK-TNPMQVVKDATAAG -MDPK-----DYVVQAL-----RD---------------GSLEMSCEDPDAPQ-NWPRNMF -VWRSNLLGS---SGKGHEYFCKHLLGTENGVQG---KDLGADEAKPTEVKWHKDAPQGKL -DLLVTLDFRMSTTCLYSDIVLPTASW--YEKNDLNTSDMH-PFIHP----L-SAAVDPVW -QSKSDWEIYKGFAKRFSEVCVGHLGVE-KEVVLTPLMHDTAAELAQPF----EVKEWKKG -ECELVPGKTAPQIAVVERDY--PNLYKRFTALGPLMNKLGNGGKGIGWKTEIEVEQL--- ------GQLNGVTREEGVTQGMPRIVSDIDACEVILQLAPETNGHVAVKAWDALGKQ---- ------TGRDHTHLALYRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHPWMVAFGEGFSSYRPPVDLK--T--TDVVQG- -------------------------LRPNGHKEIVLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGTVIWLSEDDAKSAGIQDNDWI-- ----------------ELFNVNGAVAGRAVVSQRVKNGMVMMYHSQE-------------- ---KIINTP-GSEITGVRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMQ-------KVDW---LDTP---------RDDHLVKAVQSQGEN -P--- ->yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_2728883_1 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------LYSANRVKYPLVRGRLLE---------RWRT-ALKTARTPVDA -WATIVENPDARRDYQKVRGMGGFVRSSWDEVNQLIAAANVYTIKKH----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQIWGEQTDVPESADWYNSTYIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAVTPDYSEVAKLADLWLHPKQG-TDAALAMAMGHVALNEFYF----K -QRSPYFDDYARRYTDLPLLVMLKEHILPDGSKTLVPDRYLR---------ASDFNGK-LG -QDNNPEWKTVAFD-AGGRAVLPNGSIGFRW----GAEGRSDAGKWNLENKE--A------ --------RHGAEVKLKLSVI------E--------DGTQAHEVVGVGLPYFGGVS----- ----------------TPHFTANAQQGEVNFVKVPAVRLRLG-KEGEQREALVATV----- ----FDLQVAQ-YGIDRGL----------GSGAKSYDDNAAYTPAWAESITGVPGDQIITV -ARQF------ADNAHKTRGKSMVIIGAAMNHWYHAD-MNYRGVINLLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWIRPPRQMNSTSFFYAHTDQWRYEKLGMEEI -------VSPLADKKLYGGSMIDYNVRAERMGWLPS-----APQLK-TNPLQVVKDATAAG -LDAK-----DYVVRGL-----RD---------------GTLQMSCEDPDAPQ-NWPRNMF -VWRSNLLGS---SGKGHEYFCKHLLGTESGVQG---KDLGKDDARPAEVAWHEHAPEGKL -DLLVTLDFRMSTTCLYSDVVLPTASW--YEKNDLNTSDMH-PFIHP----L-SAAVDPVW -QSRSDWEIYKGFAKAFSEVCIGHLGVE-KEVVLTPIMHDTAGEIAQPF----DVKEWKKG -QCELIPGKTAPQVTVVERDY--PNVFKRFTALGPLMDKLGNGGKGIGWKTGTEVEQL--- ------GQLNGTTQADGPTKGMPQIVTDIDACEVILQLAPETNGHVAVKAWQALGKQ---- ------TGRDHTHLALYRE----D-EKIRYR-DVQAQPRKIISSPTWSGIESETVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHPWMIAFGESMSSYRPPVDLKT----TSGIHN- -------------------------IKGNGNPEILLNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGPVVWLSEDDARLAGVQDNDWV-- ----------------EVFNINGAIAARAVVSQRVNPGMLMMYHAQE-------------- ---KIINTP-GSQITGVRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMS-------KVDW---LDTPR--------DDHLAAAYQAQGENP ----- ->yakimariver_2019_sw_WHONDRS-S19S_0060_B_bin.3_k121_3072591_1 rank: C; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FTLPRE--RSA-DGHGVVTGEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLE------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------------------RWRAALTTARTPVDA -WAT--------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------IVENP------------ ------------------------------------------------------------- ------------------------------------------------------------- -DARRDYQKVRGMG----------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------G---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.19_scaffold_731_2 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FKLPQE--TYS-GRHGVATNEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLE---------RWRA-ALKVAKTPVDA -WALIADDESARRDYQQVRGLGGFVRSSWDEVNQLIASANVYTIKKH----GADRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPSSPQIWGEQTDVAESADWYNSSFIIAWGSNIPQTRTPDAH -FFTEARYKGTKTVAVTPDYSEVAKLSDLWLHPKQG-TDAALAMAMGHVILKEFYFKDGGQ -GRSAYFDDYARRYTDLPLLVMLKEHQLADGSTTLVPDRYLR---------ASDFSGQ-FG -QDNNPEWKTLAFD-TSGNPVLPNGSIGFRW---GEQLDEGELAKWNLESKD--A------ --------RNGQDVKLKLSVV------E--------DGAQPHEIAEVAFPYFGGVE----- ----------------TPNFPANAAQGEINRAKVPTVRLDLVGQGGESRQALVATV----- ----FDLQVAQ-YGIDRGF----------GSGAIDYDDNVPYTPAWQESITGVPRDQVITV -ARQF------ADNADKTHGKSMVIIGAAMNHWYHAD-MNYRGVINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWAPLAFALDWIRPSRQMNGTSFFYAHTDQWRYEKLGVEEV -------LSPLADKAAFGGSMIDYNVRAERMGWLPS-----APQLK-THPMQVVKDASAAG -LDAK-----DYVARAL-----KD---------------GSLQMSCEDPDAPQ-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSNGVQG---KDLGADEAKPTEVKWHAKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTASW--YEKNDLNTSDMH-PFIHP----L-SAAVDPVW -QAKSDWEIYKGFAQAFSEVCVGHLGVE-KEVVLTPLMHDTPAELAQPF----GVQDWKKG -ECALIPGKTAPQVTVVERDY--PNTYKRFTALGPLMNKLGNGGKGIAWKTDLEVTQL--- ------GQLNGVTLEEGVTKGMPKIVTDIDACEVILQLAPETNGHVAVKAWEAQSKA---- ------TGRDHVHLALYRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHEYIPWRTLT------GRQQFYQDHPWMIAFGEGFSSYRPPVDLK-----TTGGLS- -------------------------IKSNGNAEIQLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGTVIWLSEEDATKVGIVDNDWI-- ----------------ELFNSNGAIVGRAVVSQRVKPGMTMMYHSQE-------------- ---KIINTP-GSEITGARGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDWLEEPAGAPASGAGH----------------- ----- ->eastforkpoplarcreek_2019_sw_WHONDRS-S19S_0039_B_bin.13_k121_238651_23 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FKLPRE--AFS-GDHGLTTNEDR------TW-EDAYR -NRWAH------DKVVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLE---------RWRA-ALKVAKTPVDA -WALIAEDDAARRDYQQVRGMGGFVRSSWDEVNQLIASANVYTIKKH----GADRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPSSPQIWGEQTDVAESADWYNSNFIIAWGSNVPQTRTPDAH -FLTEARYKGTKTVAVTPDYSEVAKLSDLWLHPKQG-TDAALAMAMGHVVLKEFYFKDGGK -GRSAYFDDYARRYTDLPLLVMLKEHKLPDGSITLVPDRYLR---------ASDFNGK-LG -QGNNPEWKTVAFD-ADGRAVLPNGSIGFRW---GEKLGEGETPKWNLESKE--A------ --------RHGQDVKLKLSVV------E--------EGEQEHEIAEVAFPYFGGVQ----- ----------------TPNFPANSAQGEINRAKVPAVRLRLG-KEGDERYALVATV----- ----FDLQAAQ-YGIDRGF----------GSGAASYDDNAPYTPAWQEAITGVPRDQVVTV -ARQF------ADNADKTQGRSMVIIGAAMNHWYHSD-MNYRGVINLLMMCGCIGKSGG-G ---WAHYVGQEKLRPQT---GWAPLAFALDWIRPSRQMNSTSFFYAHTDQWRYEKLGMEEV -------ISPLADRKIYDGSMIDYNVRAERMGWLPT-----APQLK-TNPMQVVRDAAAAG -LDAR-----DYVAKAL-----KA---------------GTLQMSCEDPDAPQ-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSNGVQG---KDLGAGDAKPSEVKWHASAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTASW--YEKNDLNTSDMH-PFIHP----L-SAAVDPVW -QSRSDWEIYKGFAKAFSEVCVGHLGVE-KDVVLTPLMHDTPAELAQPF----EVKDWKKG -ECELIPGKTAQQITVVERDY--PNTYKRFTALGPLMNKLGNGGKGIAWKTELEVTQL--- ------GQLNGVTLEEGVTQGMPRIVSDIDACEVILQLAPETNGHVAVKAWDALGKV---- ------TGREHKHLALYRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHEYIPWRTLT------GRQQFYQDHPWMIAFGEGFSSYRPPVDLKT----TAEIAG- -------------------------VKPNGNPEIQLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEEDAAKAGIVDNDWV-- ----------------ELFNVNGAISARAVVSQRVKPGMTLMYHAQE-------------- ---KQINTP-GSEITGMRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDW---LDEPAGTAGSGH---------------- ----- ->cobbmillcreek_2019_sw_WHONDRS-S19S_0090_B_bin.15_k121_168873_1 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FSQPKE--TFS-GDHGLTTGEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPMVRSRLLE---------RWRA-AMKTAKTPVDA -WATIVEDDAARRDYQKVRGMGGFVRSSWDEVNQIIAASNVYTIKKH----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWG--------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->NASQAN2011_265_B_bin.52_k121_959771_6 rank: A; pzh:CX676_21060 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------GEQTDVPESADWYNAGFLMLWGSNVPQTRTPDAH -FYTEVRYRGTKSAVVSPDYSEAAKFGDIWLNPQAG-TDAALAMAMGHVILREYHL----D -RQAEYFEDYARKYTDMPMLVRLE-----DRDGHLVPGRMLR---------AEDFDGK-LG -ETNNPDWKTVAYDEATGQIAVPNGSIGFRW---------GEEGKWNLEQRA--------- ---------KGAEANLRLSQILDGHHDE---------------IVGVDFPYFGGVA----- -----------------TGDFVKCDHPEVLTRNIPARRAKLA-DGSQVLAATVFDL----- -------FCAN-YGLDRGL--------GGKWVSKDFNDDSPYTPAWAEKITGVAREKIIAV -AREF------AGNAEKTHGKSMVILGAGLNHWYHMD-MNYRGIINMLVMCGCIGQEGG-G ---WSHYVGQEKLRPQT---GWAPLAFALDWNRPPRQMNSTSCWYAHTDQWRYETLRAGEI -------LSPTAPEGDWHISLIDYNIRAERMGWLPS-----APQLK-TNPLEVAKAAKAA- ----------GKAIPAYVAEQLKS---------------GALQMSCEDPDAPE-NWPRNLF -VWRSNLLGS---SGKGHEYFLKHLLGTDHGVMG--KDLGEEGGVMPKEAVWHDEAPKGKL -DLLVTIDFRMSTTCVYSDIVLPTASW--YEKDDLNTSDMH-PFIHP----L-QAAVDPAY -ESKSDWEIFKSIARKFSEVAPEVLGVE-TDIVQLPLLHDTPGELAQAH-----VRDWKKG -ECDLIPGKTAPNYIAVERDY--PNLYKKFTSVGPLLEKLGNGGKGINWDTKVEVGHL--- ------RDLNGVVQDEGVSKGMAKLDTAINAAEMILMLAPETNGEVAVKAWEELEKP---- ------TGRHHAHLAEGAH----H-TKIRFR-DVAAQPRKIISSPTWSGIESETVCYNAGY -TNVHELIPWRTLT------GRQQLYQDHLWMRAFGEGFVSYRPPVDLKTI---TKAVNN- -------------------------DAAEGNPHVVLNF-------------------ITPH -QKWGIHSTYTDNLLMLTLNR---------------GGPVVWMSEVDAQKARLVDNDWV-- ----------------EAYNINGALTARVVVSQRIKQGTLFMYHAQE-------------- ---KIVNTP-GSEKTGHRGGIHNSVT---RTTLKPTHMIGGYAQ---------LSYGFNYY -GTV-GSNRDEFVIVRKMK-------KVDWLD-TPATHKVEAAE----------------- ----- ->NASQAN2011_265_B_bin.52_k121_465271_4 rank: C; pzh:CX676_21060 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------LLDRLNFFQSKELEQ---FS-DGWGQTTRENR------DW-EDVYR -NRWRH------DKIVRSTHG-VNCTGSCSWKIYVKSGIVTWETQQTDYPRTR-----AGL -PNHEPRGCARGASYSWYLYSANRVKNPLIRGALMR---------AWRK--MRPTMTPVAA -WAAIQNDPVLRASYTKTRGKGGFVRATWDEATEIIAAANAYTAKTY----GPDRV-FGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----LGGTCMSFYDWYCDLPPASPQTWGEQTDVPESADWYNAGFLMLWGSNVPQTRTPDAH -F----------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->watershed3_2019_sw_WHONDRS-S19S_0084_B_bin.45_k121_975195_1 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLSH--FSAPKE--EFA-DGHGVATGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----ADL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLQ---------HWRA-ALLVAKSPVDA -WASIVENPQARAEWQKQRGLGGFVRSTWEEINQLVASANVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAVAMAMGHVILKEFYF----D -KRSAYFDNYVRRYTDMPNLVQLEERTLPDGRKVMVPGRYLR---------ASDFDGK-LG -QSNNPEWKTVALD-QDDKIVLPNGSIGFRW----GAAEREDLGKWNLENKE--A------ --------RGDTQVTLKLSLM------E----GAKDGSAADYEVGDVGFPYFGGID----- -------------TPNFDANKQSAAVGDVLVRKVPVRRVKLG-KAGEERYALVATV----- ----FDLTVAN-YGVARGL--------PGENAALSYDDDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFA--------------------------------- -----------------------------------------------LDWVRPPRQMNSTS -FFY------------------AH------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------TDQWR--------------------------------- ------------------------------------------------------------- -----------------------Y------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------ERLGVDE------ ------------------------------------------------------------- -------------------------------ILSPL------------------------- --------------ADKSK------------------------------------------ ----- ->NASQAN2015_172_B_bin.54_k121_327740_1 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------IWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAIAMAMGHVILKEFYF----D -KRSAYFDDYVRRYTDMPNLVQLEERTLPDGRQVVVPGRYIR---------ASDFNGK-LG -QDNNPDWKTVALD-QNDKIVLPNGSIGFRW----GAEGRSDEGRWNLENKE--A------ --------RGDGDVKLKLSLM------E--------GEDSEYQVGEVAFPYFGGID----- -------------TPNFHANKQVSAVDDVLVRKVPVRRIKLG-KAGEERYALVATV----- ----FDLTVAN-YGVARGL--------DGETAAKDYEEDVPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNSTSFFYAHTDQWRYEKLGVEEI -------LSPLADKSKFGGSLIDYNVRAERMGWLPS-----APQLQ-TNPMQVVKDAQAVG -MDPK-----EYAIKAL-----QD---------------GSLKMSCEDPDNPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGPEDAKPAEVKWHDKAPEGKL -DLLVTLDFRMSTTCMYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSRSDWEIYKGFAKAFSEVCVGHLGVE-KELMLTPLMHDTPAELAQAF----EVNEWQKG -KCELIPGKTAPQITVVERDY--PSTYKRFTALGPLMAKVGNGGKGIGWNTADEVQQL--- ------GELNGHVRTEGVTKGFPKIETDIDACEVVLQLAPETNGHVAVKAWEALGKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHELIPWRTLT------GRQQFYLDHPWMIAFGEGLTSYRPPVDLKT----VDDMID- -------------------------RKPNGNKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKDAGIVDNDWV-- ----------------ELFNTNGAIAARAVVSQRVNPGMVMMYHAQE-------------- ---KIINTP-GSEISGMRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVIVRKMR-------KIDW---LDNEANNQVQV----------------- ----- ->Yukon_2004-1_F_bin.10_scaffold_678_1 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- -------------------------------------NGKLGQDNNP------EW-KTVAL -DQA--------DRVVL-----PNGSIGFRWGAEGRSD--------------------AGK -WNLEDKEARGG--------NEVKLKLSLM------------------------------- ---------------------------------------------------------EGEG -ADYEVGEVA--------------------------------------------------- ----------------------FPYFGGIDT------------------PNFSANKQASA- -------------------------------------VD---------------------D ------------------VLVR--------------------------------------- ------------------------------------------------------KVPVR-- ------------------------------------------------------------- -------------------------------------RIKLG-KAGEERYALVATV----- ----FDLTAAN-YGVGRGL--------PGEDAAASYDDDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNSTSFFYAHTDQWRYERLGVEEI -------LSPLADKTKFGGSMIDYNVRAERMGWLPS-----APQLQ-TNPMQVVKDAQAQG -MDPK-----EYAVKSL-----KD---------------GSLKMSCEDPDHPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGAEEAKPTEVTWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWEIYKGFAKSFSEVCVGHLGVE-KELLLTPLMHDTPAELAQAF----DVQEWSKG -DCDLIPGVTAPQINVVERDY--PNTYKRFTALGPLLEKHGNGGKGIGWNTDDEVHQL--- ------GELNGKVRAAGVTQGMPKIETDIDACEVVLQLAPETNGHVAVKAWEALGKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYLDHPWMLAFGEGMTTYRPPVDLKT----VDEMLN- -------------------------RRPNGNKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKSAGIVDNDWV-- ----------------ELFNSNGAIAARAVVSQRVNRGMVMMYHAQE-------------- ---KTINTP-GSEITGIRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKML-------KVDW---LDDEAPATVQA----------------- ----- ->cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.17_Ga0451756_0000169_17 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLNY--FSNPKE--AFS-GGHGVTTGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----PDL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLK---------HWRAALAVA-KSPVDA -WTSIVENPNARLEWQEQRGLGGFVRSTWEEVNQIIASANVYTIKQY----GADRI-IGFS -PIPAMSMIS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAIAMAMGHVILKEFYF----D -KRSAYFDDYVRRYTDMPNLVQLEERTLPDGRKVTVPGRYLR---------ASDFNGK-LG -QDNNPEWKTVALD-QADRMVLPNGSIGFRW----GAEGRSDAGKWNLEDKE--A------ --------RGGNEVKLKLSLM------E--------GEGADYEVGEVAFPYFGGID----- -------------TPNFSANKQASAVDDVLVRKVPVRRIKLG-KAGEERYALVATV----- ----FDLTAAN-YGVGRGL--------PGEDAAASYDDDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNSTSFFYAHTDQWRYERLGVEEI -------LSPLADKTKFGGSMIDYNVRAERMGWLPS-----APQLQ-TNPMQVVKDAQAQG -MDPK-----EYAVKSL-----KD---------------GSLKMSCEDPDHPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGAEEAKPTEVIWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWEIYKGFAKSFSEVCVGHLGVE-KELLLTPLMHDTPAELAQAF----DVQEWSKG -DCDLIPGVTAPQINVVERDY--PNTYKRFTALGPLLEKHGNGGKGIGWNTDDEVHQL--- ------GELNGKVRAAGVTQGMPKIETDIDACEVVLQLAPETNGHVAVKAWEALGKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYLDHPWMLAFGEGMTTYRPPVDLKTV----DEMLN- -------------------------RRPNGNKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKSAGIVDNDWV-- ----------------ELFNSNGAIAARAVVSQRVNRGMVMMYHAQE-------------- ---KTINTP-GSEITGIRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKML-------KVDW---LDDEAPATVQV----------------- ----- ->cobbmillcreek_2019_sw_WHONDRS-S19S_0090_A_bin.23_Ga0451756_0000618_5 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLNY--FSNPKE--PFS-GGHGVTTGEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----ADL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLK---------HWRA-ALAVAKSPVDA -WASIVQNEDARREWQQQRGLGGFVRSTWDEVNQLIASANVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWGEQTDVPESADWYNSTYIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAIAMAMGHVILKEFYF----D -KRSAYFDDYVRRYTDMPNLVQLEERTLPDGRKVTVPGRYLR---------ASDFNGK-LG -QDNNPEWKTVALD-QNDRVVLPNGSIGFRW----GAEGRSDAGKWNLENKE--A------ --------RGDSEVKLKLSLM------E--------GEGSEYEVGEVAFPYFGGID----- -------------TPNFSANKQASAVDDVLVRHVPVRRIKLG-KAGEERYALVATV----- ----FDLTAAN-YGVARGL--------PGENAATSYDHDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNSTSFFYAHTDQWRYERLGVEEI -------LSPLADKSKFGGSMIDYNVRAERMGWLPS-----APQLQ-TNPMQVVKDAQAQG -MDPK-----DYAVKAL-----KD---------------GSLKMSCEDPDHPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGAEDAKPTEVTWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWEIYKGFAKAFSEVCVGHLGVE-KELMLMPLMHDTPAELAQAF----DVKEWSKG -ECELIPGKTGPQISVVERDY--PNTYKRFTALGPLMEKAGNGGKGIGWNTTDEVHQL--- ------GELNGKVRAEGVTQGMPNISTDIDACEVVLQLAPETNGHVAVKAWEALSKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYLDHPWMQAFGEGMTSYRPPVDLKT----VDEMID- -------------------------RRPNGNKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKNAGIVDNDWV-- ----------------ELFNSNGAIAARAVVSQRVNPGMVMMYHAQE-------------- ---KTINTP-GSEITGIRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMR-------KVDW---LDGEAPATVQA----------------- ----- ->NASQAN2011_028_B_bin.24_k121_53788_5 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLNY--FTNPKE--PFS-GRHGVTTGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----ADL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLQ---------HWRA-ALAVAKSPVDA -WTSIVQNEDARREWQQQRGLGGFVRSTWDEVNQLIASANVYTAKQY----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQVWGEQTDVPESADWYNSNFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYAEISKLADLWMHPKQG-TDAAIAMAMGHVILKEFYF----D -KRSAYFDDYVRRYTDMPNLVQLEERNLPDGRKVMVPGRYLR---------ASDFNGK-LG -QDNNPEWKTVALD-QNDRVVLPNGSIGFRW----GAEGRSDAGKWNLENKEA-------- --------RGDNEVKLKLSLM------E--------GEGSDYEVGEVAFPYFGGID----- -------------TPNFSANKQASAVDDVLVRHVPVRRVKLG-KAGEERYALVATV----- ----FDLTAAN-YGVARGL--------PGENAATSYDHDTPYTPAWQEKITGVKQDQVIAV -ARQF------ADNADKTRGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTPLAFALDWVRPPRQMNSTSFFYAHTDQWRYERLGVEEI -------LSPLADKSKFGGSMIDYNVRAERMGWLPS-----APQLQ-TNPMKVVKDALAQG -MDPK-----DYAVKSL-----KD---------------GSLKMSCEDPDHPL-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGIEDAKPTEVHWHDQAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWEIYKGFAKAFSEVCVGHLGVE-KELMLTPLMHDTPAELAQAF----DVKEWKKG -ECELIPGKTAPQISVVERDY--PNTYKRFTALGPLMEKAGNGGKGIGWNTADEVHQL--- ------GELNGKVRAEGVTKGMPNISTDIDACEVVLQLAPETNGHVAVKAWEALSKI---- ------TGRDHTHLALHRE----D-EKIRFR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHEYIPWRTLT------GRQQFYLDHPWMLAFGEGMTSYRPPVDLKT----VDEMID- -------------------------RKPNGHKEISLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKSAGIVDNDWV-- ----------------ELFNSNGAIAARAVVSQRVNPGMVMMYHAQE-------------- ---KTINTP-GSEITGIRGGIHNSVT---RIVTKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMR-------KIDW------------------------LDGEAPA -TVQA ->NASQAN2015_227_F_bin.21_scaffold_4919_3 rank: C; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLNY--FTNPKE--PFS-GRHGVTTGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----ADL -PNHEPRGCARGASYSWYLYSANRVKYPMIRARLLQ---------HWRAALAVA-KSPVDA -WTSIVQNEDARREWQQQRGLGGFVRSTWDEVNQLIASANVYTAKQY-------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->Yukon_2004-1_F_bin.10_scaffold_25058_1 rank: C; rfr:Rfer_2792 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLSY--FSQPRE--SFS-GDHGVTTGEDR------TW-EDAYR -TRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPLVRGRLLK---------LWRE--ARLSMQPVDA -WASIAQSDEKRREYQTVRGLGGFVR------------SNVYTIKKH----GPDRI-VGFS -PIPAMSMVS------YGAGSRYLSL----------------------------------- ----IGGVPLSFYDWYCDLPPASPQVWGEQTDVPESADWYNSTFIIAWGSNVPQTRTPDAH -FFTEVRYKGTKTVAVTPDYSEVAKLSDIWMKPKQG-TDAAVAMAMGHVILKEFYF----P -DGGKPRSAY---FDDMPMLVMLKEHQLPNGDTVMVPDRYVR---------ASDFNGK-LG -AANNPDWKTVAFD-ESGKVVLPNGAIGFRW----GPDGRADEGQWNLEAKE--A------ --------RHGTEVKLKLSVM------E--------GDNPSLETAKVGFPYFGGIV----- -------------SEHFPNNATGDAAKDVLVRTVPVQRISLG-KEGDKREALVATV----- ----FDLQVAN-YGVARGL--------PGELAAKDFNDDTPYTPAWQERITGTPREQLITV -ARQF------AENADKTHGKSMVIIGAAMNHWYHAD-MNYRGVINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNGTSFFYAHTDQWRYEKLGMDEV -------LSPLADKKLYGGSMIDYNVRAERMGWLPS-----APQLK-TNPFQVVKDAEAAG -MSPV-----DYTVKSL-----KD---------------GSLAMSCEDPDHPN-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTTHGVQG--------------------------- --------------------------------KDLGADEAK-------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------PTEVVW------------------------------ -----------------------------------------HKEAPEGKLAL--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----VVTLD---------------------------------------------------- -----------------------------F------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4056_4 rank: C; buq:AC233_31260 narZ; nitrate reductase; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --WRSNILGS---SGKGHEYFLKHLLGTSNGVQG---KDLGPQDAKPTEVKWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SAAVDPAW -QSRSDWEIYKGFAKKFSEVCVGHLGVE-QEVVLTPLMHDSPAELGQPM----GVQDWKRG -DCELIPGKTAPQITVVERDY--PNVFKRFTALGPLMNKVGNGGKGIAWNTQVEVTQL--- ------GQLNGLVREEGVTKGMPKIDTDIDACEVVLQLAPETNGHVAVKAWEALSKA---- ------TGRAHKHLALYRE----D-EKIRFR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHELIPWRTLT------GRQQFYQDHAWMLAFGEGFGSYRPPVDMKA----TALMHN- -------------------------QRPNGQPEILLNF-------------------ITPH -QKWGIHSTYTDNVLMLTLSR---------------GGPIVWLSEDDAKSAGIVDNDWV-- ----------------ELFNVNGAIAARAVVSQRVKPGMVMMYHAQE-------------- ---KIINTP-GSEITHVRGGIHNSVT---RIVLKPTHMIGGYAQ---------LSYGFNYY -GTI-GTNRDEFVVVRKMD-------KIDW---LDTPVG-------AERVTRVQAQGENA- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.17_scaffold_4528_3 rank: C; metr:BSY238_1272 nitrate reductase, alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLSY----FSQPTEPFS-NEHGITTGEDR------TW-ENAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCQRGASYSWYLYSANRVKHPMVRARLLK---------HWRE--ARLHHDPVDA -WASIMANETKRRDYQQVRGLGGFVRSSWDEVNEIIAAANVHTIKKH----GPDRV-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQIWGEQTDVPESADWYNSSYIIAWGSNVPQTRTPDAH -FFTEVRYKGCKTVAVTPDYSEVAKLADLWMHPKQG-TDAALAMAMGHVILKEFYF----D -RRAAYFDDYARRYTDLPMLVMLREQTLDNGRTVLVPDRLLR---------ASDFNGK-LG -QANNPDWKTIAFD-TTGKAVAPNGSIGFRW----GPEGRADAGRWNLEDKD--A------ --------RTGADTKLKLSVL------EDEHGEGAAQAHEIVEVGF---PYFGGVV----- ----------------NPHFTGNDQGGDVRRIHVPAVRLRLG-KAGEERHALVATV----- ----FDLQAGQ-YGIDRGL----------GTGAKNFDDDAPYTPAWQEAITGVPREQVIAV -ARQF------AENAEKTEGRSMVIIGAAMNHWYHAD-MNYRGVINMLMMCGCIGKSGG-G ---WAHYVGQEKLRPQT---GWTALAFA--------------------------------- -----------------------------------------------LDWIRPPRQQNSTS -FFY------------------AH------------------------------------- ---------------------------TDQWRYE--------------------------- -----------------------------------------------------KLGMDEVL -SPLADKAAFKGSAIDFK------------------------------------------- ------------------------------------------------------------- --------------------------------APQLNVNPIQVAKA--------------- -------------------------ARAA-------------------------------- --------------------G---------------------------------------- ------------------------------------------------------------- ------------------------------------------VDPKDYTVQGLKNGS---- --------------------------------------IDLACHDPDAP------------ -----------------------------QNW----------------------------- -------PRNMFV----------------W------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.3_scaffold_11088_2 rank: A; metr:BSY238_1272 nitrate reductase, alpha subunit; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ----------------------S-------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------D ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------MNYRGVINMLMLCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWIRPPRQMNSTSFFYAHTDQWRYEKLGMDEI -------LSPLADKKAYAGSMIDYNVRAERMGWLPS-----APQLK-TNPLKVVRDASAAG -MDPK-----DYTVKGL-----KD---------------GTLKMSCEDPDHPD-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSHGVQG---KDLGRDEAKPSEVVWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSKSDWDIYKGFAKKFSEVCVGHLGVE-REMVLSPMMHDSPGELAQPL----DVKDWKRG -EVDLIPGKTAPNMVVVERDY--PNVYKRFTALGPLMNKVGNGGKGIAWNTQTEVKQL--- ------GELNGLITEQGVTCGMPRIDSDIDACEVVLQLAPETNGHVAVKAWQALGKQ---- ------TGIDHTHLALYRE----D-EKIRYR-DIQAQPRKIISSPTWSGIESETVSYNAGY -TNVHELIPWRTLT------GRQQFYMDHPWMIAFGEGFTSYRPPVDLKTT---------- ----------AGIHGIKSNGNP----------EILLNF-------------------ITPH -QKWGIHSTYSDNLHMLTLNR---------------GGPVIWLSEDDAKRAGIVDNDWV-- ----------------ELFNINGAIAARAVVSQRVNNGMTLMYHAQE-------------- ---KIINTP-GSEITGIRGGIHNSVT---RVVLKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDW---LDTPADASNPA------------GSHA- ----- ->NASQAN2016_164_F_bin.17_scaffold_8891_2 rank: A; rfr:Rfer_2792 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTY--FSQPRE--SFS-GDHGVTTGEDR------TW-ENAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPLVRGRLLK---------LWRE--ARLSQDPVDA -WASIAQSDAKRKEYQSVRGLGGFVRSSWDEVNEMVAAANVYTIKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYCDLPPASPQIWGEQTDVPESADWYNS----------------DAH -FFTEVRYKGTKTVAVTPDYSEVAKLSDIWMKPKQG-TDAAVAMAMGHVILKEFYFPDGGK -ARSTYFDDYVRRYTDMPMLVMLKEQTLPSGEVVMVPDRYLR---------ASDFNGK-LG -AANNPEWKTVALD-ESGKVVLPQGAIGFRW----GPDGRADEGQWNLQAKE--A------ --------RHGNDVKLKLTVM------E-----GEQASLETAKVGF---PYFGGIE----- -------------SEHFPNNATGAGANNVLVRTVPVQRIALG-KAGDTREALVATV----- ----FDLQVAN-YGVARGL--------PGELAAKDFNDDTPYTPAWQERITGTPREQLITV -ARQF------ADNADKTHGKSMVIIGAAMNHWYHAD-MNYRGVINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFGLDWIRPPRQMNSTSFFYAHTDQWRYEKLGMEEV -------LSPLADKKAFGGSMIDYNVRAERMGWLPS-----APQLK-TNPLQVVRDAQAAG -MEPK-----DYAVKGL-----KE---------------GTLSMSCEDPDHPD-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTSNGVQG---KDMGHDEAKPEEVVWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->NASQAN2015_227_B_bin.17_k121_559871_7 rank: A; rfr:Rfer_2792 respiratory nitrate reductase alpha subunit apoprotein; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTY--FSQPKE--AFS-GEHGVSTGEDR------TW-EDAYR -NRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTR-----WDM -PNHEPRGCARGASYSWYLYSANRVKYPLVRGRLLK---------LWREARLS--MDPVDA -WASIAQDDAKRKEYQSVRGLGGFVRSGWDEVNEMVAAANIYTIKKH----GPDRI-IGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCMSFYDWYC-------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.12_scaffold_10959_2 rank: A; aon:DEH84_18240 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- --------------------AA-------------------------------DW-VRPSR -QQN--------STSFFYAHT---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------DQWRYEKL----------------- --------------GVNEVLSPLADKAKF-------------------------------- ------------------------------------------------------------- ----------------------------------------GGSMI---------------- ---------------------------D--------------------------------- ------------------------------------------------------------- ----YNVRAER-------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------MGWLPS-----APQLQ-TNPLNLVKEAQAKG -MDAK-----DYAVQSL-----KD---------------GSLKMSCEDPDNPA-NWPRNMF -VWRSNILGS---SGKGHEYFLKHLLGTTHGVQG---KDLGPNDAKPQEVQWHNQAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-SAAVDPAW -EARSDWEIYKGFAQKFSEVCVGHLGAE-REVVMTPIMHDTAAELAQPF----GVQEWKKG -EIDLIPGKTAPQIAVVERDY--PNTFKRFTSLGPLMNKLGNGGKGIGWNTQDEVHAL--- ------GELNGTVREEGVSQGMPKIVSDIDASEVVLMLAPETNGHVAVKAWEALGKQ---- ------TGRDHTHLALHRE----D-EKIRYR-DIQAQPRKIISSPTWSGLESEKVSYNAGY -TNVHELIPWRTLT------GRQQFYMDHPWMIAFGEGFVSYRPPVDLKT----LDDIKG- -------------------------VKPNGNKEIALNF-------------------ITPH -QKWGIHSTYTDNLLMLTLNR---------------GGPVIWLSEDDAKSAGIVDNDWV-- ----------------ELFNTNGAIAARAVVSQRVNNGMVLMYHAQE-------------- ---KIVNTP-GSEITGTRGGIHNSVT---RVVLKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDWLDDESSNQGVHA------------------- ----- ->NASQAN2016_164_F_bin.17_scaffold_1152_1 rank: C; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- -----------------VTCG---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------------------MPKI- ------------------------------------------------------------D ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------TDIDAC------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------EVVLQLAPETNGHVAVKAWKALGKQ---- ------TGLDHTHLALYRE----D-EKIRFR-DIQAQPRKIISSPTWSGIESETVSYNA-- --------------------GYTNVHEMIPWRTR--EGFTTYRPPVDLKT----TAGIQN- -------------------------IKPNGNKEIALNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGSVVWLSETDAKSVGIEDNDWI-- ----------------EVFNINGAIAARAVVSQRVNPGMTLMYHSQE-------------- ---KIINTP-GSEITGMRGGIHNSVT---RIVLKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMN-------KVDW--------------------LEEEAQGENA- ----- ->NASQAN2015_227_F_bin.21_scaffold_2406_1 rank: A; hyn:F9K07_14885 nitrate reductase subunit alpha; K00370 (db=kegg) ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------VSYNAGYTNVHEMI---------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------PWRTL-------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------T------------------------------------- --------------------GRQQFYMDHPWMTAFGENFSSYRPPVDLKT----TAGIQN- -------------------------IKPNGNKEIALNF-------------------ITPH -QKWGIHSTYSDNLMMLTLNR---------------GGSVVWLSEDDAKSAGIEDNDWI-- ----------------EVFNINGAIAARAVVSQRVNPGMTLMYHSQE-------------- ---KIINTP-GSEITGVRGGIHNSVT---RIVLKPTHMIGGYAQ---------FSYGFNYY -GTI-GTNRDEFVVVRKMA-------KVDWLDDEGSSTEPTATHN---------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_F_bin.10_scaffold_7566_1 rank: A; lim:L103DPR2_02670 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- ----MSH--------FLDRLTH--FSSPKE--SFS-DGHGVTTGEDR------TW-EDAYR -DRWAH------DKIVRSTHG-VNCTGSCSWKIYVKGGIVTWETQQTDYPRTRD-----DL -PNHEPRGCARGASYSWYLYSANRVKYPMVRGRLLQ---------HWRA-ALAVSKSPVDA -WANIVENTAARSEWQKQRGLGGFVRSTWEEVNQLIASANVYTAKKY----GPDRV-MGFS -PIPAMSMVS------YAAGSRYLSL----------------------------------- ----IGGVCLSFYDWYCDLPPSSPQVWGEQTDVPESADWYNSNFIIAWGSNVPQTRTPDAH -FFTEVRYKGAKTVAITPDYSEVAKLADLWMHPKQG-TDAAVAMAMGHVILKEFYF----N -KRSAYFDDYVRRYTDMPNLVQLEERTLPDGRKVMVPGHYLR---------ASDFNGK-LG -QDNNPEWKTVAID-ENDKIVLPNGSIGFRW----GAEGRSDMGKWNLESKEA-------- --------RGDAEVKLKLSLM------E--------GATPDYEVGDVGFPYFGGID----- -------------TPNFNANKQGEAVDDVLVRKVPVRRIKLG-KAGEERYALVATV----- ----FDLTVAN-YGVARGL--------AGENAALSYDDDTPYTPAWQEKITGVKRDQVIAV -ARQF------ADNADKTKGKSMVIIGAAMNHWYHSD-MNYRGIINMLMMCGCIGQSGG-G ---WAHYVGQEKLRPQT---GWTALAFALDWVRPPRQMNGTSFFYAHTDQWRYEKLGVEEI -------LSPLADKSKFGGSLIDYNVRAERMGWLPS-----APQLE-TNSFQVVKDAQAAG -MDTK-----DYVVKSL-----KD---------------GSLKMSCEDPDNPK-NWPRNMF -VWRSNLLGS---SGKGHEYFLKHLLGTTNGVQG---KDLGAEEAKPTEVQWHDKAPEGKL -DLLVTLDFRMSTTCLYSDIVLPTATW--YEKNDLNTSDMH-PFIHP----L-STAVDPAW -QSRSDWEIYKGFAQAYSEVCVGHLGVE-KEVVLTPLMHDTPSELAQAF----DVKEWKKG -ECDLIPGKTAPTIAVIERDY--PNTFARFTALGPLMEKAGNGGKGIGWDTKVEVQQL--- ------QSLNGKVHTEGVSKGMAKIVTDIDAAEVILQLAPETNGHVAVKAWEALSKI---- ------TGRDHTHLAIHRE----D-EKIRFR-DVQAQPRKIISSPTWSGI----------- ----------------------------ESETVSYNAGYTNVHE----------------- ----------------------------------MIPWRTLT------------------- ------------------------------------GRQHFYL------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_237162_4 rank: C; deu:DBW_2564 narG; Respiratory nitrate reductase 1 alpha chain; K00370 (db=kegg) ------------------------------------------------------------- --------------------------------TLT-------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------GRQHFYLDHDAYIAFGEHLSTYKPSPT-------------- ----------PEAYGDLRKT-----VNDGHAKMLN---------------------CLTPH -GKWHIHSTYGDTLRMLTLSR---------------GNEPCWLSEEDAAELGIKDNDHV-- ----------------EVYNDHGVYVARACVSARIPKGVCIVYHAVERTYNIP-------- ---KSQIRR-GEHGEPRRGGMNNSFT---RVHLKPNLMCGGYGQ---------FTYHFNYW -GPV-GVNRDTHVLVRKMH-------VVEY------------------------------- ----- ->sharkriverslough_2019_sw_WHONDRS-S19S_0042_B_bin.90_k121_397025_1 rank: C; mox:DAMO_0778 narG; Nitrate reductase, alpha chain; may be more similar to a nitrite oxidoreductase; K00370 (db=kegg) ------------------------------------------------------------- --------------------MG--------------WIQDLFAPEQR------SW-EDFYR -NRWAH------DKVVRTTHG-VNCTGSCSWNVYVKQGVVTWEMQALDYPTID-----RSI -PNYEPRGCQRGISTSWYIYSPLRVKHPYMRGALLD------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- --------------------------------------------LWQEARRE--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -----------------------------------------HP------------------ ----------DDPVAAW-------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------ASIT----------------------------------- ------------------------------------------------------------- ----- ->AFN37208|Nitrolancea_hollandica_Lb ------------------------------------------------------------- ----------------------------------------------R------QW-EEFYR -NRWQH------DNITRSTHG-VNCTGGCSWMVFVKDGIVTWEMQATDYPLLE-----PSL -PPYEPRGCQRGISASWYVYSPIRVKYPYMRGPLMD---------FWREARAQH-SDPIQA -WASIVQDEQKRQRWQRARGKGGFRRATWDECLELVASSLLYTAKKY----GPDRV-VAFA -PIPAYSYLS------FGAGTRFIQL----------------------------------- ----FGGFTLSFYDWYADLPNSFPEVWGDQTDVCESADWYNSKFIVANGANMNMTRTPDVH -FISEARHNGTKFVVIAPDFSQVAKYSDWWLPVKAG-QDQALWMGIDHVILKEFYI----D -RQVPYFIEYQKRYTDGPMLVKVHP----TKGGAYSMGQFLR---------ANRINRY--K -DVENGNWQLLVWDKQSG-PRLPKGCIGYRW-------AKKETGKWNITMED--A------ --------MDNTPLDPLLSFL---GQHD---------------------AVAEVEF----- ---------------------DIFGTGKVSRRAVPIKYLETS-EGKVAVTTA--------- ----FDLLLAQ-FAVGRPG--------LTGDYPKSYDDDMPYTPAWQEPYTGIGRDTVIRF -AREF------AGNAEATQGRSMVITGASLNHWYNNG-LCYRGPITALILCGCCGRNGG-G ---LNHYVGQEKLTLVA---AWSCWALGKDWVPTSRLQQSSSWHYAHSDQWRYEGDFTEYA --------PIPRETRWAKGHAMDLLASAVRMGWMPS-----YPQFN-RNPLDVVKQAEAAG -AKT------DEQIVKWVVEQVKS---------------KQLKFAIEDVDAPE-NWPRTWL -IWRGNALQS---SAKGAEFFLRHYLGTHDNAIA-----EEHAKGRVKDVTFREPAPRGKM -DLLCQLNFRMDTTATYCDVVLPTAFW--YEKNDLNTTDLH-TFIHP----L-GAATPPAW -ESKTDYEIFKAIAKKVSELAPSVFQGPVKDIVMTPLAHDTPDELSQDYQAGMKVLDWGKG -EIEMIPGKTAPHFKVVERDY--ANIYNQWITFGPKARENGIVGNGEHIDIKPFYDELLEN -PIDAQPDVRHMRCRVWGGQRYPGLEFAEEAANLLLHLSPESNGEVSYHAFKEGEHQ---- ------VGLPLADLAEGVR----G-VRMTYF-DLTRQVRRTLISPCWTGMVNDGRAYAAWC -LNVERLIPWRTLS------GRQHHYMDHPYYIDYGEQLMTHKPKLDPRK----TGDIV-- -------------------------RSPVDDESVVLNY-------------------ITPH -GKWHIHSTYYDNHRLLTLSR---------------GIEPCWLNDKDAARIGVKDNDWV-- ----------------EVYNDNGVMVTRAAVSARVQMGTCMIYHAPE-------------- ---RTISIPKSQVRGNRRGGAHNSLT---RIRINPMQMAGGYAQ---------WTYAWNYW -GPIGIMTRDTHVAVR--------------------------------------------- ----- ->AFN37205|Nitrolancea_hollandica_Lb ------------------------------------------------------------- -----------------------------------------------------QW-EEFYR -NRWQH------DNITRSTHG-VNCTGGCSWMVFVKDGIITWEMQATDYPLLE-----PSL -PPYEPRGCQRGISASWYVYSPIRVKYPYMRGPLMD---------FWREARAQH-SDPIQA -WASIVQDEQKRHRWQRARGKGGFRRATWDECLELVASALLYTAKKY----GPDRV-VAFA -PIPAYSYLS------YGAGSRFIQL----------------------------------- ----FGGFNLSFYDWYADLXNSFPEVWGDQTDVCESADWYNSKFIVSNAANMNMTRTPDVH -FISEARHNGTKFVVLAPDFSQVAKYSDWWIPVKAG-QDQALWMGADHVILKEFYI----D -RQVPYFIEYQKRYTDGPMLVKVHP----TKGGAYSMGQFLR---------ANRINRY--K -DVENGNWQLLVWDKQSG-PRLPKGCIGYRW-------AKKETGKWNITMED--A------ --------MDNTPLDPLLSFL---GQHD---------------------AVAEVEF----- ---------------------DIFGTGKVSRRAVPIKYLETS-EGK----VAVTTA----- ----FDLLLAQ-FAVGRPG--------LTGDYPKSYDDDMPYTPAWQEAYTGIGRDTVIRF -AREF------AGNAEATQGRSMVITGASLNHWYNNG-LCYRGPITALILCGCCGRNGG-G ---LNHYVGQEKLTLVA---AWTCWALGKDWIPPSRLQQTSTWHYANSDQWRYEGDFTDYA --------PIPRETRWAKGHAMDLLASAVRMGWMPS-----YPQFN-RNPFEVVKQAEAAG -AKT------DEQIVKWVVAQLKS---------------KQLRLAIEDVDAPE-NWPRTWL -IWRGNAMQS---SAKGAEFFLRHYLGTHDNAIA-----EEHAKGRVKDVVVREPAPRGKM -DLVCQLNFRMETTATYSDIVLPTAFW--YEKNDLNTTDLH-TFIHP----L-GAATPPAW -ESKTDYEIFKAIAKKVSELAPSVFQGPVKDIVMQPLAHDTPDELSQDYLAEMKVLDWGKG -EVDLIPGKTAPHFKIIERDY--ANLYNQWTSFGPKARENGIVGNGEHIDIKPFYDELLEN -PIDAQPDVRHMRCRVWGGQRYPGLEFAEEAANLLLHLSPESNGEVSYHAFKEGEHQ---- ------VGLPLADLAEGVR----G-VRMTYF-DLTRQVRRTLISPCWTGMVNDGRAYAAWC -LNVERLIPWRTLS------GRQHHYMDHPYYIDYGEQLMTHKPKLD--PRK--TGDIVR- ---------------SPVDDES-----------VVLNY-------------------ITPH -GKWHIHSTYYDNHRMLTLSR---------------GIEPCWLNDKDAARIGVKDNDWV-- ----------------EVYNDNGVMVTRAAVSARVQMGTCMVYHAPERT------------ ----ISIPK-SQVRGNRRGGAHNSLT---RTRINPMQMAGGYAQ---------WTYAFNYW -GPIGIFTRDTHVA----------------------------------------------- ----- ->AFN37207|Nitrolancea_hollandica_Lb ------------------------------------------------------------- ----------------------------------------------R------QW-EEFYR -NRWQH------DNITRSTHG-VNCTGGCSWMVFVKDGIITWEMQATDYPLLE-----PSL -PPYEPRGCQRGISASWYVYSPIRVKYPYMRGPLMD---------FWREARAQH-SDPIQA -WASIVQDEQKRQRWQRARGKGGYRRATWDECLELVASALLYTAKKY----GPDRC-AAFA -PIPAYSYLS------YGAGSRFFQL----------------------------------- ----FGGFNMSFYDWYADLPNSFPEVWGDQTDVCESADWYNSKFIVSNAANLNMTRTADVH -FVSEARHNGTKFVVIAPDFSQVAKYSDWWIPVKAG-QDQALWMGADHVILKEFYI----D -RQVPYFIDYQKRYTDGPMLVKVHQ----TKGGAYSMGQFLR---------ANRINRY--K -DVENGNWQLLVWDKQSGP-RLPKGCVGYRW-------ATKETGKWNISMED--A------ --------MDNTPLDPLLSFL---GQHD---------------------EVAQVEF----- ---------------------DIFGTGKVARRGVPIKYLETS-EGK-VAVTTAFDL----- -------LLAQ-FAVGRPG--------LTGDYPKSYDDDMPYTPAWQEAYTGIGRDTVIRF -AREF------AGNAEATQGRSMVITGASLNHWYNNG-LCYRGPIEAPILTGCCGRNGG-G ---LNHYVGQEKLTLVA---AWTTWALGRDWIPPSRLQQSPVWHYAHSDQWRYEGDFTDYA --------PIPRETRWAKGHAIDLLASAVRMGWMPF-----YPQFN-RNPLEIVKQAEAAG -AKS------DEQIVKWVVGQLKS---------------GNLRYAIEDIDAPE-NWPRTWV -IWRGNAMQS---SAKGAEFFLRHYLGTHDNAVA-----EEHAKGRVKDVVLRDPAPRGKM -DLVCDINFRMETTALYSDMVLPTAMW--YEKNDLNTTDLH-SFIHP----L-GAAVPPVW -EAKTDYEIFKAIAKKVSELAPSVFPQPVKDIISNPLIHDTPDELAQDYLSEMKVLDWGKG -EIDLIPGKTGPHLKIVERDY--VNLYNRWISFGPKARENGISGNGVHIDIKPFYDELLEN -PLDAQPDVRHMRCIEWGGGRYPRLEFAEEAANLLLHLSPETNGEVCYHAFKEEEKQ---- ------IGMPLADLAESIR----G-VRMNYF-DLTRQVRRTMISPCWTGMINDGRAYAAWC -LNVERLVPWRTLS------GRQHHYMDHPYYIDYGEQLMTHKPKLDPRKTG--DIVRSP- ----------VDDES------------------VVLNY-------------------ITPH -GKWHIHSTYYENHRMLTLSR---------------GIEPCWINDKDAARIGIKDNDWV-- ----------------EVYNDNGVMVTRAAVSARVQMGTCMIYHAPERT------------ ----ISIPK-SQVRGNRRGGAHNSLT---RTRINPMQMAGGYAQ---------WTYMFNYW -GPIGIFTRDTHVAVR--------------------------------------------- ----- ->AFN37206|Nitrolancea_hollandica_Lb ------------------------------------------------------------- ----------------------------------------------R------QW-EEFYR -NRWQH------DNITRSTHG-VNCTGGCSWMVFVKDGIITWEMQATDYPLLE-----PSL -PPYEPRGCQRGISASWYVYSPIRVKYPYMRGPLMD---------FWREARAQH-SDPIQA -WASIVQDEQKRQRWQRARGKGGYRRATWDECLELVASALLYTAKKY----GPDRV-TAFA -PIPAYSYVS------FGAGARFIQL----------------------------------- ----FGGFHLSFYDWYADLPNSFPEVWGDQTDVCESADWYNSKFIVSNAANLNMTRTADVH -FVSEARHNGTKFVVLAPDFSQVAKYSDWWIPVKAG-QDQALWMGADHVILKEFYI----D -RQVPYFIEYQKRYTDGPMLVKVHQ----TKGGAYSMGQFLR---------ANRINRY--K -DVENGNWQLLVWDKQSGP-RLPKGCIGYRW-------AKKETGKWNITMED--A------ --------MDNTPLDPLLSFL---GQHD---------------------AVAEVEF----- ---------------------DIFGTGKVSRRAVPIKYLETS-EGK----VAVTTA----- ----FDLLLAQ-FAVGRPG--------LTGDYPKSYDDDMPYTPAWQEGYTGIGRDTVIRF -AREF------AGNAEATQGRSMVITGASLNHWYNNG-LCYRGPITALILCGCCGRNGG-G ---LNHYVGQEKLSLVS---AWQSWALAKDWFPPSRVQQSSTWHYAHSDQWRYEGDFTDYA --------PIPRETRWAKGHAMDLLASAVRMGWMPM-----YPQFN-RNPLELVKQAEAAG -AKS------DEQVVEWVVGQLKS---------------GNLRYAIEDVDAPE-NWPRVWL -IWRGNAFQS---SAKGAEYFLRHYSGTHDNAVA-----EEHAKGRVKDVVFREPAPRGKF -DLLCDLNFRMDTTALYSDIVLPTAMW--YEKNDLNTTDLH-TFIHP----L-GAAVPPVW -EAKSDYEIFKSLAKKVSELAPSVFPQPVKDIVSNPLAHDTPDELSQDYLAEMKVLDWGKG -EIEMIPGKTAPHFKIVERDY--VNFYNRWISYGRKARENGIVGNGVHIDIKPFYDELLEN -PLDAQPDVRHMRCIEWGGQRYPRLEFAEEACNLIMFLAPESNGEVCYHAFKEEEKQ---- ------LGLPLADLAEAVR----G-VRMNFF-DLTRQVRRTLISPCWTGMVNDGRAYSAWC -LNVERLIPWRTLS------GRQHHYMDHPYYIDYGEQLMTHKPKLD--PRK--TGDIVR- ---------------SPVDDES-----------VVLNY-------------------ITPH -GKWHIHSTYYDNHRMLTLSR---------------GIEPCWLNDKDAARIGIKDNDWV-- ----------------EVYNDNGVMVTRAAVSARVQMGTCMIYHAPERT------------ ----ISIPK-SQVRGNRRGGAHNSLT---RTRINPMQMAGGYAQ---------WTYMWNYW -GPIGILTRDTHVAVR--------------------------------------------- ----- ->WP_005004540|Nitrococcus_mobilis ------------------------------------------------------------- --------------------MG--------------WIQDLINPKTR------RW-EEFYR -NRWQH------DNIFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLGRGEGGRGI -PPYEPRGCQRGISASWYVYSPIRVKYPYGKGVLLD---------FWREARSSH-NNPVEA -WSSIVTDENKRKRWQKARGKGGYRRTTWDELLELIASACLYTAQKY----GPDRV-MGFS -PIPAMSMLS------YAAGSRFLQL----------------------------------- ----FGGVNMSFYDWYADLPNSFPEIWGDQTDVCESADWYNSKFIVSMASNLNMTRTPDVH -FISEARHEGAKFVVLAPDFSQVSKYADWWIPVKKG-EDLGLWMAAGHVIYTEFYV----K -RQVPYFIDYVTRYTDMPFLVKLE-----KDGDGYRPGRYLT---------SEEVKKY--K -KQENAAWKQLVFDRKSNEARCPKGQIGHRH---------GKHGQWNLKMEDG-------- --------LDNSPIEPVLSFL--GESDD---------------------VAMVQFY----- ----------------------EFASQTVYKRGVPAKKIDTG-SGSVLVATV--------- ----YDLNMGQ-YAVNRGL---------PGDYPESYDDLKPYTPAWQEQFSGIGRQTVIRF -AREF------AGTAEKTKGRSMVIVGASANHWYHNN-HIYRAAINCLIACGCCGRNGG-G ---MNHYVGQEKLAIVA---PWNALALAGDWGIKPRLQQSPVWHYVNSDSWRYEGSFEEYA --------PSPPNAKWAKGHSVDLVAKSVRMGWMPH-----YPQFN-RSPLEVAREAEKAG -AKD------DKGMADYVVQALKK---------------KNLSFSVDDPDAPE-NWPRVWF -IWRGNAMQS---SAKGAEFFLRHYLGTHDNAVA-----EERAKPHVKHVKFREPAPRGKF -DLVVDINFRMDSTALYSDIVLPTAFW--YEKNDLNSTDLH-SFIHP----L-GQAVPPVW -ESKSDWDIFKAFAKKISEMAPSVFSEPFKDVVAAPLTHDTPDEIAQRD-----VKDWLEG -ECEPIPGKTMPHFRVVERDY--SLLYNKYISLGSAIRENGISGNGCSFPITKQYDELTNQ -PVGGSPDPRHRRAVEWGGKRYPCVEDALDAANVLLYLAPETNGEVAYQAFKSEQEH---- ------CGVPLTDLAEPYR----G-HQVTFY-DLTRQPRRLLCSPVWTGNCGDGRAYSAWT -LQIDRLVPFRTLT------GRQHIYIDHPWYMDFGEHLCTYRPKLDYKKIHDLDNSPID- ------------------------------DKTLILNY-------------------ITPH -GKWNIHSTYKDNHRMLTLSR---------------GMDPVWINDKDAARVGLKDNDWV-- ----------------EVYNDNGVIVTRANVSRRVQSGMCLYYHAVE-------------- ---RTIYIPKSQIRGGRRAGGHNSVT---RTRINPVYLAGGNAQ---------FTYLFNYW -GPTGIMTRDTHVAVRKLE-------KLEW------------------------------- ----- ->Nitrococcus_mobi_EAR23355 ------------------------------------------------------------- --------------------MG--------------WIQDLINPKTR------RW-EEFYR -NRWQH------DNIFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLGRGEGGRGI -PPYEPRGCQRGISASWYVYSPIRVKYPYGKGVLLD---------FWREARSSH-NNPVEA -WSSIVTDENKRKRWQKARGKGGYRRTTWDELLELIASACLYTAQKY----GPDRV-MGFS -PIPAMSMLS------YAAGSRFLQL----------------------------------- ----FGGVNMSFYDWYADLPNSFPEIWGDQTDVCESADWYNSKFIVSMASNLNMTRTPDVH -FISEARHEGAKFVVLAPDFSQVSKYADWWIPVKKG-EDLGLWMAAGHVIYTEFYV----K -RQVPYFIDYVTRYTDMPFLVKLE-----KDGDGYRPGRYLT---------SEEVKKY--K -KQENAAWKQLVFDRKSNEARCPKGQIGHRH---------GKHGQWNLKMED--G------ --------LDNSPIEPVLSFL--GESDD---------------------VAMVQFY----- ----------------------EFASQTVYKRGVPAKKIDTG-SGS----VLVATV----- ----YDLNMGQ-YAVNRGL---------PGDYPESYDDLKPYTPAWQEQFSGIGRQTVIRF -AREF------AGTAEKTKGRSMVIVGASANHWYHNN-HIYRAAINCLIACGCCGRNGG-G ---MNHYVGQEKLAIVA---PWNALALAGDWGIKPRLQQSPVWHYVNSDSWRYEGSFEEYA --------PSPPNAKWAKGHSVDLVAKSVRMGWMPH-----YPQFN-RSPLEVAREAEKAG -AKD------DKGMADYVVQALKK---------------KNLSFSVDDPDAPE-NWPRVWF -IWRGNAMQS---SAKGAEFFLRHYLGTHDNAVA-----EERAKPHVKHVKFREPAPRGKF -DLVVDINFRMDSTALYSDIVLPTAFW--YEKNDLNSTDLH-SFIHP----L-GQAVPPVW -ESKSDWDIFKAFAKKISEMAPSVFSEPFKDVVAAPLTHDTPDEIAQRD-----VKDWLEG -ECEPIPGKTMPHFRVVERDY--SLLYNKYISLGSAIRENGISGNGCSFPITKQYDELTNQ -PVGGSPDPRHRRAVEWGGKRYPCVEDALDAANVLLYLAPETNGEVAYQAFKSEQEH---- ------CGVPLTDLAEPYR----G-HQVTFY-DLTRQPRRLLCSPVWTGNCGDGRAYSAWT -LQIDRLVPFRTLT------GRQHIYIDHPWYMDFGEHLCTYRPKLDYKKIH--DLD---- -------------------------NSPIDDKTLILNY-------------------ITPH -GKWNIHSTYKDNHRMLTLSR---------------GMDPVWINDKDAARVGLKDNDWV-- ----------------EVYNDNGVIVTRANVSRRVQSGMCLYYHAVERT------------ ----IYIPK-SQIRGGRRAGGHNSVT---RTRINPVYLAGGNAQ---------FTYLFNYW -GPTGIMTRDTHVAVRKLE-------KLEW------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_B_bin.21_k121_1443778_1 rank: C; mox:DAMO_0778 narG; Nitrate reductase, alpha chain; may be more similar to a nitrite oxidoreductase; K00370 (db=kegg) ------------------------------------------------------------- ---------------------------------MS-WIEDIISPNTR------KW-EEFYR -NRWQY------DKVVRSTHG-VNCTGGCSWAIHVKDGIVVWEMQQLDYPQFN-----KDV -PPYEPRGCQRGISYSWYLYSPIRVKYPIIRGALID---------LFRE------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------E ------------------------------------------------------------- ------------------------------------------------------------- --------KKKCG------------------------------------------------ ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------G ------------------------------------------------------------- -----------------------------------------DPVLA--------------- ------------------------------------------------------------- ------------------------------------------------------------- ---------------------------------------------------W--------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------------------------------------ANLQADDTK------------ ---------------------------RKRYQRA--------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----- ->Nitrobacter_winogradskyi_gb_ABA05326 ------------------------------------------------------------- ---------------------------------MS-WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRVKYPYIRGPLAD---------LWHEAKASY-PDPVQA -WASLVEDEEKRNRIQKARGKGGFRRAKWEELIELIAASCLYTARKH----GPDRV-MGFS -PIPAMSMLS------FAAGTRFLSL----------------------------------- ----FGGGLMSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMASNMNMTRTPDVH -FISEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYI----D -RQVPYFIDYVKRYTDLPFLVELEP-----NGNTYKTGRLLR---------SNRVARY--K -DVENGEWKMLVLDTATGEPRAFKGQVGDRW--------GSTHGKWNLSAED--T------ --------LDNSPIDPVLSFI------D--------QSDGVVQVGFD--DFVNGSV----- -----------------------------VSRGVPVKRIATD-KGE----VLVTTG----- ----FDIMMSQ-FGHSRGL--------EGSFATSYDDEDAPYTPAWQERHTGIGRETAIRF -AREF------ATNAELTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWSTVAMALDWNKPPRVVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPRWAKGHAIDLEAKSVRCGWMPF-----TPNFH-RNPIEVVAEAERAG -AKS------TADIATYVADQVAS---------------KKLDLAINDPDAEE-NWPRVWF -IWRANAIQS---SAKGHEFFLRHYLGAHDNVIA-----EERAKGKTTTVKYRDTAPQGKY -DLVVDINFRMNTTGLYSDIILPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWEIFKLIAKKVSELSPLAFSKPVRDIVLQPLMHDTPDELAQPE-----ILDWAEG -ECKLVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGISAVGVNIPIKKQYDQMLEN -PIMPMPDSRHMRCVEWGGKRYPSLEDVLDACNVVLLCAPVANGEVSYQGFVNEEQH---- ------VGLPLADIAEPTR----G-VSSTFY-DLTRQPRRILTSPCWTGLVNDGRAYSAWC -MNIERLVPWRTLT------GRQSLYLDHQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- --------------------------SRVDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRLLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RIRINPLFLAGGYAQ---------FTYGWNYW -GPTGIFTRDTHVVVRKME-------KVEW------------------------------- ----- ->WP_011314088|Nitrobacter_winogradskyi ------------------------------------------------------------- ---------------------------------MS-WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRVKYPYVRGPLYD---------LWKEAKASH-PDPVQA -WASLVGDEQKRSRIQKARGKGGFRRAKWEELVELIAAAALYTARKY----GPDRV-MGFS -PIPAMSMLS------YAAGSRFLQL----------------------------------- ----FGGVNMSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMAANMNMTRTPDVH -FISEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYI----D -RQVPYFIDYVKRYTDLPFLVELEP-----NGNTYKTGRLLR---------SNRVARY--K -DVENGEWKMLVLDTATGEPRAFKGQVGDRW--------GSTHGKWNLSAED--T------ --------LDNSPIDPVLSFI------D--------QSDGVVQVGFD--DFVNGSV----- -----------------------------VSRGVPVKRIATD-KGE----VLVTTG----- ----FDIMMSQ-FGHSRGL--------EGSFATSYDDEDAPYTPAWQERHTGIGRETAIRF -AREF------ATNAELTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWNTIAMALDWTKPPRVVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPRWAKGHAIDLEAKSVRCGWMPF-----TPHFN-RNPIELAAEAERAG -AKS------TADIVTHVVDQVAS---------------KKVNFAIDDPDAEE-SWPRMWF -IWRGNAIQS---SAKGHEFFLRHYLGAHDNSIA-----EDRAKGKTQRVKYRDTAPRGKY -DLVVDLNFRMNTTSLYSDIVLPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWEIFKLISKKVSELSPLAFSKPVRDVVVQPLMHDTPDELAQPE-----ILDWAEG -ECKPVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGVSAVGVNIPIKKQYDQMLDN -PIMPMPDARHMRCVEWGGKRYPSLEDVLDACNTLLMCAPEANGEVCYQGFHNEEHH---- ------VGLPLVDIAEPTR----G-VSSTFY-DLTRQPRRILTSPCWTGLTNDGRAYSAWC -MNVERLVPWRTLT------GRQSLYLDHQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- --------------------------SRVDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRMLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RTRINPLFLAGGYAQ---------FTYGFNYW -GPTGIFTRDTHVVVRKME-------KLEW------------------------------- ----- ->Nitrobacter_sp_Nb_311A_ZP_01048070 ------------------------------------------------------------- ---------------------------------MS-WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRVKYPYIRGPLYD---------LWREAKASH-PDPVQA -WASLVGDEQKRLRMQKARGKGGFRRAKWEELVELIAAAALYTARKW----GPDRV-MGFS -PIPAMSMLS------YAAGSRFLQL----------------------------------- ----FGGVNMSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMAANMNMTRTPDVH -FIAEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYI----D -RQVPYFIDYVKRYTDLPFLVELEP-----NGNTYKTGRLLR---------AKRVARY--Q -DVENGDWKMLVLDSKTGEPRAFKGQVGDRW--------GSTHGKWNLSAED----TLDNS -PIDPVLSFIDQSDGVVQVGF------D---------------------DFVNGSV----- -----------------------------VSRGVPVKRIATD-KGEVLVTTG--------- ----FDIMMSQ-FGHSRGL--------EGSFATSYDDENAPYTPAWQERHTGIGRETAIRF -AREF------ATNAELTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWNTIAMALDWTKPPRVVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPRWAKGHAIDLQAKAVRSGWMPF-----TPHFN-RNPIELAAEAERAG -AKS------TDDIVTHVVDQVAS---------------KKVNFAIDDPDAEE-SWPRMWF -IWRGNAIQS---SAKGHEFFLRHYLGAHDNSIA-----EDRAKGKTQRVKYRDTAPRGKY -DLVVDLNFRMNTTSLYSDIVLPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWEIFKLIAKKVSELSPLAFSKPVRDVVVQPLMHDTPDELAQPE-----ILDWAEG -ECKPVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGVSAVGVQIPIKKQYDQMLDN -PIMPMPDPRHMRCVEWGGKRYPSLEDVLDACNTLLMCAPEANGEVCYQGFHNEEHH---- ------VGLPLVDIAEPTR----G-VSSTFY-DLTRQPRRILTSPCWTGMTNDGRAYSAWC -MNVERLVPWRTLT------GRQTLYIDSQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- --------------------------SRVDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRMLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RTRINPLFLAGGYAQ---------FTYGFNYW -GPTGIFTRDTHVVVRKME-------KLEW------------------------------- ----- ->A_Nitrobacter_hamburgensis_YP_578638 ------------------------------------------------------------- --------------------MS--------------WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRVKYPYIRGPLLD---------MWREAKASS-ADPVQA -WGALIGDEQKRSRIQKARGKGGFRRAKWEELVELIAAASLHTARKH----GPDRI-MGFS -PIPAMSMLS------FAAGTRFLSL----------------------------------- ----MGGSLMSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMASNMNMTRTPDVH -FISEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYV----D -RQVPYFVDYIKRYTDLPFLVELES-----NGNTYKTGRLLR---------SNRVPRY--K -DVENGDWKMLLLDANSGELRAPKGQVGDRW--------GSVHGKWNLSGED----TLDNS -PLDPVLSFIDRSDDVVQVGF------D---------------------DFANGRI----- -----------------------------VSRGVPVKRVATD-KGEILCATG--------- ----FDIMMSQ-FGISRGL--------EGAFATSYDDEDAPYTPAWQERHTGIGRETAIRF -AREF------ATNAELTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWATVALALDWAKPPRLVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPKWAKGHAIDLEAKAVHNGWMPF-----TPHFN-RNPIEVAAEAERSG -AKN------VQDIETYVVDQVVS---------------KKLQMAIDDPDAAE-NWPRMWF -IWRGNAIQS---SAKGHEFFLRHYLGAHDNAIA-----EDRAKGKAQVVKYHETAPRGKY -DLVIDLNFRMNTTSLYSDIVLPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWEIFKLIGKKVSELAPLAFSKPVRDVVLQPLMHDTPDELAQPE-----ILDWSLG -ECKAVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGISAVGVQIPIKKQYDQMLDN -PIMPMPDPRHMRCVEWGGKRYPSLEDVLDACNTVLLCAPEANGEVCYQAFHNEEHH---- ------VGLPLVDLAEPNR----N-VAATFY-DLTRQPRRIITSPCWTGMVNDGRAYSAWC -MNVERLVPWRTLT------GRQSLYLDHQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- -----SR---------------------VDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRMLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RTRINPLFLAGGYAQ---------FTYGWNYW -GPTGILTRDTHVVVRKME-------KLEW------------------------------- ----- ->B_Nitrobacter_hamburgensis_YP_578186 ---------------------------------------------------------MTTG -LAAGQR--------TEETQMS--------------WILDLVNPRER------KW-EEFYR -NRWSH------DNVFRSTHG-VNCTGGCSWAIYVKDGIITWEMQQTDYPLLE-----RSL -PPYEPRGCQRGISASWYVYSPIRIKYPYVRGPLLD---------MWREAKASS-ADPVQA -WGALVGDEQKRARMQKARGKGGYRRAKWEELVELIAAASLHTARKH----GPDRI-MGFS -PIPAMSMLS------FAAGTRFLSL----------------------------------- ----MGGSLLSFYDWYADLPTSFPEIWGDQTDVCESADWYNSKFIVSMASNLNMTRTPDVH -FIAEARTEGTKFVVLSPDFSQIAKYCDEWIPIQAG-QDTALWMAANHVILKEYYV----D -RQVPYFIDYVKRYTDLPFLVELEP-----NGTTYKTGRLLR---------ARHVPRY--K -DVENGDWKMLLLDANSGELRAPKGQVGDRW--------GSVHGKWNLSGED----TLDNS -PLDPVLSFIDRSDDVVQVGF------D---------------------DFANGRI----- -----------------------------VSRGVPVRRIATD-KGEILCATG--------- ----FDIMMSQ-FGISRGL--------EGAFATSYDDEDAPYTPAWQERHTGIGRETAIRF -AREF------ATTAEYTNGKSMVIVGASANHWYYNN-LCYRSATVALILCGCCGVNGG-G ---INHYVGQEKLAPVA---PWASIALALDWSKPPRVVQSSTWHYAHSCQWRYEQEFTEYG --------LTAPNPRWAKGHAIDLEAKAVRSGWMPF-----TPHFN-RNPIEVAAEAERAG -AKS------TEDIATHVIDQVAS---------------KKLNLAIEDPDAAE-NWPRLWF -IWRGNAIQS---SAKGHEFFLRHYLGTHDNAIA-----EDRAKGKTHTVKYHDTAPRGKY -DLVVDLNFRMDTSSLYSDIVLPTAFW--YEKNDLNTTDLH-SFLHV----L-GQAVPPVW -ESKTDWDIFKLIAKKVSELAPLAFSKPVRDVVLQPLMHDTPDELAQPE-----ILDWAEG -ECKPVPGKSFPHVRVVERDY--ANLYNKFISFGPKAREDGVSAVGVNVPIKKQYDQMLDN -PIMPMPDPRHMRCVEWGGKRYPSLEDVLDGCNTVLLCAPEANGEVCYQAFHNEEHH---- ------VGLPLVDLAEPTR----N-VATTFY-DLTRQPRRLLTSPCWTGMMNDGRAYSAWC -MNVERLVPWRTLT------GRQTLYIDHQWYLDFGEHIPTYKPRLN--PRK--TGDIVK- --------------------------SRVDDRSLVLNY-------------------ITPH -GKWNIHSTYKDNHRMLMLSR---------------GMDPVWINDRDAEKVGIEDNDWV-- ----------------EVYNDNGVVVTRANVSRRIQPGTCMYYHAVE-------------- ---RTVYIP-KSQERKWRGGGHNSLT---RTRINPLFLAGGYAQ---------FTYGWNYW -GPTGILTRDTHVVVRKME-------KLEW------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0000472_14 rank: A; doe:DENOEST_1434 s25dA; putative steroid C25 dehydrogenase-like alpha-subunit; K24713 (db=kegg) --------------------------------------MGQRSTWGVVSESRRRFLVKAGL -ASAAGA--------AINLNLFGCGRSHAPLQHFKGTTAGHFDLGPRTTPKLGNW-QDLYR -QRWTW------DKVVKGSHGWANCRSACEWDLYVKDGIVVREEQSATYEASE-----PGV -PDFNPRGCQKGACYTEVMYGPSRTTVPLKRVG---------------------------- -----------------PRGSGQWEKISWEQAIKEIAQKTVDAVTEF----GTDTVFQDLG -PNFDFGPST--------AGRFKFMYQAGSLFADM-------------------------- ---------WGEI---GDLNFGATMALGAAQIGGSSDEWFLSDFIVVWMMNPSVTQIPDAH -FLYEARYNGTELVVIDPQYSATAIHADQWLPIETG-TDAALGLAVARHLFEVNAI----D -------LPFVREQTDLPLLVRLDTGRFLRETDLNSG------------------GNA--- ----------------------------------------DQLYLWHPQKNAPVFAPGC-- --------TGNTTRKLTLDFE----------------------------APIDGQW----- -------------------------------------TIKLH-DGKEVAIAPVGAL----- ----LKEHLEP-WTFEHTA-----------------------------SVTHLHVDQVKKF -AEGW-----------AKCQRPMVLSSWGSNRFVHSD-LMNRSKILCLMLKGALGKKGT-G ----YQATGIVDMEGFNNAMQMDHEGVR--------------------------------- -------------------------------GRLGALLGIMPPADLFQAVLDIVMQRKTEG -DVAL-----ETEMNYL-----KHHLCSSDVMESNFKAPGYRAAVVKEHEGMLPRSLESYY -QEARQKDWS---QGLPRKAPVKVYFSGGANILRRSNMP-----------QYYKTFIWDEM -QCIVDINPKYSFTGTQSDYILPAAGW--YEKAGIKYTMSYVPYLH-----YCDVAVPPLG -ESKGEWEIFWLLTREMERYA---------------------------------------- ---KEKNLPVLDGCGRGSNDF--KTLHQRYSNQGELGQ----------------------- --------------------------------HDDEKVMKEILHGDATEGMTIEGLKQTGI -AKFTSAGKPVAADAINNP----D-WKGEGV-MTTLTRFTVHKEPWPTYS----------- --------------------GRITSFIDHPWFIEMREQFPIHKDSPKAGG----------- ---------------------------------------------------DYPFQFVSCH -ARWSIHSTWRDTPMMLRLQR---------------GEPLVYINPIDAERVGVKDFEYV-- ----------------EIFNNYGSVRMRVKVAAMVRPGVAYYYHAWE-------------- ---------------PHQFPNHQSFKWLIPGLVNPLYMAGGYGQ---------INHAMNRY -QPG-SAVQDTRIGIR------------PW---HGQATGAHPVKRPEAAATSK-------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001772_1 rank: C; doe:DENOEST_1434 s25dA; putative steroid C25 dehydrogenase-like alpha-subunit; K24713 (db=kegg) --------------------------------------MGNLIKTGIASASRRKFLVMAGA -ASAAGA---------ALSLFGCGRAPLQH--FKGTTASGRFDLGPRTAPKLGNW-QDLYR -QRWTW------DKVAKGSHGWANCRSACEWDLYVKDGVVVREEQSATYEASE-----PGI -PDFNPRGCQKGACYTEVMYGPSRTTVPLKRVG---------------------------- -----------------SRGSGKWEKISWEQAMKEIAQKTVDAAEKW----GTDTIYQDLG -PNFDFGAST--------AGRFKFQF----------------------------------- ---MAGGVFADNWAEIGDLNVGASITTGAAHLGGSSDEWFLSDFIIVWMMNPSVTQIPDAH -FLYEARYNGTELVVIDPQYSATAIHADQWLPLESG-TDAALGLAVARHLLETGAI----D -------LPYIREQTDLPLLARLDTGRFLRESEMVNG------------------GNA--- ----------------------------------------DQLYMWHPQKNAPVPAPGC-- --------LNNTTRNLKLDFE----------------------------PPIDGQW----- -------------------------------------KVKLA-DGKEVGVVPVGAM----- ----LKEHLDS-WTFEHAA-----------------------------KVTHLHIDQIKKF -AEGW-----------AKAQRPMVLSSWGSNRYVHSD-LMNRTKLLLLMLKGAMGKKGA-G ----------YQATGWV-------------------------------------------- ----------------------------------------------DLDGFGNAMQMEKSG -MT------------------------------------GRLAVMLNAM------------ ---------P--------------------------------------------------- ------------------------------------------P------------------ ------------------------------------------------------------- -----------------------KELFNA-------------------------------- --------------------------------VVDIIKKRKTEGDVALEG----------- ----------------ENN----Y-LRTK-------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------LCTSDVVEVNLKSDGY--- -----------------------RAALNKEQKGLYPHELDEYYKEAHD------------- -----------------------------KGWAP--------------------------- -----GLPRKAPPKIFF-------------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_3 rank: A; ag:AFF61325 s25dA; steroid C-25 hydroxylase alpha subunit (EC:1.17.99.10); K24713 (db=kegg) -----------------------------------------------MSISRRHFIVGSAV -AVAGVG------------LYS--LRPKKP--VVYPVGVRAPKVAAR-KVHYNDY-SDIWR -EKWKW------DKVVKGTHTRANCCAACSWDVYVRDGIAWREEQAAIYEPHR-----PDV -PDFNPRGCQKGACYTQLQVSEARVKYPLKCVG---------------------------- -----------------ERGEGKWKRVSWDTALDEIADRLIDIAVRDGTESIIFDDTTNVG -YGPE-----------TAGDVRFAAA----------------------------------- ----IQATRLDSWSGVGDMPNGLIQTWGLYNCEGTSDDWYLSDYIVIWVGNPNYTRIPDAH -FLHEARYRGAKLVVVAPDLNPSTAHADLWINVNAE-TDSALALSCAQVMIAEKLY----K -------KDYVLQQTDFPFLVRKDDQRFLRAADMVKG--------------GAD------- ----------------------------------------NALYLWDEAKHAPVIAPGCEG --------DGDGGRIMALGGI------K---------------------PALSGTF----- -------------------------------------KVTTQ-DGKTVEVQTVFDM----- ----IRAKLDAEYTPEQAA-----------------------------KITGLHPNVIRTF -AREM-----------AAAPKAMIIASYGSCKHYHHD-LNQRSFVLLMNLTGNQGQQGG-G ----------YRISAW-----WAMDGLD--------------------------------- -------------------------------QMADSTVPLKDMLRIIPKAIRGLSPRDYEG -LFTEYSDKEGHTPALLFLY--LH---------------GGYKEMWDKPHLQDPALPRPF- ---ADYVQES---IDKGW-SKVHPPLGREPRAYI---FTGGNPLRRWPSPQIAKQHLWPKF -ELVVSVNFRMSTSSLFSDYVLPVAAY--YEKYGIKYAQTYVPYIIT----S-DKATEPLG -ESKSDWETFGLLSKHVAERARVRGVTMVRGL----------------------------- ----------------KDVLFDLSKAYEVHTHHG--------------------KYDP--- ----------------------------TDPEDPIKLMDAIFANSPSIGCNTGREALDMGA -VPVIGTGRPSLIDQNYSP----YDPKDTYW-PHKDFIDKKIAWPTLT------------- --------------------GRQQFYIDHPWFLEGKEHLPTFKPSIHANSKF--PLRMYG- -----------------------------------------------------------GH -NRWSIHAVWRDVKLLLRLQR---------------GQPACWLNPKEAEKRGIKDGDMV-- ----------------RVFNDHGTCECMVKVSAITAPGEVIIYHAW--------------- ----------EPYQFKKWQGNQEPVE---APW-KALHLAGGYAQ---------LHWRVYYH -GPN-HSPRGAPVEVEKIGYEGG-------------------------------------- ----- ->flintriver_2019_sw_WHONDRS-S19S_0015_A_bin.5_Ga0451753_0001210_4 rank: C; ag:AFF61325 s25dA; steroid C-25 hydroxylase alpha subunit (EC:1.17.99.10); K24713 (db=kegg) -----------------------------------------------MQISRRGFIVGSAV -AAAGVG--------LYSLKSK--KAVIKPGITLP-DKTPAKKIKYN------DY-SDIWR -EKWKW------DKVVKGTHTRANCCAACSWDVYVRDGIAWREEQNAIYEPPR-----PGI -PDQNPRGCQKGACYTALQLSESRVKYPLKRAG---------------------------- -----------------NRGEGKWKRISWDEALTEIADKLLDIAVAEGTETICFDDLSNTG -YGPETAGDFR-----FSTGMQVSRL----------------------------------- ----------DGWSGVGDMPLGVIQTWGAFNCEGTSDDWFRSDYIVIWLGNPSYTRIPDAH -FLHEARYRGAKLVVVAPDLNATTVHADMWLNVKPE-TDAALGLACAQIMISENLY----K -------KDYVLEQTDFPFLVRKDNQRFLRVSDVVKG--------------GAD------- ----------------------------------------NAFYLWDEAKNAIAMAPGCEG --------DGDGGRSLKLGAL------K---------------------PALSGTR----- -------------------------------------SVKLA-DGSTVECITVFDM----- ----IKERLDKEHTPEQAA-----------------------------KITGLHPNVIRTF -AREM-----------AAAPSAMIIASYGACKHYHSD-LFQRSFILLMNLTGNQGKPGG-G -MRVAAWWGMDGLDAMA----DSTIPMA--------------------------------- -----------------------------------------DMMKIIPKAVRGLTPRDYES -LYTDYSNREGHTPTMVFLY--VH---------------GGYKELWDKPYLQDPNLPRNI- ---SSYMRES---IDKGW-TKVHPPENKSPKAYI---FTGGNPLRRWPSPQIAREKLWPKF -DLVCSVTFKMSTSTLWADYVLPVAAY--YEKYGIKYAQSYVPYIIS----S-DKATEPLG -ESKSDWETFGLMAKKVAERAKARNITMVRGL----------------------------- ----------------DDKPFDVSKVYDFYTGNG--------------------KYDP--- ----------------------------TDPEDPVRLMDEIFAGSPNVACNSAREALQRGA -VPVTGPGRPSLINQNYSD----YDGKDTYW-PHRDFIEKKVAWPTIT------------- --------------------GRQQFYIDHPWFIEGKEALPTHKAPPLATSKF--PLRMYG- -----------------------------------------------------------GH -NRWSIHSIWRDVKLLLRLQR---------------GQPAAWMNPAELQKRGLKDGDMV-- ----------------RVYNDHATFECNIKSSPATAPGEIIVYHAWEPFQFK--------- -----------------KWQSNQEVT---EAPVKGLHLAGGYTQ---------LHFRVYYG -SMH-HTPRGAAVEVEKAPT----------------------------------------- ----- ->NASQAN2015_111_B_bin.76_k121_226837_116 rank: A; sdf:ACG33_10685 putative steroid C25 dehydrogenase (S25dA4); K24713 (db=kegg) -----------------------------------------------MSVSRRQFLAHSAL -AGAALA-----------------LQHGDA------LADALTR-PYR------RI-EDIWR -KKWTW------DRVAHGTHG-TNCAGTCAFNVYIRNGVVWREEQQAEYERSGT----PDV -PDYGPRGCNKGLRHARYMYGKQRVLYPMKRVG---------------------------- -----------------KRGEGKWQRISWDQATREIAEKFIEVAVKH----GPDSITLGSG -TQLAVKMAS------YSALARFSNI----------------------------------- ----TGVTVPEFYSGVGDLPTGFYMTTGLTYLGDTMAAVFKSKCVLVWMANPAVTRIPDAH -FFWEAKYNGTEVVTISPEFTPTAMHSSKWLNIKPG-TDTALAMAMVHTIIEEKLY----D -------AAYIREQTDLPFLVREDNGEFLRAEDLN----------------LVDMLAV--- ---------------------------RENV-----------FYLWDQKTRRIVRAPGTGA -AEAPVGRRRRKFETIALGNI------E---------------------PALEGRW----- -------------------------------------TVETR-TGK-VTVTTVFAL----- ----LRKRATE-HSPEKMS-----------------------------TETGLNPKAMRTV -AREF----------AKAGQRAMIYAGFSACKWLHGD-ILQRSMVLLCALTGATGHEGG-G ---VQMANGPKSRGITS--FAFAGVGAA--------------------------------- ------------------------SRVVASTLWDYD-----HGKMKQLNEKIYGKKLA--- ----------DEFDSHY-----QH------------------------------SLEEDWF -------PQY---GKNGWKMGIFAGENGANWRAS--------------GNRWRTEAF-EKL -EMIVALVPDAGITMHHADIVLPIAHH--YERADIMLQSRH-PYVQV----L-DTAVKPLG -EAVDDFEALRRVSAAISTIAREKATPAIKDD----------------------------- ----------------VDGRTFRRDLKRT-----------------------LELYTM--- ---------------------------DGAIRDSRDIVQFIINATPGIPKMSFAELAAKGI -VRVDESRDSTVW----------NSDESPFHADIAESVHEKR--PYETLT----------- --------------------GRQQFYIDHEWFLKFDEALPVYHPPLKQQGYP--LQMTMG- ------------------------------------------------------------H -ARHGIHSMWRDDSFLVSLQR---------------GEPDIYVNPDDAAARKVRDGDLI-- ----------------EVFNDAGSFVCMAHLSAGIMPGTLYMYHGWD-------------- -------------PTMFRGRQNFAAVIPTAGLVKPTSVAGDYGH---------LGYRVLAY -APN-QTYRDFTCEFKLYS-------RGKV---TAAKARIA-------------------- ----- ->icacos_2019_sw_WHONDRS-S19S_0094_F_bin.26_scaffold_99_5 rank: A; sdf:ACG33_10685 putative steroid C25 dehydrogenase (S25dA4); K24713 (db=kegg) -----------------------------------------------MSVNRRQFLAHSAL -AGAALA-----------------LQHGDA------LADALTR-PYR------RI-EDVWR -KKWTW------DRVAHGTHG-TNCAGTCAFNVYIRNGVVWREEQQAEYERSGT----PDV -PDYGPRGCNKGLRHARYMYGKQRVLYPMKRVG---------------------------- -----------------KRGEGKWQRISWDQATREIAEKFIEVAVKH----GPDSITLGSG -TQLAVKMAS------YSALARFSNI----------------------------------- ----TGVTVPEFYSGVGDLPTGFYMTTGLTYLGDTMAAVFKSKCVLVWMANPAVTRIPDAH -FFWEAKYNGTEVVTISPEFTPTAMHSSKWLNIKPG-TDTALAMAMVNTIIEEKLY----D -------AAYIREQTDLPFLVREDNGEFLRAEDLN----------------LVDMLAV--- ---------------------------RENV-----------FYLWDQKTRRIVQAPGTGA -AEAPVGRRRRKFETIALGNI------E---------------------PALEGRW----- -------------------------------------NVETR-TGK-VTVTTVFAL----- ----LKKRAAE-HSPEKMS-----------------------------AETGLNPNAMRTV -AREF----------AKAGKRAMIYAGFSACKWLHGD-ILQRAMVLLCALTGATGHEGG-G ---VQMANGPKSRGITS--FAFAGVGAA--------------------------------- ------------------------SRVVASTLWDYD-----HGKMKQLNEKIYGKKLA--- ----------DEFDSHY-----QH------------------------------SLKEDWF -------PQY---GKNGWKMGIFAGENGANWRAS--------------GNRWRTEAF-EKL -EMIVALVPDAGITMHHADIVLPIAHH--YERADIMLQSRH-PYVQV----L-DQAVKPLG -EAVDDFEALRRVSAAISAIAREKGTPAIKDD----------------------------- ----------------VDGRTFRRDLKRT-----------------------LELYTM--- ---------------------------DGAIRDSRDIVQFIINATPGIPKMSFAELAAKGI -VRVDESRGSTVW----------NSDESPFHADIAESVHEKR--PYETLT----------- --------------------GRQQFYIDHEWFLKFDEALPVYHPPLKQKGYP--LQMTMG- ------------------------------------------------------------H -ARHGIHSMWRDDSFLVSLQR---------------GEPDIYVNPDDAAARKVRDGDLI-- ----------------EVFNDGGSFICMAHLSAGIMPGTLYMYHGWD-------------- -------------PTMFRGRQNFAAVIPTAGLVKPTSVAGDYGH---------LGYRVLAY -APN-QTYRDFTCEFKLHS-------RGKV---------------------------TAAK -VRIA ->NASQAN2014_190_B_bin.96_k121_3766_2 rank: A; sdf:ACG33_10685 putative steroid C25 dehydrogenase (S25dA4); K24713 (db=kegg) -----------------------------------------------MSVNRRQFLTHSAL -AAGAAL--------ALHHGAA--------------MADALSR-PYR------RI-EDVWR -KKWTW------DRVAHGTHG-TNCAGTCAFNVYIRNGVVWREEQQAEYERSGT----PDV -PDYGPRGCNKGLRHARYMYGKQRVLYPMKRVG---------------------------- -----------------KRGEGKWQRISWDQATREIAEKFIDVAVKH----GPDSITLGSG -TQLAVKMAS------YSALARFSNI----------------------------------- ----TGVTVPEFYSGVGDLPTGFYMTTGLTYLGDTMAAVFKSKCVLVWMANPAVTRIPDAH -FFWEAKYNGTEVVTISPEFTPTAMHSSKWLNIKPG-TDTALAMAMVHTIIDEKLY----D -------AAYIREQTDLPFLVREDNGEFLRAEDLN----------------LVDMLAV--- ---------------------------RENV-----------FYLWDQKTRRMVQAPGTGA -AEAPVGRRRRKFETIALGNI------E---------------------PALEGRW----- -------------------------------------TVQTR-TGK-VAVTTVFAL----- ----LKKRAAE-HSPEKMS-----------------------------DETGLNPNAMRTV -AREF----------AKAGKQAMIYAGFSACKWLHGD-ILQRAMVLLCALTGATGHEGG-G ---VQMANGPKSRGITS--FAFAGVGAA--------------------------------- ------------------------SRVVASTLWDYD-----HGKMKQLNEKIYGKKLA--- ----------DEFDSHY-----QH------------------------------SLKEDWF -------PQY---GKNGWKMGIFAGENGANWRAS--------------GNRWRTEAF-EKL -EMIVALVPDAGITMHHADIVLPIAHH--YERADIMLQSRH-PYVQV----L-DRAVKPLG -EAVDDFEALRRVSAAISAIAREKGTPAIKDD----------------------------- ----------------VDGRTFRRDLKRT-----------------------LELYTM--- ---------------------------DGAIKDSRDIVQFIINATPGIPKMSFAELAAKGI -VRVDESRGSTVW----------NSDESPFHADIAESVHEKR--PYETLT----------- --------------------GRQQFYIDHEWFLKFDEALPIYHPPLKQKGYP--LQMTMG- ------------------------------------------------------------H -ARHGIHSMWRDDSFLVSLQR---------------GEPDIYVNPDDATARNVRDGDLI-- ----------------EVFNDGGSFICMAHVSAGIMPGTVYMYHGWD-------------- -------------PTMFRGRQNFAAVIPTAGLVKPTSVAGDYGH---------LGYRVLAY -APN-QTYRDFTCNFKLHS-------RGKV---------------------------TAAK -VRIA ->greatmiami_2019_sw_WHONDRS-S19S_0099_F_bin.30_scaffold_496_3 rank: A; sdf:ACG33_10685 putative steroid C25 dehydrogenase (S25dA4); K24713 (db=kegg) -----------------------------------------------MSVNRRQFLAHTAL -ASAALA--------LQHGAAM--ADALTR--------------PYR------RI-EDVWR -KKWTW------DRVAHGTHG-TNCAGTCAFNVYIRNGVVWREEQQAEYERSGT----PDV -PDYGPRGCNKGLRHARYMYGKQRVLYPMKRVG---------------------------- -----------------KRGEGKWQRISWDQATREIAEKFIDVAVKH----GPDSITLGSG -TQLAVKMAS------YSALARFSNI----------------------------------- ----TGVTVPEFYSGVGDLPTGFYMTTGLTYLGDTMAAVYKSKCVLVWMANPAVTRIPDAH -FFWEAKYNGTEVVTISPEFTPTAMHSSKWLNIKPG-TDTALAMAMVHTIIEEKLY----D -------AAYIREQTDLPFLVREDNGEFLRAEDLN----------------LVDMLAV--- ---------------------------RENV-----------FYLWDQKTRRMVQAPGTGA -AEAPVGRRRRKFETIALGDI------E---------------------PALEGRW----- -------------------------------------TVQTR-TGK-VTVTTVFAL----- ----LKKRAAD-HSPENMS-----------------------------AETGLNPNAMRTV -AREF----------AKAGKQAMIYAGFSACKWLHGD-ILQRAMVLLCALTGATGHEGG-G ---VQMANGPKSRGITS--FAFAGVGAA--------------------------------- ------------------------SRIVASTLWDYD-----HGKMKQLNEKIYGKKLA--- ----------DEFDSHY-----QH------------------------------SLKEDWF -------PQY---GKNGWKMGIFAGENGANWRASGN--------------RWRTEAF-EKL -EMIVALVPDAGITMHHADIVLPIAHH--YERADIMLQSRH-PYVQV----L-DRAVKPLG -EAVDDFEALRRVSAAISAIAREKGTAAIKDD----------------------------- ----------------VDGRTFRRDLKRT-----------------------LELYTM--- ---------------------------DGAIKDSRDIVQFIINATPGIPKMSFAELAAKGI -VRVDESRGSTVWNSDESP----FHADIA------ESVHEKR--PYETLT----------- --------------------GRQQFYIDHEWFLKFDEALPVYHPPLKQKGYP--LQMTMG- ------------------------------------------------------------H -ARHGIHSMWRDDSFLVSLQR---------------GEPDIYVNPDDAAARNVRDGDLI-- ----------------EVFNDGGSFICMAHLSAGIMPGTLYMYHGWD-------------- -------------PTMFRGRQNFAAVIPTAGLVKPTSVAGDYGH---------LGYRVLAY -APN-QTYRDFTCNFKLHS-------RGKV---TAAKVRIA-------------------- ----- ->providencecreek_2019_sw_WHONDRS-S19S_0007_B_bin.10_k121_1581149_4 rank: A; shal:SHALO_2978 molybdopterin oxidoreductase, alpha subunit (db=kegg) ----------------------------------------------MANSSRRNFLKASG- ---------------FSAAMLAGQGTLFAKTDVIK-VENAKDSYPNA------SFTETNYR -DEFKFTYGEKAEHGYAYHCV--NCQGNCAWEVWGNNGIVTRENQSAKYPAF------GHN -PDFNPRGCNKGVQHSQVMYEKDRILYPMKRIG---------------------------- -----------------ERGKGKWKRISWDEAATEVAQKLYTTM-------------IDPK -KGPAAITVH------AGTGLLTEGRRPSVLRFGT-------------------------- ---QLGASRIYPASYLGDMFTGAAIAYGEGNMGCTYDFMFNVSTSIMWGANPSATRIPDAH -FVWEGKYNGSKIIVITPEYNATAARAHLWVPIKPG-TDSFLAMSIINEMLAKKLY----- ------LPQAVKTYTDLPFLVDAKTKRFIRRSDAEHA------------------------ ---------------HDEKTHHLYE---------------DEFYCWNLKSGKPELMPGTEG -SERKTIMLKDKGWDI-----------D---------------------PALEGEW----- -------------------------------------EMTLQ-GGKKVKVTTVFEL----- ----LKKEASK-YSAKDTQ-----------------------------KITGVHLDVVTEL -ATHI-----------AKDKCVEITTGFSLNKYFNGV----LSIWNIATICGLTGRFGPRG ------------------------------------------------------------- -------------------------------GLNTE------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------NEFQLSG------------------------------------------------ ------LEALSGFAGKYS------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- -------------------------PRFA-------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ------------------------------------------------------------- ----------SGFLSEFM------------------------------------------- ------------------------------------------------------------- ----- ->muddycreek_2019_sw_WHONDRS-S19S_0082_B_bin.95_k121_853774_5 rank: A; pmx:PERMA_0657 dimethylsulfide dehydrogenase subunit alpha (Dimethylsulfide dehydrogenase molybdenum subunit) (DMS DH alphasubunit) (DMS DH molybdenum subunit) (db=kegg) -----------------------------------------------MKLTRRTVLQGIAG -ASAATVVGGQD---ALGEAGAPAAKTGKD--VPVIIDDPREHYPNT-----RPV-EDMYR -SEFADTFGDPDDHGTAFHCV--NCQGNCAWQVWIKDGKVTRENQSAAYPAIR-----EDI -PDSNPRGCNKGVQHSQVMYEADRIRYPMKRVG---------------------------- -----------------ERGGGKWERISWDEAIDTIAQKLYRTM-------------VERG -PQGNYVH--------VGAGLLSEARGASIKRMGA-------------------------- ---LLGAVRPYIASYVGDMFPGVSLVYGEGNIGCSYDFMYGTNVQVYWGCNPNTSRIPDAH -YVWEGKYNGSKVIVISPEFNSTAIHADRWIPIKPG-FDGHLAMSLMHELVDKQLY----D -------AELVRKFTDLPMLIREDSGAMLRLSDIDPARAAAEGALAFDAELAEKFGKKAHG -KKDHAEDVFLAVNEVGGKLTAMPGGEGSAL---------GTLR----------------- --------LQDVGWKIT--------------------------------PALSGNW----- -------------------------------------TVTLR-DGKTVRVHTVFDA----- ----LRKELEA-FTPEKTH-----------------------------KLTGVHPTLVRDL -ARDI-----------ALPEVVSVTMGFALGKHFNGM-LTQRAIASLMALTCRMGPRGGLN --TENEWSISGLGGLSGFDGAFKHRFAS--------------------------------- -------------------------------GAVSEH----QLGDGAATSKKAYTDDEIRE -ATG------QDAASYR----------------------AEIAALLEKS-----KNDRGVD -PAKGRFGKPWWDTVETFFIVADARFRRNKSGYR--------------------EAFLDKA -KFFAVADMKMGETARFADIVLPSASH--YEVWDLRVNPGYHRFANIA---QPPKGLEPVG -EAKSEWHIATMLVTRMQEIA---------------------------------------- --------------------L--AEYAR--------------------------------- --------------------------------TKNIGVMHIPDPTHTRDGIRPLDKF---- -------------VELFTD----H------------------------------------- --------------------GKLGT---DKQAVEFALGHV--------------------- ------------------------------------------------------------- -------DQFRGEDLESCYDR----------------GGFLVVNDKGGKT----------- -------------------------------SPLYP------------------------- ------------------------------------------------------------- -----DKPYSTF----------------------------------ENHF----------- ----- ->icacos_2019_sw_WHONDRS-S19S_0094_B_bin.166_k121_1114214_14 rank: A; pmx:PERMA_0657 dimethylsulfide dehydrogenase subunit alpha (Dimethylsulfide dehydrogenase molybdenum subunit) (DMS DH alphasubunit) (DMS DH molybdenum subunit) (db=kegg) -----------------------------------------------MSISRRDALRNLLF -GTVAAG--------VAAKVPTAEAKEFSDPQPVR-VDDPRKSYPDT------QTTEDFYR -AEFQAVRGNPDERGFAYHC--VNCQGNCAFEVWTENGKVTRENQSASYPQLA-----PNL -PDANPRGCNKGSQHSQVMYEADRLLYPMKRAG---------------------------- -----------------ERGSGKWKRISWDEAITEIAENL------------HRGL-VEKG -PSSNYVH--------IGAGVLTEARAASIKRLGSL------------------------- ----IGAVRPYIASYVGDMFPGVTVVYGEGNIGCTYDFVFTTNVAVFWGCNPNTSRIPDAH -YLWEGKYNGSKIIVITPEFNSTAIHADLWVPLKAG-YDGHLALSIIHRIIQRKLF----R -------PEFLKEYTDLPFLVRKDTKELVRLSDVALD--------------AKGFDGA--- ----------------SARLFGEHPH--------------ECFLAFNTKNRKFTAMPGTEG -SGVETLRLQDMDWDI-----------D---------------------PALNGSW----- -------------------------------------KLTLK-DGKQVQVTTAFEL----- ----FKKEVAA-FAPEKVQ-----------------------------KLTGVHPSIVDEL -ATDL-----------TKAKVSLVTMGFAVGKHFNGM-LSQRAIASLTAFCGKLGPEGGLN --TENEWNISGLEGLSGFQGKYQHRFAS--------------------------------- -------------------------------GFVSE-----FMLGEGLEDADALYSDEDMR -RGT------GDSKAEY-----KA---------------KVQALLEQGKNDERYKEGKPYW -T-----------TVENFLLFADSRFRRNKGNYQ--------------------KAFLEKA -KFIAYGDVRANDMAIYADILLPCKTP--YECWDLRTNPGYHRYANIA---YPPPNLKPVG -ESKSEWEIATLVVEKLEALAKQKAAAT--------------------------------- ----------------GEDRY---------------------------------VVIP--- --------------------------------DKTHTQEGVRRLDELVREFTKDGTL-RTD -KDAVEYALEHVDQFKPNDTKSLY-ERGGFL-QLNEKAGKSS--PLYADK-----PYNTFE -NQLFLHQRFDTLT------GRLTFYVDHPLWIAANAHVPTAKQPIRPARHP--------- ------------------------------------------------------FVLMTPH -ARWSIHSTYKTSPILLRLQR---------------GKPCVMINPEIARARGIQDGDTI-- ----------------KMFNELGEVRVMAKLSPACPPDALVMEHGWE-------------- ---------------PFMYDGKKGHNLIIGDMLNLLELTDGWGH-------LKFGTNWDGN -----QHAYESTMDIAKA------------------------------------------- ----- ->riogrande_2019_sw_WHONDRS-S19S_0066_B_bin.130_k121_990031_60 rank: A; sul:SYO3AOP1_1175 molydopterin dinucleotide-binding region (db=kegg) -----------------------------------------------MTVSRRDLLKAAAL -GSVAIGSNTLAKNAFTEPIPQKEAKDI----PVI-VEDPRASYLNTK-----SI-EDMYR -REFAETFGEKKDHGYAYHCV--NCQGNCAWQVWTKDGKVTRENQSASYPQIA-----PNI -PDYNPRGCNKGVQHSQIMYEQDRLLYPMKRVG---------------------------- -----------------PRGEGKWKRISWDEAITEVSENLYNTMQE---K----------- --GPAGNYIH------IGAGVLTEGRAASVKRLGT-------------------------- ---LLGAVRPYIASYVGDMFPGVSTVYGEGNIGCTYDFIFKTNVAIFWGCNPNTSRIPDAH -FLWEGKYNGSKIVVISPEYNSTAIHADLWVPIKPG-YDGHLAMAVLNEIVFKKMY----N -------ESFVKEFTDLPLLVRKDNKELVRFAEIDTKDSNFD---------SKSSEKL--- --------------LKKILKRELKEHEVF--------------LAWNQKTNKMTVLPGSEG -SPVETLRLKDRGWNI-----------N---------------------PALSGTW----- -------------------------------------KIKLK-DGHTVEVTTVFDL----- ----FKQELKK-FDPLRMH-----------------------------AVTGVHPTIVSEL -ARDM-----------IVPKNTLVTMGFSLGKYFNGM-LIQRAISALTAISGRLGESGGLN -T-ENEWNITGLSGLSGFEGKYQHRFAS--------------------------------- -------------------------------GFVSE-----YMLGDNLNDYDHLYAEAEIK -EST------GLGKKQY-----RE---------------KIEKIVKDG------ANDEGFK -NGKPYWTTM---ETFLLFADAR--FRRNKGSYK--------------------EAFLKKA -KFIAYGDYRMSDFCNYADILLPCKSH--YEVWDIRTNPG---YHRFANIAYPPANLKNVG -EAKSEWEISTLIAEKIQDIA------------------LKKYKS--------------SG -DKKAIHVPDTTHTQTGFRAL--DEVVNEFTIGG---------------------KVR--- --------------------------------SDKDAVEYMLEHVDQFKPNSTKTMY-ERG -GFLVLNDKAGKSSPLYSN----K-PYNT------FESNKLLYQPFETLT----------- --------------------GRLTFYVDHHLWIETGAHIPTARNPIRPKK----------- ----------------------------------------------------FPFVLMTPH -ARWSIHSTYKTSKILQRLQR---------------GKPYIMINPKVAEAKGIKDGDEV-- ----------------KMFNDLGETFLMAKITPSAPEHSLVMEHGWEPFMYKNKVGH---- ----------------------NALV---GDMINLLELSDGWGH-------LKFGTNWDGN -----QHAYETTVDIVKA------------------------------------------- ----- diff --git a/bin/color_labels.R b/bin/color_labels.R deleted file mode 100755 index a6db0332..00000000 --- a/bin/color_labels.R +++ /dev/null @@ -1,49 +0,0 @@ -#!/usr/bin/env Rscript -# Load necessary libraries -library(ape) - -# Define the input files -newick_file <- commandArgs(trailingOnly = TRUE)[1] -labels_file <- commandArgs(trailingOnly = TRUE)[2] -output_pdf <- commandArgs(trailingOnly = TRUE)[3] - -# Read the Newick tree -tree <- read.tree(newick_file) - -# Read the labels to be colored -labels_to_color_raw <- readLines(labels_file) -labels_to_color <- sapply(strsplit(labels_to_color_raw, "\t"), `[`, 2) # Extract the second column - -# Print the labels to be colored for debugging -cat("Labels to be colored:\n") -print(labels_to_color) - -# Print the valid labels found in the tree for debugging -cat("Valid labels found in the tree:\n") -print(tree$tip.label) - -# Prepare the color vector -tip_colors <- rep("black", length(tree$tip.label)) - -# Apply red color to the specified labels -for (i in seq_along(tree$tip.label)) { - if (tree$tip.label[i] %in% labels_to_color) { - tip_colors[i] <- "red" - } -} - -# Debug statement to check which labels are set to red -cat("Tip colors set to red:\n") -print(tree$tip.label[tip_colors == "red"]) - -# Set plot size -pdf(output_pdf, width = 20, height = 20) - -# Plot the tree without tip labels to adjust spacing -plot(tree, type = "unrooted", show.tip.label = FALSE, no.margin = TRUE) - -# Add tip labels with custom colors and larger font size -tiplabels(tree$tip.label, frame = "none", adj = c(1, 1), col = tip_colors, cex = 0.7) - -# Close the PDF device -dev.off() diff --git a/bin/parse_annotations.py b/bin/parse_annotations.py deleted file mode 100755 index 7326864c..00000000 --- a/bin/parse_annotations.py +++ /dev/null @@ -1,46 +0,0 @@ -#!/usr/bin/env python -import pandas as pd -import sys -import os - -FASTA_COLUMN = os.getenv('FASTA_COLUMN', 'input_fasta') - -def extract_query_ids(tsv_path, ko_terms): - df = pd.read_csv(tsv_path, sep='\t') - - # Split KO terms on newline to handle multiple entries correctly - ko_terms = ko_terms.strip().split('\n') - print(f"Searching for KOs: {ko_terms}") - - # Define columns to search for KO terms, excluding 'query_id' - search_columns = [col for col in df.columns if (col.endswith('_id') or col.endswith('_description') or col.endswith('_EC')) and col != 'query_id'] - - # Debugging: Output the columns being searched - print(f"Searching in columns: {search_columns}") - - # Create a filter mask for any row containing any of the KO terms in the specified columns - mask = df[search_columns].apply(lambda x: x.astype(str).str.contains('|'.join(ko_terms), case=False, na=False)).any(axis=1) - filtered_df = df[mask] - - print(f"Found {len(filtered_df)} matching entries.") - - return filtered_df[[FASTA_COLUMN, 'query_id']] - -def main(): - if len(sys.argv) != 4: - print("Usage: python parse_annotations.py ") - sys.exit(1) - - tsv_path, ko_list_path, output_file = sys.argv[1:] - with open(ko_list_path, 'r') as f: - ko_list = f.read() - - results_df = extract_query_ids(tsv_path, ko_list) - - # Write results to output file - results_df.to_csv(output_file, sep='\t', index=False, header=False) - - print(f"Extracted {len(results_df)} entries written to {output_file}") - -if __name__ == '__main__': - main() diff --git a/bin/update_annots_trees.py b/bin/update_annots_trees.py deleted file mode 100755 index 6ebff2ad..00000000 --- a/bin/update_annots_trees.py +++ /dev/null @@ -1,84 +0,0 @@ -#!/usr/bin/env python -import json -import sys -import re -import pandas as pd -from Bio import Phylo -from io import StringIO - -def load_jplace_file(jplace_path): - with open(jplace_path, 'r') as file: - jplace_data = json.load(file) - return jplace_data - -def load_and_parse_tree(tree_data): - tree_data = re.sub(r'\{(\d+)\}', r'[&edge=\g<1>]', tree_data) - handle = StringIO(tree_data) - tree = Phylo.read(handle, "newick") - return tree - -def find_closest_labeled_ancestor(clade, tree): - if clade.is_terminal() and clade.name: - return clade.name - path = tree.get_path(clade) - for ancestor in reversed(path): - if ancestor.is_terminal() and ancestor.name: - return ancestor.name - min_distance = float('inf') - closest_leaf = None - for leaf in tree.get_terminals(): - distance = tree.distance(clade, leaf) - if distance < min_distance and leaf.name: - min_distance = distance - closest_leaf = leaf.name - return closest_leaf if closest_leaf else "" - -def load_tree_mapping(mapping_tsv): - df = pd.read_csv(mapping_tsv, sep='\t') - return dict(zip(df['gene'], df['call'])) - -def extract_placement_details(jplace_data, tree, tree_mapping): - placements = jplace_data['placements'] - placement_map = {} - for placement in placements: - for placement_detail in placement['p']: - edge_num = placement_detail[1] - clades = list(tree.find_clades({"comment": f"&edge={edge_num}"})) - if clades: - clade = clades[0] - closest_leaf = find_closest_labeled_ancestor(clade, tree) - if closest_leaf and closest_leaf in tree_mapping: - closest_leaf = f"{tree_mapping[closest_leaf]};{closest_leaf}" - else: - closest_leaf = f"No mapping found;{closest_leaf}" - else: - closest_leaf = f"Clade not found;{edge_num}" - for name, _ in placement['nm']: - placement_map[name] = closest_leaf - return placement_map - -def update_tsv(tsv_path, output_tsv_path, placement_map): - df = pd.read_csv(tsv_path, sep='\t') - df['tree_verified'] = df['query_id'].map(placement_map).fillna('') - - # Reorder columns to place 'tree_verified' after 'gene_number' - col_order_start = df.columns.tolist()[:df.columns.get_loc('gene_number')+1] + ['tree_verified'] - col_order_end = [col for col in df.columns if col not in col_order_start] - df = df[col_order_start + col_order_end] - - df.to_csv(output_tsv_path, sep='\t', index=False) - -def main(): - if len(sys.argv) != 5: - print("Usage: python update_annots_trees.py ") - sys.exit(1) - - jplace_path, tsv_path, mapping_tsv, output_tsv_path = sys.argv[1:] - jplace_data = load_jplace_file(jplace_path) - tree = load_and_parse_tree(jplace_data['tree']) - tree_mapping = load_tree_mapping(mapping_tsv) - placement_map = extract_placement_details(jplace_data, tree, tree_mapping) - update_tsv(tsv_path, output_tsv_path, placement_map) - -if __name__ == "__main__": - main() diff --git a/bin/update_tree.py b/bin/update_tree.py deleted file mode 100755 index 9bc228ef..00000000 --- a/bin/update_tree.py +++ /dev/null @@ -1,49 +0,0 @@ -#!/usr/bin/env python -import json -import xml.etree.ElementTree as ET -import re -from collections import defaultdict -import sys -from ete3 import Tree, Phyloxml - -def parse_jplace(jplace_path): - with open(jplace_path, 'r') as file: - jplace_data = json.load(file) - return jplace_data['tree'], jplace_data['placements'] - -def add_placements_to_tree(tree_newick, placements): - # Load the tree - tree = Tree(tree_newick, format=1) - - # Add placements - for placement in placements: - for p in placement['p']: - edge_num = p[1] - name = placement['nm'][0][0] - edge = tree.search_nodes(name=str(edge_num)) - if edge: - new_clade = Tree(name=name, dist=0.0) - edge[0].add_child(new_clade) - - return tree - -def save_tree_as_phyloxml(tree, output_path): - phyloxml = tree.write(format=5) - with open(output_path, 'w') as file: - file.write(phyloxml) - -def main(): - jplace_path = 'aligned_sequences.jplace' # Replace with the actual path if different - output_xml_path = 'aligned_sequences_updated.xml' # Replace with the actual path if different - - # Parse the jplace file - tree_newick, placements = parse_jplace(jplace_path) - - # Add placements to the tree - tree = add_placements_to_tree(tree_newick, placements) - - # Save the tree in phyloXML format - save_tree_as_phyloxml(tree, output_xml_path) - -if __name__ == "__main__": - main() diff --git a/modules/local/trees/trees.nf b/modules/local/trees/trees.nf deleted file mode 100644 index bc3720a3..00000000 --- a/modules/local/trees/trees.nf +++ /dev/null @@ -1,92 +0,0 @@ -process TREES { - label 'process_tiny' - - errorStrategy 'finish' - - input: - path( ch_combined_annotations, stageAs: "initial-annotations.tsv" ) - val( trees_list ) - path( ch_collected_proteins ) - path( tree_data_files ) - path( ch_trees_scripts ) - file( ch_add_trees ) - - output: - path("updated-annotations.tsv"), emit: updated_annotations, optional: true - path("aligned_sequences.jplace"), emit: tree_placements, optional: true - path("colored_tree.pdf"), emit: colored_tree, optional: true - path("colored_tree_python.pdf"), emit: colored_tree_python, optional: true - - script: - """ - # export constants for script - export FASTA_COLUMN="${params.CONSTANTS.FASTA_COLUMN}" - - ln -s ${tree_data_files}/* . - ln -s ${ch_trees_scripts}/*.py . - ln -s ${ch_trees_scripts}/*.R . - - cp initial-annotations.tsv current-annotations.tsv - - # Symlink additional tree directories if provided - if [[ "${params.add_trees}" != "" ]]; then - ln -s ${ch_add_trees}/* ${tree_data_files}/ - fi - - # Append additional tree directories to trees_list - if [ -d "${params.add_trees}" ]; then - for dir in \$(ls ${params.add_trees}); do - trees_list+=";\$dir" - done - fi - - # Split trees_list into an array - IFS=';' read -ra TREE_OPTIONS <<< "${trees_list}" - - for tree_option in "\${TREE_OPTIONS[@]}"; do - echo "Processing tree: \${tree_option}" - - # Determine the search terms file for the current tree - KO_LIST="\${tree_option}/\${tree_option}.refpkg/\${tree_option}_search_terms.txt" - python parse_annotations.py current-annotations.tsv \${KO_LIST} "extracted_query_ids.txt" - - if [ -s "extracted_query_ids.txt" ]; then - # The file is not empty, proceed with processing - - # Loop through each line in the output file, extract the corresponding sequence - mkdir -p extracted_sequences - while IFS=\$'\t' read -r input_fasta query_id; do - seqtk subseq \${input_fasta}_called_genes.faa <(echo \${query_id}) > extracted_sequences/\${input_fasta}_\${query_id}.fasta - done < extracted_query_ids.txt - - # Combine all sequences into one file - cat extracted_sequences/*.fasta > combined_extracted_sequences.fasta - - # Align sequences to the reference alignment - mafft --thread ${params.threads} --add combined_extracted_sequences.fasta --reorder trees/\${tree_option}/\${tree_option}.refpkg/\${tree_option}.aln > aligned_sequences.fasta - - # Run pplacer - pplacer -j ${task.cpus} -c trees/\${tree_option}/\${tree_option}.refpkg aligned_sequences.fasta - - # Generate visualization using guppy tog (translate .jplace to other formats) - guppy tog -o aligned_sequences.xml aligned_sequences.jplace - - # Update the annotations using the mapping and the placements - python update_annots_trees.py aligned_sequences.jplace current-annotations.tsv "trees/\${tree_option}/\${tree_option}.refpkg/\${tree_option}-tree-mapping.tsv" updated-annotations.tsv - - # Set the updated annotations as the current for the next tree - mv updated-annotations.tsv current-annotations.tsv - - # Color labels and generate PDF - Rscript color_labels.R aligned_sequences.xml extracted_query_ids.txt colored_tree.pdf - - else - echo "No gene IDs of interest found for tree \${tree_option}, skipping sequence extraction and analysis." - fi - done - - # Finalize the process - mv current-annotations.tsv updated-annotations.tsv - - """ -} From 8c7dcf8990007331791ec390202e0687e4c0fe83 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Fri, 24 Apr 2026 14:05:10 +0300 Subject: [PATCH 16/19] chore: remove DRAM-v1 db_description_builder and db_utils Both are unreferenced DRAM-v1 helpers under bin/assets/forms/. They shell out to a DRAM-setup.py CLI that isn't part of the DSL2 pipeline, and upstream has already removed them. Co-Authored-By: Claude Opus 4.7 (1M context) --- bin/assets/forms/db_description_builder.py | 964 --------------------- bin/assets/forms/db_utils.py | 287 ------ 2 files changed, 1251 deletions(-) delete mode 100755 bin/assets/forms/db_description_builder.py delete mode 100755 bin/assets/forms/db_utils.py diff --git a/bin/assets/forms/db_description_builder.py b/bin/assets/forms/db_description_builder.py deleted file mode 100755 index c9b4d7d9..00000000 --- a/bin/assets/forms/db_description_builder.py +++ /dev/null @@ -1,964 +0,0 @@ -""" -*DRAM v1/early v2 DB description builder script* - -Contains most of the backend for the DRAM_setup.py script, used to setup databases for each user. -""" -from os import path, mkdir -from datetime import datetime -from shutil import move, rmtree, copyfile -from glob import glob -import gzip -from collections import defaultdict -import logging -import tarfile - -from skbio import read as read_sequence -from skbio import write as write_sequence - -from dram2.utils.database_handler import DatabaseHandler -from db_utils import ( - run_process, - download_file, - merge_files, - remove_prefix, - setup_logger, -) - -NUMBER_OF_VIRAL_FILES = 2 - - -DEFAULT_DBCAN_RELEASE = "10" -DEFAULT_DBCAN_DATE = "07292021" -DEFAULT_UNIREF_VERSION = "90" -DEFAULT_VOGDB_VERSION = "latest" -DFLT_OUTPUT_DIR = "." -LOGGER = logging.getLogger("database_processing.log") -DEFAULT_MMMSPRO_DB_NAME = "db" - -from dram2.camper_kit import download as download_camper_tar_gz -from dram2.camper_kit import process as process_camper_tar_gz -from dram2.camper_kit import DOWNLOAD_OPTIONS as CAMPER_DOWNLOAD_OPTIONS -from dram2.camper_kit import PROCESS_OPTIONS as CAMPER_PROCESS_OPTIONS -from dram2.camper_kit import DRAM_SETTINGS as CAMPER_DRAM_SETTINGS -from dram2.fegenie_kit import download as download_fegenie_tar_gz -from dram2.fegenie_kit import process as process_fegenie_tar_gz -from dram2.fegenie_kit import DOWNLOAD_OPTIONS as FEGENIE_DOWNLOAD_OPTIONS -from dram2.fegenie_kit import PROCESS_OPTIONS as FEGENIE_PROCESS_OPTIONS -from dram2.fegenie_kit import DRAM_SETTINGS as FEGENIE_DRAM_SETTINGS -from dram2.sulphur_kit import download as download_sulphur_tar_gz -from dram2.sulphur_kit import process as process_sulphur_tar_gz -from dram2.sulphur_kit import DOWNLOAD_OPTIONS as SULPHUR_DOWNLOAD_OPTIONS -from dram2.sulphur_kit import PROCESS_OPTIONS as SULPHUR_PROCESS_OPTIONS -from dram2.sulphur_kit import DRAM_SETTINGS as SULPHUR_DRAM_SETTINGS - -KEGG_CITATION = "Kanehisa, M., Furumichi, M., Sato, Y., Ishiguro-Watanabe, M., and Tanabe, M.; KEGG: integrating viruses and cellular organisms. Nucleic Acids Res. 49, D545-D551 (2021)." -GENE_KO_LINK_CITATION = "" -KOFAM_CITATION = "" -UNIREF_CITATION = "" -PFAM_CITATION = "" -DBCAN_CITATION = "" -VOGDB_CITATION = "" -VIRAL_REFSEQ_CITATION = "" -PEPTIDASE_CITATION = "" -DRAM_CITATION = "" -# TODO: check if dbcan or pfam is down, raise appropriate error -# TODO: upgrade to pigz? - - -def get_iso_date(): - return datetime.today().strftime("%Y%m%d") - - -def download_pfam_hmm(output_dir=".", logger=LOGGER, verbose=True): - pfam_hmm = path.join(output_dir, "Pfam-A.hmm.dat.gz") - link_path = ( - "ftp://ftp.ebi.ac.uk/pub/databases/Pfam/current_release/Pfam-A.hmm.dat.gz" - ) - logger.debug(f"Downloading Pfam from: {link_path}") - download_file(link_path, logger, pfam_hmm, verbose=verbose) - return pfam_hmm - - -def download_dbcan( - output_dir=".", - logger=LOGGER, - dbcan_hmm=None, - version=DEFAULT_DBCAN_RELEASE, - verbose=True, -): - dbcan_hmm = path.join(output_dir, f"dbCAN-HMMdb-V{version}.txt") - if int(version) < int(DEFAULT_DBCAN_RELEASE): - link_path = ( - f"http://bcb.unl.edu/dbCAN2/download/Databases/dbCAN-HMMdb-V{version}.txt" - ) - else: - link_path = f"http://bcb.unl.edu/dbCAN2/download/dbCAN-HMMdb-V{version}.txt" - - logger.debug(f"Downloading dbCAN from: {link_path}") - download_file(link_path, logger, dbcan_hmm, verbose=verbose) - return dbcan_hmm - - -def download_dbcan_fam_activities( - output_dir=".", - logger=LOGGER, - version=DEFAULT_DBCAN_RELEASE, - upload_date=DEFAULT_DBCAN_DATE, - verbose=True, -): - dbcan_fam_activities = path.join( - output_dir, f"CAZyDB.{upload_date}.fam-activities.txt" - ) - link_path = f"https://bcb.unl.edu/dbCAN2/download/Databases/V{version}/CAZyDB.{upload_date}.fam-activities.txt" - logger.info(f"Downloading dbCAN family activities from : {link_path}") - download_file(link_path, logger, dbcan_fam_activities, verbose=verbose) - return dbcan_fam_activities - - -def download_dbcan_subfam_ec( - output_dir=".", - logger=LOGGER, - version=DEFAULT_DBCAN_RELEASE, - upload_date=DEFAULT_DBCAN_DATE, - verbose=True, -): - dbcan_subfam_ec = path.join(output_dir, f"CAZyDB.{upload_date}.fam.subfam.ec.txt") - link_path = ( - f"https://bcb.unl.edu/dbCAN2/download/Databases/" - f"V{version}/CAZyDB.{upload_date}.fam.subfam.ec.txt" - ) - logger.info(f"Downloading dbCAN sub-family encumber from : {link_path}") - download_file(link_path, logger, dbcan_subfam_ec, verbose=verbose) - return dbcan_subfam_ec - - -def download_kofam_hmm(output_dir=".", logger=LOGGER, verbose=False): - kofam_profile_tar_gz = path.join(output_dir, "kofam_profiles.tar.gz") - download_file( - "ftp://ftp.genome.jp/pub/db/kofam/profiles.tar.gz", - logger, - kofam_profile_tar_gz, - verbose=verbose, - ) - return kofam_profile_tar_gz - - -def generate_modified_kegg_fasta(kegg_fasta, gene_ko_link_loc=None): - """ - Takes kegg fasta file and gene ko link file, adds kos not already in headers to headers - Whish I knew about this, oh well I may split this out. - """ - genes_ko_dict = defaultdict(list) - if gene_ko_link_loc is not None: - if gene_ko_link_loc.endswith(".gz"): - gene_ko_link_fh = gzip.open(gene_ko_link_loc, "rt") - else: - gene_ko_link_fh = open(gene_ko_link_loc) - for line in gene_ko_link_fh: - gene, ko = line.strip().split() - genes_ko_dict[gene].append(remove_prefix(ko, "ko:")) - for seq in read_sequence(kegg_fasta, format="fasta"): - new_description = seq.metadata["description"] - for ko in genes_ko_dict[seq.metadata["id"]]: - if ko not in new_description: - new_description += "; %s" % ko - seq.metadata["description"] = new_description - yield seq - - -def process_kegg( - kegg_loc, - output_dir, - logger, - gene_ko_link_loc=None, - download_date=None, - threads=10, - verbose=True, -): - if download_date is None: - download_date = get_iso_date() - if gene_ko_link_loc is not None: - # add KOs to end of header where KO is not already there - kegg_mod_loc = path.join(output_dir, "kegg.mod.fa") - write_sequence( - generate_modified_kegg_fasta(kegg_loc, gene_ko_link_loc), - format="fasta", - into=kegg_mod_loc, - ) - else: - kegg_mod_loc = kegg_loc - # make mmseqsdb from modified kegg fasta - kegg_mmseqs_db = path.join(output_dir, "kegg.%s.mmsdb" % download_date) - make_mmseqs_db( - kegg_mod_loc, - kegg_mmseqs_db, - logger, - create_index=True, - threads=threads, - verbose=verbose, - ) - LOGGER.info("KEGG database processed") - return {"kegg": kegg_mmseqs_db} - - -def process_kofam_hmm( - kofam_profile_tar_gz, - output_dir=DFLT_OUTPUT_DIR, - logger=LOGGER, - threads=1, - verbose=False, -): - kofam_profiles = path.join(output_dir, "kofam_profiles") - mkdir(kofam_profiles) - run_process( - ["tar", "-xzf", kofam_profile_tar_gz, "-C", kofam_profiles], - logger, - verbose=verbose, - ) - merged_kofam_profiles = path.join(output_dir, "kofam_profiles.hmm") - merge_files( - glob(path.join(kofam_profiles, "profiles", "*.hmm")), merged_kofam_profiles - ) - run_process(["hmmpress", "-f", merged_kofam_profiles], logger, verbose=verbose) - LOGGER.info("KOfam database processed") - return {"kofam_hmm": merged_kofam_profiles} - - -def download_kofam_ko_list(output_dir=".", logger=LOGGER, verbose=False): - kofam_ko_list_gz = path.join(output_dir, "kofam_ko_list.tsv.gz") - download_file( - "ftp://ftp.genome.jp/pub/db/kofam/ko_list.gz", - logger, - kofam_ko_list_gz, - verbose=verbose, - ) - return kofam_ko_list_gz - - -def download_pfam(output_dir=".", logger=LOGGER, verbose=True): - pfam_full_zipped = path.join(output_dir, "Pfam-A.full.gz") - download_file( - "ftp://ftp.ebi.ac.uk/pub/databases/Pfam/current_release/Pfam-A.full.gz", - logger, - pfam_full_zipped, - verbose=verbose, - ) - return pfam_full_zipped - - -def download_viral( - output_dir=".", logger=LOGGER, viral_files=NUMBER_OF_VIRAL_FILES, verbose=True -): - """Can only download newest version""" - # download all of the viral protein files, need to know the number of files - # TODO: Make it so that you don't need to know number of viral files in refseq viral - - faa_base_name = "viral.%s.protein.faa.gz" - viral_faa_glob = path.join(output_dir, faa_base_name % "*") - for number in range(viral_files): - number += 1 - refseq_url = ( - "ftp://ftp.ncbi.nlm.nih.gov/refseq/release/viral/viral.%s.protein.faa.gz" - % number - ) - refseq_faa = path.join(output_dir, faa_base_name % number) - download_file(refseq_url, logger, refseq_faa, verbose=verbose) - - # then merge files from above - merged_viral_faas = path.join(output_dir, "viral.merged.protein.faa.gz") - run_process( - ["cat %s > %s" % (" ".join(glob(viral_faa_glob)), merged_viral_faas)], - logger, - shell=True, - ) - return merged_viral_faas - - -def download_uniref( - output_dir=".", - logger=LOGGER, - version=DEFAULT_UNIREF_VERSION, - threads=10, - verbose=True, -): - uniref_fasta_zipped = path.join(output_dir, "uniref%s.fasta.gz" % version) - uniref_url = ( - "https://ftp.uniprot.org/pub/databases/uniprot/uniref/uniref%s/uniref%s.fasta.gz" - % (version, version) - ) - download_file(uniref_url, logger, uniref_fasta_zipped, verbose=verbose) - return uniref_fasta_zipped - - -def download_peptidase(output_dir=".", logger=LOGGER, verbose=True): - peptidase_faa = path.join(output_dir, "merops_peptidases_nr.faa") - merops_url = "ftp://ftp.ebi.ac.uk/pub/databases/merops/current_release/pepunit.lib" - download_file(merops_url, logger, peptidase_faa, verbose=verbose) - return peptidase_faa - - -def download_vogdb( - output_dir=".", logger=LOGGER, version=DEFAULT_VOGDB_VERSION, verbose=True -): - vog_hmm_targz = path.join(output_dir, "vog.hmm.tar.gz") - vogdb_url = f"http://fileshare.csb.univie.ac.at/vog/{version}/vog.hmm.tar.gz" - download_file(vogdb_url, logger, vog_hmm_targz, verbose=verbose) - return vog_hmm_targz - - -def process_kofam_ko_list( - kofam_ko_list_gz, output_dir=".", logger=LOGGER, threads=1, verbose=False -): - # TODO: fix this so that it is gunzipped to the path - kofam_ko_list = path.join(output_dir, "kofam_ko_list.tsv") - run_process( - ["gunzip", "-c", kofam_ko_list_gz], - logger, - save_output=kofam_ko_list, - verbose=verbose, - ) - LOGGER.info("KOfam ko list processed") - return {"kofam_ko_list": kofam_ko_list} - - -def process_uniref( - uniref_fasta_zipped, - output_dir=".", - logger=LOGGER, - version=DEFAULT_UNIREF_VERSION, - threads=10, - verbose=True, -): - uniref_mmseqs_db = path.join( - output_dir, "uniref%s.%s.mmsdb" % (version, get_iso_date()) - ) - make_mmseqs_db( - uniref_fasta_zipped, - uniref_mmseqs_db, - logger, - create_index=True, - threads=threads, - verbose=verbose, - ) - LOGGER.info("UniRef database processed") - return {"uniref": uniref_mmseqs_db} - - -def process_mmspro( - full_alignment, - output_dir, - logger=LOGGER, - db_name=DEFAULT_MMMSPRO_DB_NAME, - threads=10, - verbose=True, -): - mmseqs_msa = path.join(output_dir, "%s.mmsmsa" % db_name) - run_process( - ["mmseqs", "convertmsa", full_alignment, mmseqs_msa], logger, verbose=verbose - ) - mmseqs_profile = path.join(output_dir, "%s.mmspro" % db_name) - run_process( - [ - "mmseqs", - "msa2profile", - mmseqs_msa, - mmseqs_profile, - "--match-mode", - "1", - "--threads", - str(threads), - ], - logger, - verbose=verbose, - ) - tmp_dir = path.join(output_dir, "tmp") - run_process( - [ - "mmseqs", - "createindex", - mmseqs_profile, - tmp_dir, - "-k", - "5", - "-s", - "7", - "--threads", - str(threads), - ], - logger, - verbose=verbose, - ) - return mmseqs_profile - - -def process_pfam( - pfam_full_zipped, output_dir=".", logger=LOGGER, threads=10, verbose=True -): - pfam_profile = process_mmspro( - pfam_full_zipped, output_dir, logger, "pfam", threads, verbose - ) - LOGGER.info("PFAM database processed") - return {"pfam": pfam_profile} - - -def process_dbcan(input, output_dir, logger=LOGGER, verbose=True, threads=1): - output = path.join(output_dir, path.basename(input)) - move(input, output) - run_process(["hmmpress", "-f", output], logger, verbose=verbose) - LOGGER.info("dbCAN database processed") - return {"dbcan": output} - - -def process_viral( - merged_viral_faas, - output_dir=".", - logger=LOGGER, - viral_files=NUMBER_OF_VIRAL_FILES, - threads=10, - verbose=True, -): - refseq_viral_mmseqs_db = path.join( - output_dir, "refseq_viral.%s.mmsdb" % get_iso_date() - ) - make_mmseqs_db( - merged_viral_faas, - refseq_viral_mmseqs_db, - logger, - create_index=True, - threads=threads, - verbose=verbose, - ) - LOGGER.info("RefSeq viral database processed") - return {"viral": refseq_viral_mmseqs_db} - - -def process_peptidase( - peptidase_faa, output_dir=".", logger=LOGGER, threads=10, verbose=True -): - peptidase_mmseqs_db = path.join(output_dir, "peptidases.%s.mmsdb" % get_iso_date()) - make_mmseqs_db( - peptidase_faa, - peptidase_mmseqs_db, - logger, - create_index=True, - threads=threads, - verbose=verbose, - ) - LOGGER.info("MEROPS database processed") - return {"peptidase": peptidase_mmseqs_db} - - -def process_vogdb( - vog_hmm_targz, - output_dir=".", - logger=LOGGER, - version=DEFAULT_VOGDB_VERSION, - threads=1, - verbose=True, -): - hmm_dir = path.join(output_dir, "vogdb_hmms") - mkdir(hmm_dir) - vogdb_targz = tarfile.open(vog_hmm_targz) - vogdb_targz.extractall(hmm_dir) - vog_hmms = path.join(output_dir, f"vog_{version}_hmms.txt") - merge_files(glob(path.join(hmm_dir, "VOG*.hmm")), vog_hmms) - run_process(["hmmpress", "-f", vog_hmms], logger, verbose=verbose) - LOGGER.info("VOGdb database processed") - return {"vogdb": vog_hmms} - - -def download_vog_annotations( - output_dir, logger=LOGGER, version=DEFAULT_VOGDB_VERSION, verbose=True -): - vog_annotations = path.join(output_dir, "vog_annotations_%s.tsv.gz" % version) - download_file( - "http://fileshare.csb.univie.ac.at/vog/%s/vog.annotations.tsv.gz" % version, - logger, - vog_annotations, - verbose=verbose, - ) - return vog_annotations - - -def download_genome_summary_form( - output_dir, logger=LOGGER, branch="master", verbose=True -): - genome_summary_form = path.join( - output_dir, "genome_summary_form.%s.tsv" % get_iso_date() - ) - download_file( - "https://raw.githubusercontent.com/WrightonLabCSU/DRAM/%s/data/genome_summary_form.tsv" - % branch, - logger, - genome_summary_form, - verbose=verbose, - ) - return genome_summary_form - - -def download_module_step_form(output_dir, logger=LOGGER, branch="master", verbose=True): - function_heatmap_form = path.join( - output_dir, "module_step_form.%s.tsv" % get_iso_date() - ) - download_file( - "https://raw.githubusercontent.com/WrightonLabCSU/DRAM/%s/data/module_step_form.tsv" - % branch, - logger, - function_heatmap_form, - verbose=verbose, - ) - return function_heatmap_form - - -def download_etc_module_database( - output_dir, logger=LOGGER, branch="master", verbose=True -): - etc_module_database = path.join( - output_dir, "etc_mdoule_database.%s.tsv" % get_iso_date() - ) - download_file( - "https://raw.githubusercontent.com/WrightonLabCSU/DRAM/%s/data/etc_module_database.tsv" - % branch, - logger, - etc_module_database, - verbose=verbose, - ) - return etc_module_database - - -def download_function_heatmap_form( - output_dir, logger=LOGGER, branch="master", verbose=True -): - function_heatmap_form = path.join( - output_dir, "function_heatmap_form.%s.tsv" % get_iso_date() - ) - download_file( - "https://raw.githubusercontent.com/WrightonLabCSU/DRAM/%s/data/function_heatmap_form.tsv" - % branch, - logger, - function_heatmap_form, - verbose=verbose, - ) - return function_heatmap_form - - -def download_amg_database(output_dir, logger=LOGGER, branch="master", verbose=True): - amg_database = path.join(output_dir, "amg_database.%s.tsv" % get_iso_date()) - download_file( - "https://raw.githubusercontent.com/WrightonLabCSU/DRAM/%s/data/amg_database.tsv" - % branch, - logger, - amg_database, - verbose=verbose, - ) - return amg_database - - -def check_file_exists(*paths): - for i in paths: - if i is None: - continue - elif path.isfile(i): - continue - else: - raise ValueError(f"Database location does not exist: {i}") - - -def prepare_databases( - output_dir, - loggpath=None, - kegg_loc=None, - gene_ko_link_loc=None, - kofam_hmm_loc=None, - kofam_ko_list_loc=None, - kegg_download_date=None, - uniref_loc=None, - uniref_version=DEFAULT_UNIREF_VERSION, - pfam_loc=None, - pfam_hmm_loc=None, - dbcan_loc=None, - dbcan_fam_activities: str = None, - dbcan_subfam_ec: str = None, - dbcan_version=DEFAULT_DBCAN_RELEASE, - dbcan_date=DEFAULT_DBCAN_DATE, - viral_loc=None, - peptidase_loc=None, - vogdb_loc=None, - vogdb_version=DEFAULT_VOGDB_VERSION, - vog_annotations=None, - genome_summary_form_loc=None, - module_step_form_loc=None, - etc_module_database_loc=None, - function_heatmap_form_loc=None, - amg_database_loc=None, - camper_tar_gz_loc=None, - number_of_viral_files=NUMBER_OF_VIRAL_FILES, - fegenie_tar_gz_loc=None, - sulphur_tar_gz_loc=None, - skip_uniref=False, - keep_database_files=False, - branch="master", - threads=10, - verbose=True, - select_db=None, - clear_config=False, -): - - dram_settings = { - "kegg": { - "name": "KEGG db", - "description_db_updated": "Unknown, or Never", - "citation": KEGG_CITATION, - }, - "gene_ko_link": {"name": "KEGG Gene KO link", "citation": KEGG_CITATION}, - "kofam_hmm": {"name": "KOfam db", "citation": KOFAM_CITATION}, - "kofam_ko_list": {"name": "KOfam KO list", "citation": KOFAM_CITATION}, - "uniref": { - "name": "UniRef db", - "description_db_updated": "Unknown, or Never", - "citation": UNIREF_CITATION, - }, - "pfam": {"name": "Pfam db", "citation": PFAM_CITATION}, - "pfam_hmm": { - "name": "Pfam hmm dat", - "description_db_updated": "Unknown, or Never", - "citation": PFAM_CITATION, - }, - "dbcan": {"name": "dbCAN db", "citation": DBCAN_CITATION}, - "dbcan_fam_activities": { - "name": "dbCAN family activities", - "citation": DBCAN_CITATION, - }, - "dbcan_subfam_ec": { - "name": "dbCAN subfamily EC numbers", - "citation": DBCAN_CITATION, - }, - "vogdb": {"name": "VOGDB db", "citation": VOGDB_CITATION}, - "vog_annotations": { - "name": "VOG annotations", - "description_db_updated": "Unknown, or Never", - "citation": VOGDB_CITATION, - }, - "viral": { - "name": "RefSeq Viral db", - "description_db_updated": "Unknown, or Never", - "citation": VIRAL_REFSEQ_CITATION, - }, - "peptidase": { - "name": "MEROPS peptidase db", - "description_db_updated": "Unknown, or Never", - "citation": PEPTIDASE_CITATION, - }, - "genome_summary_form": {"name": "Genome summary form"}, - "module_step_form": {"name": "Module step form"}, - "function_heatmap_form": {"name": "Function heatmap form"}, - "amg_database": {"name": "AMG database"}, - "etc_module_database": {"name": "ETC module database"}, - } - dram_settings.update(CAMPER_DRAM_SETTINGS) - dram_settings.update(FEGENIE_DRAM_SETTINGS) - dram_settings.update(SULPHUR_DRAM_SETTINGS) - database_settings = { - "kegg": {}, - "gene_ko_link": {}, - "kofam_hmm": {}, - "kofam_ko_list": {}, - "uniref": {"version": uniref_version}, - "pfam": {}, - "pfam_hmm": {}, - "dbcan": {"version": dbcan_version}, - "dbcan_fam_activities": {"version": dbcan_version, "upload_date": dbcan_date}, - "dbcan_subfam_ec": {"version": dbcan_version, "upload_date": dbcan_date}, - "vogdb": {"version": vogdb_version}, - "vog_annotations": {"version": vogdb_version}, - "viral": {}, - "peptidase": {}, - "genome_summary_form": {"branch": branch}, - "module_step_form": {"branch": branch}, - "function_heatmap_form": {"branch": branch}, - "amg_database": {"branch": branch}, - "etc_module_database": {"branch": branch}, - } - database_settings.update(CAMPER_DOWNLOAD_OPTIONS) - database_settings.update(FEGENIE_DOWNLOAD_OPTIONS) - database_settings.update(SULPHUR_DOWNLOAD_OPTIONS) - process_settings = { - "kegg": {}, - "gene_ko_link": {}, - "kofam_hmm": {}, - "kofam_ko_list": {}, - "uniref": {"version": uniref_version}, - "pfam": {}, - "pfam_hmm": {}, - "dbcan": {}, - "dbcan_fam_activities": {}, - "dbcan_subfam_ec": {}, - "vogdb": {}, - "vog_annotations": {}, - "viral": {"viral_files": number_of_viral_files}, - "peptidase": {}, - "genome_summary_form": {}, - "module_step_form": {}, - "function_heatmap_form": {}, - "amg_database": {}, - "etc_module_database": {}, - } - process_settings.update(CAMPER_PROCESS_OPTIONS) - process_settings.update(FEGENIE_PROCESS_OPTIONS) - process_settings.update(SULPHUR_PROCESS_OPTIONS) - - # setup temp, logging, and db_handler - if not path.isdir(output_dir): - mkdir(output_dir) - temporary = path.join(output_dir, "database_files") - mkdir(temporary) - main_log = path.join(output_dir, "database_processing.log") - setup_logger(LOGGER, *[(main_log, loggpath) if loggpath is not None else main_log]) - db_handler = DatabaseHandler(logger=LOGGER) - if clear_config or select_db is None: - db_handler.clear_config() - - db_handler.config["log_path"] = main_log - db_handler.write_config() - LOGGER.info("Starting the process of downloading data") - - if skip_uniref: - LOGGER.info("Skipping UniRef") - del database_settings["uniref"] - - locs = { - i.removesuffix("_loc"): j - for i, j in locals().items() - if i.endswith("_loc") and j is not None - } - download_functions = { - i.removeprefix("download_"): j - for i, j in globals().items() - if callable(j) and i.startswith("download_") - } - process_functions = { - i.removeprefix("process_"): j - for i, j in globals().items() - if callable(j) and i.startswith("process_") - } - functions = { - i: j for i, j in globals().items() if callable(j) and i.startswith("download_") - } - - # Check any specified paths exist - missing_user_inputs = [i for i in locs if not path.exists(i)] - if len(missing_user_inputs) > 1: - raise ValueError( - f"The fallowing user provided paths don't seem to exist: {missing_user_inputs}" - ) - - un_obtainable = [ - i for i in database_settings if i not in locs and i not in download_functions - ] - - for i in un_obtainable: - LOGGER.info( - f"The {i}_loc argument was not used to specify a downloaded {i} file, and dram can not" - " download it its self. So it is assumed that the user wants to set up DRAM without it" - ) - del database_settings[i] - - # check inputs - if skip_uniref and uniref_loc is not None: - raise ValueError( - "Cannot skip UniRef processing and provide a location of UniRef." - " Skipping UniRef will cause provided UniRef file to not be used." - ) - - if select_db is not None: - miss_name = [i for i in select_db if i not in database_settings] - user_inputs = [i for i in locs if i not in select_db] - if len(miss_name) > 0: - LOGGER.error( - "Only the databases in the db list can be pased to select_db, " - f"you passed {miss_name} which is/are not in the list." - ) - raise ValueError("Bad user input, see log") - - if len(user_inputs) > 0: - LOGGER.error( - f"The user provided location for {user_inputs}, but required it not be used by proving" - f" the select_db argument for other databases. This would suggest that the" - " user may have made a mistake and so this error is rased." - ) - raise ValueError("Bad user input, see log") - - database_settings = {i: database_settings[i] for i in select_db} - - LOGGER.info("Database preparation started") - - # Download DBs - for i, j in database_settings.items(): - if locs.get(i) is None: - LOGGER.info(f"Downloading {i}") - if i in process_functions: - locs[i] = download_functions[i](temporary, LOGGER, **j, verbose=verbose) - else: - locs[i] = download_functions[i]( - output_dir, LOGGER, **j, verbose=verbose - ) - j["Download time"] = datetime.now().strftime("%m/%d/%Y, %H:%M:%S") - j["Origin"] = "Downloaded by DRAM" - else: - j = {k: "Unknown" for k in j} - j["Download time"] = "Unknown" - j["Origin"] = "Provided by user" - j["Original path"] = locs[i] - if i not in process_functions: - LOGGER.info(f"Copying {locs[i]} to output_dir") - locs[i] = copyfile( - locs[i], path.join(output_dir, path.basename(locs[i])) - ) - - LOGGER.info("All raw data files were downloaded successfully") - - # Process databases - for i in locs: - processed_locs = {} - if i in process_functions: - LOGGER.info(f"Processing {i}") - processed_locs = process_functions[i]( - locs[i], - output_dir, - LOGGER, - threads=threads, - verbose=verbose, - **process_settings[i], - ) - else: - processed_locs = {i: locs[i]} - for k, v in processed_locs.items(): - final_dest = path.join(output_dir, path.basename(v)) - if v != final_dest: - for db_file in glob("%s*" % v): - move(db_file, path.join(output_dir, path.basename(db_file))) - v = path.join(output_dir, path.basename(v)) - # update_dram_forms the settings per OUTPUT fill, including the process_settings - # and database_settings, which are per input file. - if db_handler.config.get("setup_info") is None: - db_handler.config["setup_info"] = {} - db_handler.config["setup_info"][k] = { - **dram_settings[k], - **process_settings[i], - **database_settings[i], - } - db_handler.set_database_paths(**{f"{k}_loc": v}) - db_handler.write_config() - LOGGER.info(f"Moved {k} to final destination, configuration updated") - - LOGGER.info("Populating the description db, this may take some time") - db_handler.config["description_db"] = path.realpath( - path.join(output_dir, "description_db.sqlite") - ) - db_handler.write_config() - db_handler.populate_description_db( - db_handler.config["description_db"], select_db, update_config=False - ) - # todo make db handler such that the destruction on success write_config - db_handler.write_config() - LOGGER.info("DRAM description database populated") - - if not keep_database_files: - rmtree(temporary) - LOGGER.info("Database preparation completed") - - -def update_dram_forms(output_dir, branch="master"): - if not path.isdir(output_dir): - mkdir(output_dir) - form_locs = dict() - form_locs["genome_summary_form_loc"] = download_genome_summary_form( - output_dir, branch - ) - form_locs["module_step_form_loc"] = download_module_step_form(output_dir, branch) - form_locs["etc_module_database_loc"] = download_etc_module_database( - output_dir, branch - ) - form_locs["function_heatmap_form_loc"] = download_function_heatmap_form( - output_dir, branch - ) - form_locs["amg_database_loc"] = download_amg_database(output_dir, branch) - db_handler = DatabaseHandler() - db_handler.set_database_paths(**form_locs) - - -""" - -os.system("DRAM.py annotate -i /home/projects-wrighton-2/DRAM/development_flynn/release_validation/data_sets/15_soil_genomes/all_data/Cytophaga_hutchinsonii_ATCC_33406.fasta -o test_15soil --use_camper --use_fegenie") -import os -os.system('DRAM-setup.py prepare_databases --output_dir /home/projects-wrighton-2/DRAM/dram_data/dram1.4_final_06_21_22/ --kegg_loc /home/Database/KEGG/kegg-all-orgs_20220603/kegg-all-orgs_unique_reheader_20220603.pep --threads 40') -os.system('DRAM-setup.py -h ') - version print DRAM version - prepare_databases Download and process databases for annotation - set_database_locations - Set database locations for already processed databases - update_description_db - Update description database - update_dram_forms Update DRAM distillate and liquor forms - print_config Print database locations - import_config Import CONFIG file - export_config Export CONFIG file -os.system('DRAM-setup.py print_config') -os.system('DRAM-setup.py export_config') -os.system('DRAM-setup.py import_config --config_loc dram2/CONFIG') -os.system('DRAM-setup.py set_database_locations') -os.system('DRAM-setup.py update_description_db') - -os.system('DRAM-setup.py prepare_databases --output_dir download_test') -os.system('DRAM-setup.py prepare_databases --output_dir download_test' -os.system('DRAM-setup.py prepare_databases --output_dir download_test --select_db vogdb') - ' --kegg_loc KEGG_LOC /home/Database/KEGG/kegg-all-orgs_20220129/kegg-all-orgs_unique_reheader_20220129.pep" ' # KEGG protein file, should be a single .pep, please merge all KEGG pep files (default: None) - '--threads 30' Number of threads to use building mmseqs2 databases (default: 10) - # '--gene_ko_link_loc ' # KEGG gene ko link, can be gzipped or not - '--kofam_hmm_loc' # hmm file for KOfam (profiles.tar.gz) (default: None) - '--kofam_ko_list_loc' # KOfam ko list file (ko_list.gz) (default: None) - ' --gene_ko_link_loc' # GENE_KO_LINK_LOC KEGG gene ko link, can be gzipped or not (default: None) - ' --kegg_download_date' # Date KEGG was download to include in database name (default: None) - ' --uniref_loc' # File path to uniref, if already downloaded (uniref90.fasta.gz) (default: None) - ' --uniref_version' # UniRef version to download (default: 90) - ' --skip_uniref' # Do not download and process uniref90. Saves time and memory usage and does not impact DRAM distillation - ' --pfam_loc' # File path to pfam-A full file, if already downloaded (Pfam-A.full.gz) (default: None) - ' --pfam_hmm' # pfam hmm .dat file to get PF descriptions, if already downloaded (Pfam-A.hmm.dat.gz) (default: None) - ' --dbcan_loc' # File path to dbCAN, if already downloaded (dbCAN-HMMdb-V9.txt) (default: None) - ' --dbcan_fam_activities' # CAZY family activities file, if already downloaded (CAZyDB.07302020.fam-activities.txt) (default: None) - ' --dbcan_version' # version of dbCAN to use (default: 10) - ' --vogdb_loc' # hmm file for vogdb, if already downloaded (vog.hmm.tar.gz) (default: None) - ' --vog_annotations_loc' # vogdb annotations file, if already downloaded (vog.annotations.tsv.gz) (default: None) - ' --viral_loc' # File path to merged viral protein faa, if already downloaded (viral.x.protein.faa.gz) (default: None) - ' --peptidase_loc' # File path to MEROPS peptidase fasta, if already downloaded (pepunit.lib) (default: None) - ' --genome_summary_form_loc' # File path to genome summary form,if already downloaded (default: None) - ' --module_step_form_loc' # File path to module step form, ifalready downloaded (default: None) - ' --etc_module_database_loc' # File path to etc module database, if already downloaded (default: None) - ' --function_heatmap_form_loc' # File path to function heatmap form, if already downloaded (default: None) - ' --amg_database_loc' # File path to amg database, if already downloaded (default: None) - ' --branch' # git branch from which to download forms; THIS SHOULD NOT BE CHANGED BY REGULAR USERS (default: master) - ' --keep_database_files' # Keep unporcessed database files (default: False) - - - - - - - - - - - - - - - - - - - - - - -) -""" \ No newline at end of file diff --git a/bin/assets/forms/db_utils.py b/bin/assets/forms/db_utils.py deleted file mode 100755 index fc9595bb..00000000 --- a/bin/assets/forms/db_utils.py +++ /dev/null @@ -1,287 +0,0 @@ -""" -*Old DRAM v1/early v2 DB utils code* - - -General utility, available to all dram tools -""" -import subprocess -from dataclasses import dataclass -from urllib.request import urlopen, urlretrieve -from urllib.error import HTTPError, URLError -from typing import Optional -from pathlib import Path -import logging - -# from os import getenv -import pandas as pd - - -def export_posible_path( - path: Optional[Path], relative_path: Optional[Path] = None -) -> Optional[str]: - if path is None: - return None - out_path = path.absolute() - if relative_path is not None and relative_path in out_path.parents: - out_path = out_path.relative_to(relative_path) - return out_path.as_posix() - - -def import_posible_path( - path: Optional[str], relative_path: Optional[Path] = None -) -> Optional[Path]: - if path is None: - return None - out_path = Path(path) - if relative_path is None: - return out_path.absolute() - return (relative_path / out_path).absolute() - - -@dataclass -class Fasta: - """ - The Fasta Class - --------------- - - Store your data and access it safly - """ - - name: str - origin: Path - tmp_dir: Path - faa: Path - fna: None | Path - gff: None | Path - mmsdb: None | Path - - def export(self, output_dir): - return ( - self.name, - export_posible_path(self.origin), - export_posible_path(self.tmp_dir, output_dir), - export_posible_path(self.faa, output_dir), - export_posible_path(self.fna, output_dir), - export_posible_path(self.gff, output_dir), - export_posible_path(self.mmsdb, output_dir), - ) - - @classmethod - def import_strings( - cls, - relative_path: Path, - name: str, - origin: str, - tmp_dir: str, - faa: str, - fna: str, - gff: str, - mmsdb: str, - ): - ob = cls( - name, - import_posible_path(origin), - import_posible_path(tmp_dir, relative_path), - import_posible_path(faa, relative_path), - import_posible_path(fna, relative_path), - import_posible_path(gff, relative_path), - import_posible_path(mmsdb, relative_path), - ) - return ob - - def get_fna(self) -> Path: - """ - Get the fna and handel it not existing - - :returns: - :raises ValueError: - """ - if self.fna is None: - raise ValueError( - "The fna file is not defined, did you import allready called faa files?" - ) - return self.fna - - def get_gff(self) -> Path: - """ - Get the gff and handel it not existing - - :returns: - :raises ValueError: - """ - if self.gff is None: - raise ValueError( - "The gff file is not defined, did you import allready called faa files?" - ) - return self.gff - - def get_mmsdb(self) -> Path: - """ - Get the mmsdb and handel it not existing - - :returns: - :raises ValueError: - """ - if self.mmsdb is None: - raise ValueError( - "The mmsdb file is not defined, are you trying to skip or develop the annotate pipeline?" - ) - return self.gff - - -class DramUsageError(Exception): - "Raised when dram is not used corectly, usally it means you are missing a step" - pass - - -def get_package_path(local_path: Path): - """ - Locate the package data or non python files - - :param local_path: - :returns: - """ - abs_snake_path = Path(__file__).parent.parent.absolute() / local_path - return abs_snake_path - - -def download_file( - url: str, - output_file: Path, - logger: logging.Logger, - alt_urls: None | list[str] = None, -): - """ - Download a file, probably a database - - :param url: - :param output_file: - :param logger: - :param alt_urls: - :returns: - :raises URLError: - """ - # TODO: catching error 4 and give error message to retry or retry automatically - links = [url] if alt_urls is None else [url] + alt_urls - for link in links: - logger.debug("downloading %s" % url) - try: - urlretrieve(link, output_file) - return - except BaseException as error: - # BaseException is good http was to exact - logger.warning(f"Something went wrong with the download of the url: {link}") - logger.warning(error) - raise URLError( - "DRAM whas not able to download a key database, check the logg for details" - ) - # run_process(['wget', '-O', output_file, url], verbose=verbose) - - -def get_annotation_ids_by_row(data, logger): - # functions = {i: j for i, j in ID_FUNCTION_DICT.items() if i in data.columns} - # missing = [i for i in ID_FUNCTION_DICT if i not in data.columns] - logger.info( - "Note: the fallowing id fields " - f"were not in the annotations file and are not being used: {missing}," - f" but these are {list(functions.keys())}" - ) - out = data.apply( - lambda x: { - i - for k, v in functions.items() - if not pd.isna(x[k]) - for i in v(str(x[k])) - if not pd.isna(i) - }, - axis=1, - ) - return out - - -# def get_all_annotation_ids(data, logger): -# data = get_ids_from_annotations_by_row(data, logger) -# data.apply(list) -# out = Counter(chain(*data.values)) -# return out - - -def run_process( - command, - logger, - shell: bool = False, - capture_stdout: bool = True, - save_output: str = None, - check: bool = False, - stop_on_error: bool = True, - verbose: bool = False, -) -> str: - """ - Standardization of parameters for using subprocess.run, provides verbose mode and option to run via shell - """ - # TODO just remove check - try: - results = subprocess.run( - command, - check=check, - shell=shell, - stdout=subprocess.PIPE, - stderr=subprocess.PIPE, - text=True, - ) - except subprocess.CalledProcessError as error: - logger.critical(f"The subcommand {command} experienced an error") - if stop_on_error: - raise error - if results.returncode != 0: - logger.critical( - f"The subcommand {command} experienced an error: {results.stderr}" - ) - logging.debug(results.stdout) - if stop_on_error: - raise subprocess.SubprocessError( - f"The subcommand {' '.join(command)} experienced an error, see the log for more info." - ) - - if save_output is not None: - with open(save_output, "w") as out: - out.write(results.stdout) - - if capture_stdout: - return results.stdout - - -def merge_files(files_to_merge, outfile, has_header=False): - """It's in the name, if has_header assumes all files have the same header""" - with open(outfile, "w") as outfile_handle: - if has_header: - outfile_handle.write(open(files_to_merge[0]).readline()) - for file in files_to_merge: - with open(file) as f: - if has_header: - _ = f.readline() - outfile_handle.write(f.read()) - - -def divide_chunks(l, n): - # looping till length l - for i in range(0, len(l), n): - yield l[i: i + n] - - -def remove_prefix(text, prefix): - if text.startswith(prefix): - return text[len(prefix):] - return text # or whatever - - -def remove_suffix(text, suffix): - if text.endswith(suffix): - return text[: -1 * len(suffix)] - return text # or whatever - - -def get_ordered_uniques(seq): - seen = set() - seen_add = seen.add - return [x for x in seq if not (x in seen or seen_add(x) or pd.isna(x))] From 721fcaa8e1b3fbc30f742a48a6dbd4144d5974e5 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Sat, 25 Apr 2026 22:39:49 +0300 Subject: [PATCH 17/19] fix(db_search): correct DB_channel_SETUP case mismatch Eight references used DB_CHANNEL_SETUP (all caps) but the workflow is defined as DB_channel_SETUP. Groovy is case-sensitive so the references failed at runtime with "No such variable: DB_CHANNEL_SETUP". Co-Authored-By: Claude Opus 4.7 (1M context) --- subworkflows/local/db_search.nf | 16 ++++++++-------- 1 file changed, 8 insertions(+), 8 deletions(-) diff --git a/subworkflows/local/db_search.nf b/subworkflows/local/db_search.nf index 71ccef7d..126f69a3 100644 --- a/subworkflows/local/db_search.nf +++ b/subworkflows/local/db_search.nf @@ -147,7 +147,7 @@ workflow DB_SEARCH { HMM_SEARCH_KOFAM ( ch_combined_proteins_locs, params.kofam_e_value, - DB_CHANNEL_SETUP.out.ch_kofam_db, + DB_channel_SETUP.out.ch_kofam_db, ch_kofam_list, true, kofam_name @@ -172,7 +172,7 @@ workflow DB_SEARCH { HMM_SEARCH_DBCAN ( ch_combined_proteins_locs, params.dbcan_e_value, - DB_CHANNEL_SETUP.out.ch_dbcan_db, + DB_channel_SETUP.out.ch_dbcan_db, default_sheet, false, dbcan_name @@ -189,7 +189,7 @@ workflow DB_SEARCH { HMM_SEARCH_CAMPER ( ch_combined_proteins_locs, params.camper_e_value, - DB_CHANNEL_SETUP.out.ch_camper_hmm_db, + DB_channel_SETUP.out.ch_camper_hmm_db, ch_camper_hmm_list, false, camper_name @@ -210,7 +210,7 @@ workflow DB_SEARCH { HMM_SEARCH_FEGENIE ( ch_combined_proteins_locs, params.fegenie_e_value, - DB_CHANNEL_SETUP.out.ch_fegenie_db, + DB_channel_SETUP.out.ch_fegenie_db, default_sheet, false, fegenie_name @@ -240,7 +240,7 @@ workflow DB_SEARCH { HMM_SEARCH_CANTHYD ( ch_combined_proteins_locs, params.canthyd_e_value, - DB_CHANNEL_SETUP.out.ch_canthyd_hmm_db, + DB_channel_SETUP.out.ch_canthyd_hmm_db, ch_canthyd_hmm_list, false, canthyd_name @@ -255,7 +255,7 @@ workflow DB_SEARCH { HMM_SEARCH_SULFUR ( ch_combined_proteins_locs, params.sulfur_e_value, - DB_CHANNEL_SETUP.out.ch_sulfur_db, + DB_channel_SETUP.out.ch_sulfur_db, default_sheet, false, sulfur_name @@ -291,7 +291,7 @@ workflow DB_SEARCH { HMM_SEARCH_METALS ( ch_combined_proteins_locs, params.metals_e_value, - DB_CHANNEL_SETUP.out.ch_metals_db, + DB_channel_SETUP.out.ch_metals_db, default_sheet, false, metals_name @@ -305,7 +305,7 @@ workflow DB_SEARCH { HMM_SEARCH_VOG ( ch_combined_proteins_locs, params.vog_e_value, - DB_CHANNEL_SETUP.out.ch_vogdb_db, + DB_channel_SETUP.out.ch_vogdb_db, default_sheet, false, vogdb_name From f1a60ec7ccfcb345be621d2faa2577fa5a9e2c51 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Sat, 25 Apr 2026 23:02:11 +0300 Subject: [PATCH 18/19] fix(db_search): correct formattedOutputchannels case mismatch Variable was declared as formattedOutputchannels (lowercase 'c') at line 124, but seven references used formattedOutputChannels (uppercase 'C'), tripping MissingPropertyException at runtime. Co-Authored-By: Claude Opus 4.7 (1M context) --- subworkflows/local/db_search.nf | 16 ++++++++-------- 1 file changed, 8 insertions(+), 8 deletions(-) diff --git a/subworkflows/local/db_search.nf b/subworkflows/local/db_search.nf index 126f69a3..d9abe777 100644 --- a/subworkflows/local/db_search.nf +++ b/subworkflows/local/db_search.nf @@ -153,7 +153,7 @@ workflow DB_SEARCH { kofam_name ) ch_kofam_formatted = HMM_SEARCH_KOFAM.out.formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_kofam_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_kofam_formatted) } // PFAM annotation if (use_pfam) { @@ -180,7 +180,7 @@ workflow DB_SEARCH { ch_dbcan_unformatted = HMM_SEARCH_DBCAN.out.formatted_hits SQL_DBCAN(ch_dbcan_unformatted, dbcan_name, ch_sql_descriptions_db) ch_dbcan_formatted = SQL_DBCAN.out.sql_formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_dbcan_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_dbcan_formatted) } // CAMPER annotation if (use_camper) { @@ -195,7 +195,7 @@ workflow DB_SEARCH { camper_name ) ch_camper_hmm_formatted = HMM_SEARCH_CAMPER.out.formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_camper_hmm_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_camper_hmm_formatted) // MMseqs ch_combined_query_locs_camper = ch_mmseqs_query.join(ch_gene_locs) @@ -216,7 +216,7 @@ workflow DB_SEARCH { fegenie_name ) ch_fegenie_formatted = HMM_SEARCH_FEGENIE.out.formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_fegenie_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_fegenie_formatted) } // Methyl annotation if (use_methyl) { @@ -246,7 +246,7 @@ workflow DB_SEARCH { canthyd_name ) ch_canthyd_hmm_formatted = HMM_SEARCH_CANTHYD.out.formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_canthyd_hmm_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_canthyd_hmm_formatted) } // Sulfur annotation @@ -261,7 +261,7 @@ workflow DB_SEARCH { sulfur_name ) ch_sulfur_formatted = HMM_SEARCH_SULFUR.out.formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_sulfur_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_sulfur_formatted) } // MEROPS annotation if (use_merops) { @@ -297,7 +297,7 @@ workflow DB_SEARCH { metals_name ) ch_metals_formatted = HMM_SEARCH_METALS.out.formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_metals_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_metals_formatted) } // VOGdb annotation if (use_vog) { @@ -311,7 +311,7 @@ workflow DB_SEARCH { vogdb_name ) ch_vog_formatted = HMM_SEARCH_VOG.out.formatted_hits - formattedOutputChannels = formattedOutputChannels.mix(ch_vog_formatted) + formattedOutputchannels = formattedOutputchannels.mix(ch_vog_formatted) } // Viral annotation if (params.use_viral) { From 051d70bc4f19a298bb31d0b4ad6ac9497a7854fc Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Taavi=20P=C3=A4ll?= Date: Sun, 26 Apr 2026 09:44:33 +0300 Subject: [PATCH 19/19] fix(annotate): drop MMSEQS_INDEX publishDir to save disk The mmseqs2 index files (*.mmsdb, .mmsdb.idx, .mmsdb_h, ...) are intermediate, memory-mapped artifacts only consumed by MMSEQS_SEARCH via the Nextflow channel; they are never read from results/. Copying them per-bin can be hundreds of GB and was filling GPFS quota, causing publishDir copy failures that aborted the pipeline. Co-Authored-By: Claude Opus 4.7 (1M context) --- conf/modules.config | 7 ------- 1 file changed, 7 deletions(-) diff --git a/conf/modules.config b/conf/modules.config index 91471656..da436784 100644 --- a/conf/modules.config +++ b/conf/modules.config @@ -107,13 +107,6 @@ process { mode: 'copy', ] } - withName: MMSEQS_INDEX { - publishDir = [ - path: "${params.outdir}/ANNOTATE/MMSEQS2", - mode: 'copy', - ] - } - withName: MMSEQS_SEARCH { publishDir = [ path: "${params.outdir}/ANNOTATE/MMSEQS2",