Repository 'seqsero2s'
hg clone http://toolrepo.galaxytrakr.org/repos/jpayne/seqsero2s

Changeset 21:6041d8f4eeeb (2026-05-15)
Previous changeset 20:4dbbf92ff30a (2026-05-15)
Commit message:
planemo upload commit 24ade7c48613defc1061058737056f0bc64e7709
modified:
Dockerfile
job_conf.yml
misc/bioconda-recipes-seqsero2s-meta.yml
patch_stringmlst.sh
seqsero2S.xml
tool-data/all_fasta.loc.sample
removed:
SeqSero2S/LICENSE
SeqSero2S/MANIFEST.in
SeqSero2S/README.md
SeqSero2S/bin/Initial_Conditions_SS2.py
SeqSero2S/bin/Initial_Conditions_SS2S.py
SeqSero2S/bin/SeqSero2S.py
SeqSero2S/bin/SeqSero2_update_kmer_database.py
SeqSero2S/bin/deinterleave_fastq.sh
SeqSero2S/seqsero2s_db/H_and_O_and_specific_genes.fasta
SeqSero2S/seqsero2s_db/antigens.pickle
SeqSero2S/seqsero2s_db/invA_mers_dict
SeqSero2S/seqsero2s_db/kmer/salmonella.log
SeqSero2S/seqsero2s_db/kmer/salmonella_35.txt
SeqSero2S/seqsero2s_db/kmer/salmonella_aroC.tfa
SeqSero2S/seqsero2s_db/kmer/salmonella_config.txt
SeqSero2S/seqsero2s_db/kmer/salmonella_dnaN.tfa
SeqSero2S/seqsero2s_db/kmer/salmonella_hemD.tfa
SeqSero2S/seqsero2s_db/kmer/salmonella_hisD.tfa
SeqSero2S/seqsero2s_db/kmer/salmonella_profile.txt
SeqSero2S/seqsero2s_db/kmer/salmonella_purE.tfa
SeqSero2S/seqsero2s_db/kmer/salmonella_sucA.tfa
SeqSero2S/seqsero2s_db/kmer/salmonella_thrA.tfa
SeqSero2S/seqsero2s_db/kmer/salmonella_weight.txt
SeqSero2S/seqsero2s_db/mlst.pickle
SeqSero2S/seqsero2s_db/special.pickle
SeqSero2S/setup.py
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb Dockerfile
--- a/Dockerfile Fri May 15 17:55:16 2026 +0000
+++ b/Dockerfile Fri May 15 19:51:16 2026 +0000
[
b'@@ -1,138 +1,138 @@\n-# Multi-stage Dockerfile for SeqSero2S\r\n-# Default build: docker build -t seqsero2s:latest .\r\n-# Test build: docker build --target test -t seqsero2s:test .\r\n-\r\n-# ============================================================================\r\n-# Stage 1: Base image with mambaforge for faster dependency resolution\r\n-# ============================================================================\r\n-FROM condaforge/mambaforge:latest AS base\r\n-\r\n-LABEL maintainer="SeqSero2S Maintainers"\r\n-LABEL description="Simplified Salmonella serotype prediction from genome sequencing data"\r\n-\r\n-# Set environment variables to reduce conda output and ensure non-interactive\r\n-# Disable SSL verification for VPN environments\r\n-ENV CONDA_ALWAYS_YES=true \\\r\n-    CONDA_AUTO_UPDATE_CONDA=false \\\r\n-    DEBIAN_FRONTEND=noninteractive\r\n-\r\n-# Configure conda to skip SSL verification\r\n-RUN conda config --set ssl_verify false\r\n-\r\n-# ============================================================================\r\n-# Stage 2: Builder - Install all dependencies and SeqSero2S\r\n-# ============================================================================\r\n-FROM base AS builder\r\n-\r\n-# Update base packages and install build essentials\r\n-RUN apt-get update && \\\r\n-    apt-get install -y --no-install-recommends \\\r\n-    wget \\\r\n-    ca-certificates \\\r\n-    bash \\\r\n-    && apt-get clean && \\\r\n-    rm -rf /var/lib/apt/lists/*\r\n-\r\n-# Create conda environment with all dependencies\r\n-# Using mamba for faster dependency resolution\r\n-RUN mamba create -n seqsero2s -c conda-forge -c bioconda \\\r\n-    python>=3 \\\r\n-    pip \\\r\n-    setuptools \\\r\n-    blast>=2.2 \\\r\n-    zstd \\\r\n-    samtools \\\r\n-    bedtools>=2.17 \\\r\n-    sra-tools>=2.8 \\\r\n-    spades>=3.9 \\\r\n-    salmid \\\r\n-    bwa>=0.7 \\\r\n-    seqtk>=1.3 \\\r\n-    stringmlst>=0.6 \\\r\n-    mlst>=2.32.2 \\\r\n-    
perl-list-moreutils \\\r\n-    && mamba clean -afy\r\n-\r\n-# Install SeqSero2S from local fork\r\n-WORKDIR /tmp/build/SeqSero2S\r\n-\r\n-# Copy the current build context (the cloned source code) into the container.\r\n-COPY . .\r\n-\r\n-# Install SeqSero2S\r\n-RUN /opt/conda/envs/seqsero2s/bin/python -m pip install . -vv --no-deps --no-build-isolation --no-cache-dir\r\n-\r\n-# Apply the stringMLST.py patch inline using \'sed\'.\r\n-# This exactly replicates the original python patch script by commenting out the old line and adding the new one.\r\n-RUN if [ -f "/opt/conda/envs/seqsero2s/bin/stringMLST.py" ]; then \\\r\n-        sed -i \'s|            log = dbPrefix+\'\\\'\'.log\'\\\'\'|            # log = dbPrefix+\'\\\'\'.log\'\\\'\'\\n            log = os.path.join(os.getcwd(), "kmer.log")|g\' /opt/conda/envs/seqsero2s/bin/stringMLST.py && \\\r\n-        echo "PATCHED: stringMLST.py log path fixed"; \\\r\n-    else \\\r\n-        echo "SKIP: stringMLST.py not found"; \\\r\n-    fi\r\n-\r\n-# ============================================================================\r\n-# Stage 3: Test image - runs validation tests\r\n-# ============================================================================\r\n-FROM builder AS test\r\n-\r\n-# Create test directory\r\n-WORKDIR /test\r\n-\r\n-# Run test commands from the conda recipe\r\n-RUN echo "Running SeqSero2S tests..." 
&& \\\r\n-    /opt/conda/envs/seqsero2s/bin/SeqSero2S.py -h && \\\r\n-    echo "SeqSero2S.py -h: PASSED" && \\\r\n-    /opt/conda/envs/seqsero2s/bin/blastn -help && \\\r\n-    echo "blastn -help: PASSED" && \\\r\n-    /opt/conda/envs/seqsero2s/bin/SalmID.py -h && \\\r\n-    echo "SalmID.py -h: PASSED" && \\\r\n-    /opt/conda/envs/seqsero2s/bin/mlst -h && \\\r\n-    echo "mlst -h: PASSED" && \\\r\n-    echo "All tests completed successfully!"\r\n-\r\n-# Default command shows test results\r\n-CMD ["echo", "All SeqSero2S tests passed successfully!"]\r\n-\r\n-# ============================================================================\r\n-# Stage 4: Production/Distribution image - minimal runtime (DEFAULT)\r\n-# ============================================================================\r\n-FROM condaforge/mambaforge:latest AS dist\r\n-\r\n-# Copy conda environment from builder\r\n-C'..b'&& \\\n+    apt-get install -y --no-install-recommends \\\n+    wget \\\n+    ca-certificates \\\n+    bash \\\n+    && apt-get clean && \\\n+    rm -rf /var/lib/apt/lists/*\n+\n+# Create conda environment with all dependencies\n+# Using mamba for faster dependency resolution\n+RUN mamba create -n seqsero2s -c conda-forge -c bioconda \\\n+    python>=3 \\\n+    pip \\\n+    setuptools \\\n+    blast>=2.2 \\\n+    zstd \\\n+    samtools \\\n+    bedtools>=2.17 \\\n+    sra-tools>=2.8 \\\n+    spades>=3.9 \\\n+    salmid \\\n+    bwa>=0.7 \\\n+    seqtk>=1.3 \\\n+    stringmlst>=0.6 \\\n+    mlst>=2.32 \\\n+    perl-list-moreutils \\\n+    && mamba clean -afy\n+\n+# Install SeqSero2S from local fork\n+WORKDIR /tmp/build/SeqSero2S\n+\n+# Copy the current build context (the cloned source code) into the container.\n+COPY . .\n+\n+# Install SeqSero2S\n+RUN /opt/conda/envs/seqsero2s/bin/python -m pip install . 
-vv --no-deps --no-build-isolation --no-cache-dir\n+\n+# Apply the stringMLST.py patch inline using \'sed\'.\n+# This exactly replicates the original python patch script by commenting out the old line and adding the new one.\n+RUN if [ -f "/opt/conda/envs/seqsero2s/bin/stringMLST.py" ]; then \\\n+        sed -i \'s|            log = dbPrefix+\'\\\'\'.log\'\\\'\'|            # log = dbPrefix+\'\\\'\'.log\'\\\'\'\\n            log = os.path.join(os.getcwd(), "kmer.log")|g\' /opt/conda/envs/seqsero2s/bin/stringMLST.py && \\\n+        echo "PATCHED: stringMLST.py log path fixed"; \\\n+    else \\\n+        echo "SKIP: stringMLST.py not found"; \\\n+    fi\n+\n+# ============================================================================\n+# Stage 3: Test image - runs validation tests\n+# ============================================================================\n+FROM builder AS test\n+\n+# Create test directory\n+WORKDIR /test\n+\n+# Run test commands from the conda recipe\n+RUN echo "Running SeqSero2S tests..." 
&& \\\n+    /opt/conda/envs/seqsero2s/bin/SeqSero2S.py -h && \\\n+    echo "SeqSero2S.py -h: PASSED" && \\\n+    /opt/conda/envs/seqsero2s/bin/blastn -help && \\\n+    echo "blastn -help: PASSED" && \\\n+    /opt/conda/envs/seqsero2s/bin/SalmID.py -h && \\\n+    echo "SalmID.py -h: PASSED" && \\\n+    /opt/conda/envs/seqsero2s/bin/mlst -h && \\\n+    echo "mlst -h: PASSED" && \\\n+    echo "All tests completed successfully!"\n+\n+# Default command shows test results\n+CMD ["echo", "All SeqSero2S tests passed successfully!"]\n+\n+# ============================================================================\n+# Stage 4: Production/Distribution image - minimal runtime (DEFAULT)\n+# ============================================================================\n+FROM condaforge/mambaforge:latest AS dist\n+\n+# Copy conda environment from builder\n+COPY --from=builder /opt/conda/envs/seqsero2s /opt/conda/envs/seqsero2s\n+\n+# Update PATH to use the conda environment\n+ENV PATH=/opt/conda/envs/seqsero2s/bin:$PATH \\\n+    CONDA_DEFAULT_ENV=seqsero2s \\\n+    CONDA_PREFIX=/opt/conda/envs/seqsero2s\n+\n+# Install minimal runtime dependencies\n+RUN apt-get update && \\\n+    apt-get install -y --no-install-recommends \\\n+    ca-certificates \\\n+    procps \\\n+    && apt-get clean && \\\n+    rm -rf /var/lib/apt/lists/* /tmp/* /var/tmp/*\n+\n+# Create working directory\n+WORKDIR /data\n+\n+# Create non-root user for running the application\n+RUN useradd -m -u 1000 -s /bin/bash seqsero2s && \\\n+    chown -R seqsero2s:seqsero2s /data\n+USER seqsero2s\n+\n+# Add metadata labels\n+LABEL org.opencontainers.image.version="1.1.4" \\\n+      org.opencontainers.image.authors="LSTUGA" \\\n+      org.opencontainers.image.url="https://github.com/LSTUGA/SeqSero2S" \\\n+      org.opencontainers.image.documentation="https://github.com/LSTUGA/SeqSero2S" \\\n+      org.opencontainers.image.source="https://github.com/LSTUGA/SeqSero2S" \\\n+      
org.opencontainers.image.licenses="GPL-2.0-or-later" \\\n+      org.opencontainers.image.title="SeqSero2S" \\\n+      org.opencontainers.image.description="Simplified Salmonella serotype prediction from genome sequencing data"\n+\n+# No entrypoint or command for dist target\n+\n+\n'
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/LICENSE
--- a/SeqSero2S/LICENSE Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,342 +0,0 @@\n-NOTE: parties interested in commercial licenses should contact the UGA\xe2\x80\x99s Innovation Gateway (https://research.uga.edu/gateway/).\n-\n-\n-GNU GENERAL PUBLIC LICENSE\n-                       Version 2, June 1991\n- \n- Copyright (C) 1989, 1991 Free Software Foundation, Inc., <http://fsf.org/>\n- 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA\n- Everyone is permitted to copy and distribute verbatim copies\n- of this license document, but changing it is not allowed.\n-\n-                            Preamble\n-\n-  The licenses for most software are designed to take away your\n-freedom to share and change it.  By contrast, the GNU General Public\n-License is intended to guarantee your freedom to share and change free\n-software--to make sure the software is free for all its users.  This\n-General Public License applies to most of the Free Software\n-Foundation\'s software and to any other program whose authors commit to\n-using it.  (Some other Free Software Foundation software is covered by\n-the GNU Lesser General Public License instead.)  You can apply it to\n-your programs, too.\n-\n-  When we speak of free software, we are referring to freedom, not\n-price.  
Our General Public Licenses are designed to make sure that you\n-have the freedom to distribute copies of free software (and charge for\n-this service if you wish), that you receive source code or can get it\n-if you want it, that you can change the software or use pieces of it\n-in new free programs; and that you know you can do these things.\n-\n-  To protect your rights, we need to make restrictions that forbid\n-anyone to deny you these rights or to ask you to surrender the rights.\n-These restrictions translate to certain responsibilities for you if you\n-distribute copies of the software, or if you modify it.\n-\n-  For example, if you distribute copies of such a program, whether\n-gratis or for a fee, you must give the recipients all the rights that\n-you have.  You must make sure that they, too, receive or can get the\n-source code.  And you must show them these terms so they know their\n-rights.\n-\n-  We protect your rights with two steps: (1) copyright the software, and\n-(2) offer you this license which gives you legal permission to copy,\n-distribute and/or modify the software.\n-\n-  Also, for each author\'s protection and ours, we want to make certain\n-that everyone understands that there is no warranty for this free\n-software.  If the software is modified by someone else and passed on, we\n-want its recipients to know that what they have is not the original, so\n-that any problems introduced by others will not reflect on the original\n-authors\' reputations.\n-\n-  Finally, any free program is threatened constantly by software\n-patents.  We wish to avoid the danger that redistributors of a free\n-program will individually obtain patent licenses, in effect making the\n-program proprietary.  
To prevent this, we have made it clear that any\n-patent must be licensed for everyone\'s free use or not licensed at all.\n-\n-  The precise terms and conditions for copying, distribution and\n-modification follow.\n-\n-                    GNU GENERAL PUBLIC LICENSE\n-   TERMS AND CONDITIONS FOR COPYING, DISTRIBUTION AND MODIFICATION\n-\n-  0. This License applies to any program or other work which contains\n-a notice placed by the copyright holder saying it may be distributed\n-under the terms of this General Public License.  The "Program", below,\n-refers to any such program or work, and a "work based on the Program"\n-means either the Program or any derivative work under copyright law:\n-that is to say, a work containing the Program or a portion of it,\n-either verbatim or with modifications and/or translated into another\n-language.  (Hereinafter, translation is included without limitation in\n-the term "modification".)  Each licensee is addressed as "you".\n-\n-Activities other than copying, distribution and modification are not\n-covered by this License; they are outside its scope.  The act of\n-running the'..b'E STATED IN WRITING THE COPYRIGHT HOLDERS AND/OR OTHER PARTIES\n-PROVIDE THE PROGRAM "AS IS" WITHOUT WARRANTY OF ANY KIND, EITHER EXPRESSED\n-OR IMPLIED, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF\n-MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE.  THE ENTIRE RISK AS\n-TO THE QUALITY AND PERFORMANCE OF THE PROGRAM IS WITH YOU.  SHOULD THE\n-PROGRAM PROVE DEFECTIVE, YOU ASSUME THE COST OF ALL NECESSARY SERVICING,\n-REPAIR OR CORRECTION.\n-\n-  12. 
IN NO EVENT UNLESS REQUIRED BY APPLICABLE LAW OR AGREED TO IN WRITING\n-WILL ANY COPYRIGHT HOLDER, OR ANY OTHER PARTY WHO MAY MODIFY AND/OR\n-REDISTRIBUTE THE PROGRAM AS PERMITTED ABOVE, BE LIABLE TO YOU FOR DAMAGES,\n-INCLUDING ANY GENERAL, SPECIAL, INCIDENTAL OR CONSEQUENTIAL DAMAGES ARISING\n-OUT OF THE USE OR INABILITY TO USE THE PROGRAM (INCLUDING BUT NOT LIMITED\n-TO LOSS OF DATA OR DATA BEING RENDERED INACCURATE OR LOSSES SUSTAINED BY\n-YOU OR THIRD PARTIES OR A FAILURE OF THE PROGRAM TO OPERATE WITH ANY OTHER\n-PROGRAMS), EVEN IF SUCH HOLDER OR OTHER PARTY HAS BEEN ADVISED OF THE\n-POSSIBILITY OF SUCH DAMAGES.\n-\n-                     END OF TERMS AND CONDITIONS\n-\n-            How to Apply These Terms to Your New Programs\n-\n-  If you develop a new program, and you want it to be of the greatest\n-possible use to the public, the best way to achieve this is to make it\n-free software which everyone can redistribute and change under these terms.\n-\n-  To do so, attach the following notices to the program.  It is safest\n-to attach them to the start of each source file to most effectively\n-convey the exclusion of warranty; and each file should have at least\n-the "copyright" line and a pointer to where the full notice is found.\n-\n-    {description}\n-    Copyright (C) {year}  {fullname}\n-\n-    This program is free software; you can redistribute it and/or modify\n-    it under the terms of the GNU General Public License as published by\n-    the Free Software Foundation; either version 2 of the License, or\n-    (at your option) any later version.\n-\n-    This program is distributed in the hope that it will be useful,\n-    but WITHOUT ANY WARRANTY; without even the implied warranty of\n-    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  
See the\n-    GNU General Public License for more details.\n-\n-    You should have received a copy of the GNU General Public License along\n-    with this program; if not, write to the Free Software Foundation, Inc.,\n-    51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.\n-\n-Also add information on how to contact you by electronic and paper mail.\n-\n-If the program is interactive, make it output a short notice like this\n-when it starts in an interactive mode:\n-\n-    Gnomovision version 69, Copyright (C) year name of author\n-    Gnomovision comes with ABSOLUTELY NO WARRANTY; for details type `show w\'.\n-    This is free software, and you are welcome to redistribute it\n-    under certain conditions; type `show c\' for details.\n-\n-The hypothetical commands `show w\' and `show c\' should show the appropriate\n-parts of the General Public License.  Of course, the commands you use may\n-be called something other than `show w\' and `show c\'; they could even be\n-mouse-clicks or menu items--whatever suits your program.\n-\n-You should also get your employer (if you work as a programmer) or your\n-school, if any, to sign a "copyright disclaimer" for the program, if\n-necessary.  Here is a sample; alter the names:\n-\n-  Yoyodyne, Inc., hereby disclaims all copyright interest in the program\n-  `Gnomovision\' (which makes passes at compilers) written by James Hacker.\n-\n-  {signature of Ty Coon}, 1 April 1989\n-  Ty Coon, President of Vice\n-\n-This General Public License does not permit incorporating your program into\n-proprietary programs.  If your program is a subroutine library, you may\n-consider it more useful to permit linking proprietary applications with the\n-library.  If this is what you want to do, use the GNU Lesser General\n-Public License instead of this License.\n'
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/MANIFEST.in
--- a/SeqSero2S/MANIFEST.in Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
@@ -1,25 +0,0 @@
-include LICENSE
-include README.md
-include MANIFEST.in
-include version.py
-include setup.py
-include seqsero2s_db/antigens.pickle
-include seqsero2s_db/H_and_O_and_specific_genes.fasta
-include seqsero2s_db/invA_mers_dict
-include seqsero2s_db/special.pickle
-include seqsero2s_db/mlst.pickle
-include seqsero2s_db/kmer/salmonella_35.txt
-include seqsero2s_db/kmer/salmonella_aroC.tfa
-include seqsero2s_db/kmer/salmonella_config.txt
-include seqsero2s_db/kmer/salmonella_dnaN.tfa
-include seqsero2s_db/kmer/salmonella_hemD.tfa
-include seqsero2s_db/kmer/salmonella_hisD.tfa
-include seqsero2s_db/kmer/salmonella.log
-include seqsero2s_db/kmer/salmonella_profile.txt
-include seqsero2s_db/kmer/salmonella_purE.tfa
-include seqsero2s_db/kmer/salmonella_sucA.tfa
-include seqsero2s_db/kmer/salmonella_thrA.tfa
-include seqsero2s_db/kmer/salmonella_weight.txt
-include bin/deinterleave_fastq.sh
-include bin/Initial_Conditions_SS2.py
-include bin/Initial_Conditions_SS2S.py
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/README.md
--- a/SeqSero2S/README.md Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
@@ -1,151 +0,0 @@
-# SeqSero2S
-
-Salmonella serotype prediction from genome sequencing data.
-
-Online version: http://www.denglab.info/SeqSero2
-
-# Updates since SS2 v1.2.1
-1. Convert the sequences of the following alleles to their reverse complement sequences in the SeqSero2 database.
-```
--fliC_b_Wien_CDC_b,d,j__1488\
--fliC_d_from-II-48:d:z6_SRR1168371__1521\
--fliC_a_Salmonella.enterica_from-cdc-Stk2184_other.a__1488
--fliC_l,v_from-Nchanga_SRR1153349__1503
--fliC_l,z13,z28_Salmonella.enterica_from-CDC_2011K-0215_l,v__1506
--fljB_1,7_Salmonella.enterica_from-cdc_Stk1415_1__1521
--fljB_1,5_from-cdc_Stk2184_1__1521
--fljB_1,5_from-Infantis-micro-assembly_SRR1106258_1__1521
--fljB_z6_from-II-48:d:z6_SRR1168371__1503
-```
-2. Delete the following alleles from the SeqSero2 database because of the existence of mutations.
-```
--fliC_y_Bareillystr_AOZP01000027_other.y__1508
--fliC_d_Muenchenstr_ARYW01000085_b,d,j__1496
--fliC_d_Muenchenstr_ARYX01000110_b,d,j__1488
--fliC_g,m_Enteritidisstr_ALHD01000038_g,m__1507
--fljB_1,2_Newportstr_AYDZ01000021_1__1510
-```
-3. Add a fliC 1,5,7 allele and a fliC 1,2,7 allele into the SeqSero2 database.
-```
--fliC_1,5,7_Salmonella.enterica_from-cdc-Stk1778_1,5,7_1521
--fliC_1,2,7_Salmonella.enterica_from-cdc-Stk2293_1,2,7_1521
-```
-4. Delete the O54 allele
-```
--O-54_wbbF__1380
-```
-5. Fixed the bug that caused the misidentification of O9 and O2 by the micro-assembly workflow
-6. Update serotype names based on the simplified KWS scheme
-7. Remove the 9,46,27 allele
-```
--O-9,46,27_partial_wzy__1019
-```
-8. Remove two fljB_1,2 alleles
-```
--fljB_1,2_from-Brazzaville_SRR2058145_1__1521
--fljB_1,2_Salmonella.enterica_1,4,5,12:i:1,2,7_AY353272_1__1521
-```
-9. Run 7-gene MLST analysis using stringMLST/mlst
-
-# Introduction 
-SeqSero2S is a pipeline for Salmonella serotype prediction from raw sequencing reads or genome assemblies
-
-# Dependencies 
-SeqSero2S has three workflows:
-
-(A) Allele micro-assembly (default). This workflow takes raw reads as input and performs targeted assembly of serotype determinant alleles. Assembled alleles are used to predict serotype and flag potential inter-serotype contamination in sequencing data (i.e., presence of reads from multiple serotypes due to, for example, cross or carryover contamination during sequencing). 
-
-Allele micro-assembly workflow depends on:
-
-1. Python 3;
-2. Biopython 1.73;
-3. [Burrows-Wheeler Aligner v0.7.12](http://sourceforge.net/projects/bio-bwa/files/);
-4. [Samtools v1.8](http://sourceforge.net/projects/samtools/files/samtools/);
-5. [NCBI BLAST v2.2.28+](https://blast.ncbi.nlm.nih.gov/Blast.cgi?PAGE_TYPE=BlastDocs&DOC_TYPE=Download);
-6. [SRA Toolkit v2.8.0](http://www.ncbi.nlm.nih.gov/Traces/sra/sra.cgi?cmd=show&f=software&m=software&s=software);
-7. [SPAdes v3.9.0](http://bioinf.spbau.ru/spades);
-8. [Bedtools v2.17.0](http://bedtools.readthedocs.io/en/latest/);
-9. [SalmID v0.11](https://github.com/hcdenbakker/SalmID);
-10. [stringMLST v0.6.3](https://github.com/jordanlab/stringMLST);
-
-(B) Raw reads k-mer. This workflow takes raw reads as input and performs rapid serotype prediction based on unique k-mers of serotype determinants. 
-
-Raw reads k-mer workflow (originally SeqSeroK) depends on:
-
-1. Python 3;
-2. [SRA Toolkit](http://www.ncbi.nlm.nih.gov/Traces/sra/sra.cgi?cmd=show&f=software&m=software&s=software) (optional, just used to fastq-dump sra files);
-3. [mlst v2.22.1](https://github.com/tseemann/mlst).
-
-
-(C) Genome assembly k-mer. This workflow takes genome assemblies as input and the rest of the workflow largely overlaps with the raw reads k-mer workflow
-
-# Installation
-### Git
-Install mlst and stringMLST first
-```
-conda install mlst
-```
-```
-pip install stringMLST
-```
-To install the SeqSero2S git repository locally:
-```
-git clone https://github.com/LSTUGA/SeqSero2S.git
-cd SeqSero2S
-python3 -m pip install --user .
-```
-
-# Executing the code 
-Make sure SeqSero2S and all of its dependency executables are on your PATH (e.g. by adding them in ~/.bashrc). Then run SeqSero2S.py to get detailed instructions.
-
-    Usage: SeqSero2S.py 
-
-    -m <string> (which workflow to apply, 'a'(raw reads allele micro-assembly), 'k'(raw reads and genome assembly k-mer), default=a)
-
-    -t <string> (input data type, '1' for interleaved paired-end reads, '2' for separated paired-end reads, '3' for single reads, '4' for genome assembly, '5' for nanopore reads (fasta/fastq))
-
-    -i <file> (/path/to/input/file)
-
-    -p <int> (number of threads for allele mode, if p >4, only 4 threads will be used for assembly since the amount of extracted reads is small, default=1) 
-
-    -b <string> (algorithms for bwa mapping for allele mode; 'mem' for mem, 'sam' for samse/sampe; default=mem; optional; for now we only optimized for default "mem" mode)
-
-    -d <string> (output directory name, if not set, the output directory would be 'SeqSero_result_'+time stamp+one random number)
-
-    -c <flag> (if '-c' was flagged, SeqSero2S will only output serotype prediction without the directory containing log files)
-    
-    -n <string> (optional, to specify a sample name in the report output)
-    
-    -s <flag> (if '-s' was flagged, SeqSero2S will not output header in SeqSero_result.tsv)
-     
-    --check <flag> (use '--check' flag to check the required dependencies)
-    
-    -v, --version (show program's version number and exit)
-
-
-# Examples
-Allele mode:
-
-    # Allele workflow ("-m a", default), for separated paired-end raw reads ("-t 2"), use 10 threads in mapping and assembly ("-p 10")
-    SeqSero2S.py -p 10 -t 2 -i R1.fastq.gz R2.fastq.gz
-
-K-mer mode:
-
-    # Raw reads k-mer ("-m k"), for separated paired-end raw reads ("-t 2")
-    SeqSero2S.py -m k -t 2 -i R1.fastq.gz R2.fastq.gz
-
-    # Genome assembly k-mer ("-t 4", genome assemblies only predicted by the k-mer workflow, "-m k")
-    SeqSero2S.py -m k -t 4 -i assembly.fasta
-
-# Output 
-Upon executing the command, a directory named 'SeqSero_result_Time_your_run' will be created. Your result will be stored in 'SeqSero_result.txt' in that directory. The assembled alleles can also be found in that directory when using "-m a" (allele mode).
-
-
-# Citation
-Zhang S, Den-Bakker HC, Li S, Dinsmore BA, Lane C, Lauer AC, Fields PI, Deng X. 
-SeqSero2: rapid and improved Salmonella serotype determination using whole genome sequencing data.
-**Appl Environ Microbiology. 2019 Sep; 85(23):e01746-19.** [PMID: 31540993](https://aem.asm.org/content/early/2019/09/17/AEM.01746-19.long) 
-
-Zhang S, Yin Y, Jones MB, Zhang Z, Deatherage Kaiser BL, Dinsmore BA, Fitzgerald C, Fields PI, Deng X.  
-Salmonella serotype determination utilizing high-throughput genome sequencing data.  
-**J Clin Microbiol. 2015 May;53(5):1685-92.** [PMID: 25762776](http://jcm.asm.org/content/early/2015/03/05/JCM.00323-15)
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/bin/Initial_Conditions_SS2.py
--- a/SeqSero2S/bin/Initial_Conditions_SS2.py Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
b"@@ -1,109 +0,0 @@\n-#!/usr/bin/env python\n-\n-subs=['II', 'I', 'I', 'II', 'I', 'II', 'II', 'I', 'II', 'II', 'II', 'II', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'I', 'II', 'II', 'II', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'II', 'II', 'II', 'II', 'II', 'II', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'VI', 'II', 'I', 'VI', 'I', 'I', 'I', 'II', 'I', 'I', 'II', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'II', 'II', 'I', 'I', 'I', 'I', 'II', 'I', 'IV', 'I', 'I', 'II', 'I', 'I', 'IV', 'I', 'II', 'I', 'I', 'II', 'I', 'I', 'II', 'I', 'I', 'IV', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'II', 'I', 'I', 'II', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'VI', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'VI', 'II', 'I', 'I', 'I', 'II', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'II', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'II', 'I', 'II', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'II', 'I', 'bongori', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'II', 'IV', 'II', 'I', 'I', 'I', 'I', 'I', 'VI', 'I', 'I', 'I', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'IIIb', 'I', 'II', 'I', 'I', 'I', 'I', 'VI', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'VI', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'II', 'II', 'I', 'II', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'IV', 'I', 'II', 'I', 'II', 'II', 'II', 'I', 'II', 'II', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 
'I', 'I', 'I', 'II', 'I', 'I', 'IIIb', 'I', 'I', 'IIIb', 'IIIb', 'IIIb', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'IIIb', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'IIIb', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'IIIb', 'IIIb', 'IIIb', 'I', 'I', 'I', 'I', 'IIIb', 'IIIb', 'I', 'I', 'I', 'II', 'IIIb', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'IIIb', 'IIIb', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'IIIb', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'II', 'I', 'I', 'I', 'II', 'I', 'I', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'II', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'II', 'I', 'II', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'II', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'IV', 'II', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'II', 'II', 'II', 'I', 'II', 'I', 'I', 'II', 'II', 'I', 'I', 'II', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'bongori', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 
'I', 'I"..b"','30','28','44','8','16','18','7','7','43','47','6,14','13','13','42','4','44','9,46','3,10','13','13','13','16','30','9','40','40','44','48','48','52','57','58','66','40','40','7','7','40','7','41','41','43','41','38','4','4','42','42','42','18','8','28','18','18','18','21','21','21','40','28','39','30','35','35','38','38','43','28','57','43','51','51','7','53','53','50','56','7','7','7','59','62','63','7','54','47','43','44','44','44','44','44','50','45','41','47','47','47','47','48','48','45','16','6,14','1,3,19','11','11','3,10','8','11','6,14','16','16','16','11','3,10','9,46','13','8','13','6,14','17','8','9','13','8','8','13','53','41','48','56','17','50','44','17','44','1,3,19','43','41','42','41','11','42','42','43','48','8','8','53','53','9','51','50','50','9,46','9,46,27','7','44','48','48','47','3,10','3,10','45','45','7','7','9,46','16','6,14','6,14','40','38','40','35','40','35','4','44','30','28','16','18','13','13','21','21','18','16','17','45','63','62','35','18','21','48','16','44','51','48','50','50','8','40','44','43','11','41','40','60','4','40','9,46','7','4','8','11','7','9','42','48','66','7','3,10','50','57','6,14','16','43','9','40','7','16','47','7','52','58','53','53','65','65','65','59','58','61','41','16','61','61','60','61','60','60','60','65','47','48','35','50','47','47','48','47','43','35','35','6,14','6,14','38','38','47','42','50','35','50','38','47','42','58','30','9','47','16','42','40','7','8','38','48','21','66','3,10','18','48','40','66','40','4','7']\n-\n-remove_list=['Schleissheim', 'Sendai', 'Blegdam', 'Naestved', 'Rostock', 'Moscow', 'Antarctica', 'Rosenberg', 'Chittagong', 'Bilu', 'Dessau', 'Cannonhill', 'Ilugun']\n-\n-rename_dict={'Nitra': 'Enteritidis',\n- 'Kiel': 'Dublin',\n- 'Koessen': 'Panama',\n- 'Phaliron': 'Kalumburu',\n- 'Istanbul': 'Hadar',\n- 'Haardt': 'Blockley',\n- 'Ferruch': 'Kottbus',\n- 'Sanga': 'Eboko',\n- 'Pakistan': 'Litchfield',\n- 'Bellevue': 'Lezennes',\n- 'Sunnycove': 'Daarle',\n- 
'Noya': 'Akanji',\n- 'Virginia': 'Muenchen',\n- 'Djelfa': 'Skansen',\n- 'Konstanz': 'Gatuni',\n- 'Bardo': 'Newport',\n- 'Houston': 'Panama',\n- 'Martonos': 'Finkenwerder',\n- 'Midway': 'Florida',\n- 'Lindern': 'Charity',\n- 'Bahrenfeld': 'Onderstepoort',\n- 'Schalkwijk': 'Moussoro',\n- 'Amberg': 'Boecker',\n- 'Madelia': 'Carrau',\n- 'Soahanina': 'Sundsvall',\n- 'Stafford': 'Poano',\n- 'Chichiri': 'Uzaramo',\n- 'II 16:g,[m],[s],t:[e,n,x]': 'II 16:g,[m],[s],t:[1,5]',\n- 'Hindmarsh':'Bovismorbificans',\n- 'Yovokome': 'Manhattan'}\n-\n- #potential merge for O22 and O23\n- #'Ibadan': 'Mississippi',\n- #'Bracknell': 'Oudwijk',\n- #'Vaertan': 'Ullevi',\n- #'Bahati': 'Durham',\n- #'Wichita': 'Friedenau',\n- #'Diguel': 'Telelkebir',\n- #'II 13,22:l,z28:1,5': 'II 13,23:l,z28:1,5',\n- #'Washington': 'Kintambo',\n- #'II 13,23:m,t:z42': 'II 13,22:m,t:z42:z39',\n- #'Serenli': 'Winslow',\n- #'Farmsen': 'Poona',\n- #'Durance': 'Ivrysurseine',\n- #'Agoueve': 'Cubana',\n- #'II 13,23:z29:1,5': 'II 13,22:z29:1,5',\n- #'II 13,23:z29:e,n,x': 'II 13,22:z29:e,n,x',\n- #'Picpus': 'Mampong',\n- #'Anna': 'Nimes',\n- #'Fanti': 'Leiden',\n- #'Ried': 'Ajiobo',\n-\n- #potential O68 list\n- #'Djelfa': 'Skansen',\n- #'Korbol': 'Nagoya',\n- #'Sanga': 'Eboko',\n- #'Konstanz': 'Gatuni',\n- #'Presov': 'Shipley',\n- #'Heistopdenberg': 'Bukuru',\n- #'Tounouma': 'Banalia',\n- #'Gaillac': 'Utah',\n- #'Santiago': 'Belem',\n- #'Virginia': 'Muenchen',\n- #'Yovokome': 'Manhattan',\n- #'Portanigra': 'Dunkwa',\n- #'Bardo': 'Newport',\n- #'Ferruch': 'Kottbus',\n- #'Alminko': 'Nanergou',\n- #'Bargny': 'Takoradi',\n- #'Magherafelt': 'Cyprus',\n- #'Haardt': 'Blockley',\n- #'Pakistan': 'Litchfield',\n- #'Yokoe': 'Bassa',\n- #'Noya': 'Akanji',\n- #'Lamphun': 'Giza',\n- #'Tananarive': 'Brunei',\n- #'Inchpark': 'Alagbon',\n- #'Sunnycove': 'Daarle',\n- #'Sindelfingen': 'Benue',\n- #'Phaliron': 'Kalumburu',\n- #'Bazenheid': 'Zerifin',\n- #'Paris': 'Mapo',\n- #'Istanbul': 'Hadar',\n- #'Chomedey': 'Glostrup',\n- #'Wippra': 
'Molade',\n- #'Uno': 'Tamale',\n- #'Kolda': 'Yarm',\n- #'Bellevue': 'Lezennes',\n- #'Albany':'Duesseldorf'\n"
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/bin/Initial_Conditions_SS2S.py
--- a/SeqSero2S/bin/Initial_Conditions_SS2S.py Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
b"@@ -1,110 +0,0 @@\n-#!/usr/bin/env python\n-\n-subs=['II', 'I', 'I', 'II', 'I', 'II', 'II', 'I', 'II', 'II', 'II', 'II', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'IIIb', 'I', 'II', 'II', 'II', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'II', 'II', 'II', 'II', 'II', 'II', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'VI', 'II', 'I', 'VI', 'I', 'I', 'I', 'II', 'I', 'I', 'II', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'II', 'II', 'I', 'I', 'I', 'I', 'II', 'I', 'IV', 'I', 'I', 'II', 'I', 'I', 'IV', 'I', 'II', 'I', 'I', 'II', 'I', 'I', 'II', 'I', 'I', 'IV', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'II', 'I', 'I', 'II', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'VI', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'VI', 'II', 'I', 'I', 'I', 'II', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'II', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'II', 'I', 'II', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'II', 'I', 'bongori', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'II', 'IV', 'II', 'I', 'I', 'I', 'I', 'I', 'VI', 'I', 'I', 'I', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'IIIb', 'I', 'II', 'I', 'I', 'I', 'I', 'VI', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'VI', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'II', 'II', 'I', 'II', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'IV', 'I', 'II', 'I', 'II', 'II', 'II', 'I', 'II', 'II', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 
'I', 'I', 'I', 'II', 'I', 'I', 'IIIb', 'I', 'I', 'IIIb', 'IIIb', 'IIIb', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'IIIb', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'IIIb', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'IIIb', 'IIIb', 'IIIb', 'I', 'I', 'I', 'I', 'IIIb', 'IIIb', 'I', 'I', 'I', 'II', 'IIIb', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'IIIb', 'IIIb', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'IIIb', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'II', 'I', 'I', 'I', 'II', 'I', 'I', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'II', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'II', 'I', 'II', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'II', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'IV', 'II', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'II', 'II', 'II', 'I', 'II', 'I', 'I', 'II', 'II', 'I', 'I', 'II', 'II', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'II', 'bongori', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 'I', 
'I', 'I"..b"0:m,t:z42', 'II 40:z:z42', 'II [1],40:z42:1,6', 'II 43:b:z42', 'II 43:d:z42', 'II 43:z29:z42', 'II 43:z42:[1,5,7]', 'II 44:g,t:z42', 'II [1],44:m,t:z42', 'II 45:z29:z42', 'II 50:l,z28:z42', 'II 50:z42:1,7', 'II 53:d:z42', 'II 57:a:z42', 'II 57:z29:z42', 'II 57:z42:1,6:z53', 'II 3,10:z38:z42', 'II 1,6,14:z42:1,6', 'IIIb 18:(k):z54', 'IIIb 47:l,v:z57', 'IIIb 50:l,v:z57', 'IIIb 38:(k):z55', 'IIIb 21:l,v:z57', 'IIIb 48:k:z57', 'IIIb 59:z10:z57', 'IIIb 42:z57:1,5', 'Aesch', 'IIIb 38:z61:[z53]', 'Oakey', 'Aarhus', 'Franken', 'IIIb 42:z10:z67', 'VI 50:l,v:z67', 'IIIb 53:r:z68', 'Delmenhorst', 'II 3,15:z87:e,n,x,z15', 'VI 6,14:l,v:z88', 'Mygdal', 'II 1,9,12,46,27:a:z6', 'II 1,9,12,46,27:b:z39', 'II 1,9,12,46,27:c:z39', 'II 9,12,46,27:g,t:e,n,x', 'II 1,9,12,46,27:l,z13,z28:z39', 'II 1,9,12,46,27:y:z39', 'II 1,9,12,46,27:z10:1,5', 'II 1,9,12,46,27:z10:e,n,x', 'II 1,9,12,46,27:z10:z39', 'II 1,9,12,46,27:z4,z24:1,5', 'Tonev', 'Winnipeg', 'Rossleben', 'Borreze', 'Uccle', 'Poeseldorf', 'Ochsenwerder', 'Newholland', 'Czernyring', 'Steinwerder', 'Canton', 'Barry', 'Mundubbera', 'Yerba', 'Sendai', 'Abortusequi']\n-\n-rename_dict={\n-    'Nitra': 'Enteritidis',\n-    'Kiel': 'Dublin',\n-    'Koessen': 'Panama',\n-    'Phaliron': 'Kalumburu',\n-    'Istanbul': 'Hadar',\n-    'Haardt': 'Blockley',\n-    'Ferruch': 'Kottbus',\n-    'Eboko': 'Sanga',\n-    'Pakistan': 'Litchfield',\n-    'Bellevue': 'Lezennes',\n-    'Daarle': 'Sunnycove',\n-    'Noya': 'Akanji',\n-    'Virginia': 'Muenchen',\n-    'Skansen': 'Djelfa',\n-    'Konstanz': 'Gatuni',\n-    'Bardo': 'Newport',\n-    'Houston': 'Panama',\n-    'Martonos': 'Finkenwerder',\n-    'Midway': 'Florida',\n-    'Lindern': 'Charity',\n-    'Bahrenfeld': 'Onderstepoort',\n-    'Moussoro': 'Schalkwijk',\n-    'Amberg': 'Boecker',\n-    'Madelia': 'Carrau',\n-    'Soahanina': 'Sundsvall',\n-    'Stafford': 'Poano',\n-    'Chichiri': 'Uzaramo',\n-    'Hindmarsh':'Bovismorbificans',\n-    'Yovokome': 'Manhattan',\n-    ## 
SS2S\n-    'Fulica': 'I 4:a:-',\n-    'Korbol': 'Nagoya',\n-    'Presov': 'Shipley',\n-    'Heistopdenberg': 'Bukuru',\n-    'Tounouma': 'Banalia',\n-    'Gaillac': 'Utah',\n-    'Santiago': 'Belem',\n-    'Portanigra': 'Dunkwa',\n-    'Alminko': 'Nanergou',\n-    'Bargny': 'Takoradi',\n-    'Magherafelt': 'Cyprus',\n-    'Bassa': 'Yokoe',\n-    'Lamphun': 'Giza',\n-    'Brunei': 'Tananarive',\n-    'Inchpark': 'Alagbon',\n-    'Sindelfingen': 'Benue',\n-    'Bazenheid': 'Zerifin',\n-    'Paris': 'Mapo',\n-    'Chomedey': 'Glostrup',\n-    'Wippra': 'Molade',\n-    'Uno': 'Tamale',\n-    'Kolda': 'Yarm',\n-    'Duesseldorf': 'Albany',\n-    'Rosenberg': 'Enteritidis',\n-    'Blegdam': 'Enteritidis',\n-    'Moscow': 'Enteritidis',\n-    'Antarctica': 'Enteritidis',\n-    #'Chincol': 'Emek',\n-    'Dessau': 'Senftenberg',\n-    'Naestved': 'Dublin',\n-    'Rostock': 'Dublin',\n-    ##update names\n-    'IIIb 6,7:(k):z': 'IIIb 7:k:z',\n-    'IIIb 16:(k):e,n,x,z15': 'IIIb 16:k:e,n,x,z15',\n-    'IIIb 60:i:[e,n,x,z15]': 'IIIb 60:i:e,n,x,z15',\n-    'IIIb 60:i:[z]': 'IIIb 60:i:z',\n-    'IIIb 60:i:[z35]': 'IIIb 60:i:z35',\n-    'II [1],13,22:g,m,t:[1,5]': 'II 13,22:g,m,t:1,5',\n-    'II 6,7:z29:[z42]': 'II 7:z29:-',\n-    'II [1],13,22:g,t:[1,5]': 'II 13,22:g,t:1,5',\n-    'II 16:m,t:[z42]': 'II 16:m,t:-',\n-    'II 17:g,t:[e,n,x,z15]': 'II 17:g,t:e,n,x,z15',\n-    'VI 1,6,14,25:z10:1,(2),7': 'VI 6,14:z10:1,2,7',\n-    'II 13,22:m,t:z42:z39': 'II 13,22:m,t:z39',\n-}\n-\n-#potential merge for O22 and O23\n-    #'Ibadan': 'Mississippi',\n-    #'Bracknell': 'Oudwijk',\n-    #'Vaertan': 'Ullevi',\n-    #'Bahati': 'Durham',\n-    #'Wichita': 'Friedenau',\n-    #'Diguel': 'Telelkebir',\n-    #'II 13,22:l,z28:1,5': 'II 13,23:l,z28:1,5',\n-    #'Washington': 'Kintambo',\n-    #'Winslow': 'Serenli',\n-    #'Farmsen': 'Poona',\n-    #'Ivrysurseine': 'Durance',\n-    #'Agoueve': 'Cubana',\n-    #'II [1],13,23:z29:1,5': 'II 13,22:z29:1,5',\n-    #'II [1],13,23:z29:e,n,x': 'II 
13,22:z29:e,n,x',\n-    #'Picpus': 'Mampong',\n-    #'Nimes': 'Anna',\n-    #'Fanti': 'Leiden',\n-    #'Ried': 'Ajiobo',\n"
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/bin/SeqSero2S.py
--- a/SeqSero2S/bin/SeqSero2S.py Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
b'@@ -1,1723 +0,0 @@\n-#!/usr/bin/env python3\n-\n-import sys\n-import time\n-import random\n-import os\n-import subprocess\n-import gzip\n-import io\n-import pickle\n-import argparse\n-import itertools\n-import json\n-from distutils.version import LooseVersion\n-from distutils.spawn import find_executable\n-sys.path.insert(1,sys.path[0]+\'/..\')\n-\n-__version__ = "1.1.4"\n-\n-### SeqSero Kmer\n-def parse_args():\n-    "Parse the input arguments, use \'-h\' for help."\n-    parser = argparse.ArgumentParser(usage=\'SeqSero2S.py -t <data_type> -m <mode> -i <input_data> [-d <output_directory>] [-p <number of threads>] [-b <BWA_algorithm>]\\n\\nDevelopper: Shaokang Zhang (zskzsk@uga.edu), Hendrik C Den-Bakker (Hendrik.DenBakker@uga.edu) and Xiangyu Deng (xdeng@uga.edu)\\n\\nContact email:seqsero@gmail.com\\n\\n\')#add "-m <data_type>" in future\n-    parser.add_argument("-i",nargs="+",help="<string>: path/to/input_data",type=os.path.abspath)  ### add \'type=os.path.abspath\' to generate absolute path of input data.\n-    parser.add_argument("-t",choices=[\'1\',\'2\',\'3\',\'4\',\'5\'],help="<int>: \'1\' for interleaved paired-end reads, \'2\' for separated paired-end reads, \'3\' for single reads, \'4\' for genome assembly, \'5\' for nanopore reads (fasta/fastq)")\n-    parser.add_argument("-b",choices=[\'sam\',\'mem\'],default="mem",help="<string>: algorithms for bwa mapping for allele mode; \'mem\' for mem, \'sam\' for samse/sampe; default=mem; optional; for now we only optimized for default \'mem\' mode")\n-    parser.add_argument("-p",default="1",help="<int>: number of threads for allele mode, if p >4, only 4 threads will be used for assembly since the amount of extracted reads is small, default=1")\n-    parser.add_argument("-m",choices=[\'k\',\'a\'],default="a",help="<string>: which workflow to apply, \'a\'(raw reads allele micro-assembly), \'k\'(raw reads and genome assembly k-mer), default=a")\n-    parser.add_argument("-n",help="<string>: optional, to specify 
a sample name in the report output")\n-    parser.add_argument("-d",help="<string>: optional, to specify an output directory name, if not set, the output directory would be \'SeqSero_result_\'+time stamp+one random number")\n-    parser.add_argument("-c",action="store_true",help="<flag>: if \'-c\' was flagged, SeqSero2S will only output serotype prediction without the directory containing log files")\n-    parser.add_argument("-s",action="store_true",help="<flag>: if \'-s\' was flagged, SeqSero2S will not output header in SeqSero_result.tsv")\n-    parser.add_argument("--phred_offset",choices=[\'33\',\'64\',\'auto\'],default=\'auto\',help="<33|64|auto>: offset for FASTQ file quality scores, default=auto")\n-    parser.add_argument("--check",action="store_true",help="<flag>: use \'--check\' flag to check the required dependencies")\n-    parser.add_argument(\'-v\', \'--version\', action=\'version\', version=f"%(prog)s {__version__}")\n-    return parser.parse_args()\n-\n-### check paths of dependencies\n-check_dependencies = parse_args().check\n-dependencies = [\'bwa\',\'samtools\',\'blastn\',\'fastq-dump\',\'spades.py\',\'bedtools\',\'SalmID.py\',\'mlst\',\'stringMLST.py\']\n-if check_dependencies:\n-    for item in dependencies:\n-        ext_path = find_executable(item)\n-        if ext_path is not None:\n-            print ("Using "+item+" - "+ext_path)\n-        else:\n-            print ("ERROR: can not find "+item+" in PATH")\n-    sys.exit()\n-### end of --check\n-\n-def reverse_complement(sequence):\n-    complement = {\n-        \'A\': \'T\',\n-        \'C\': \'G\',\n-        \'G\': \'C\',\n-        \'T\': \'A\',\n-        \'N\': \'N\',\n-        \'M\': \'K\',\n-        \'R\': \'Y\',\n-        \'W\': \'W\',\n-        \'S\': \'S\',\n-        \'Y\': \'R\',\n-        \'K\': \'M\',\n-        \'V\': \'B\',\n-        \'H\': \'D\',\n-        \'D\': \'H\',\n-        \'B\': \'V\'\n-    }\n-    return "".join(complement[base] for base in reversed(sequence))\n-\n-def 
mlst(assembly):\n-    subprocess.check_call("mlst -q --json mlst.json --scheme senterica_achtman_2 "+assembly+" >> data_log.txt 2>&1",shell=True)\n-    f = open("mlst.json",\'r\')\n-    mlst_result = json.load(f)\n-    f.close()\n-'..b'"\\n"+\n-                         "O antigen prediction:\\t"+O_choice+"\\n"+\n-                         "H1 antigen prediction(fliC):\\t"+highest_fliC+"\\n"+\n-                         "H2 antigen prediction(fljB):\\t"+highest_fljB+"\\n"+\n-                         "Predicted identification:\\t"+subspecies_ID_dir[ssp_pointer]+"\\n"+\n-                         "Predicted antigenic profile:\\t"+predict_form+"\\n"+\n-                         "Predicted serotype:\\t"+predict_sero+"\\n"+\n-                         "Predicted serotype (SeqSero2 v1.3.2):\\t"+predict_sero_ss2+"\\n"+\n-                         note+star_line+claim+antigen_note+"\\n")#+##\n-          tsv_file.write(make_dir+"\\t"+input_file+"\\t"+O_choice+"\\t"+highest_fliC+"\\t"+highest_fljB+"\\t"+subspecies_ID_dir[ssp_pointer]+"\\t"+predict_form+"\\t"+predict_sero+"\\t"+predict_sero_ss2+"\\t"+star_line+claim+antigen_note+"\\t"+st+"\\n")\n-        else:\n-          new_file.write("Output directory:\\t"+make_dir+"\\n"+\n-                         "Input files:\\t"+input_file+"\\n"+\n-                         "O antigen prediction:\\t"+O_choice+"\\n"+\n-                         "H1 antigen prediction(fliC):\\t"+highest_fliC+"\\n"+\n-                         "H2 antigen prediction(fljB):\\t"+highest_fljB+"\\n"+\n-                         "Predicted identification:\\t"+subspecies_ID_dir[ssp_pointer]+"\\n"+\n-                         "Predicted antigenic profile:\\t"+predict_form+"\\n"+\n-                         "Predicted serotype:\\t"+subspecies+\' \'+predict_form+"\\n"+ # add serotype output for "N/A" prediction, subspecies\n-                         "Predicted serotype (SeqSero2 v1.3.2):\\t"+subspecies+\' \'+predict_form_ss2+"\\n"+\n-                         
note+NA_note+star_line+claim+antigen_note+"\\n")#+##\n-          tsv_file.write(make_dir+"\\t"+input_file+"\\t"+O_choice+"\\t"+highest_fliC+"\\t"+highest_fljB+"\\t"+subspecies_ID_dir[ssp_pointer]+"\\t"+predict_form+"\\t"+subspecies+\' \'+predict_form+"\\t"+subspecies+\' \'+predict_form_ss2+"\\t"+NA_note+star_line+claim+antigen_note+"\\t"+st+"\\n")\n-        ###MLST\n-        new_file.write("Sequence type:\\t"+st+"\\n"+\n-                       "Number of ST"+st+" strains in EnteroBase:\\t"+st_count+"\\n"+\n-                       "\\n".join([k+":\\t"+v for k,v in sorted_alleles]))\n-        ###\n-        new_file.close()\n-        tsv_file.close()\n-      if "N/A" not in predict_sero:\n-        print("Output directory:\\t"+make_dir+"\\n"+\n-              "Input files:\\t"+input_file+"\\n"+\n-              "O antigen prediction:\\t"+O_choice+"\\n"+\n-              "H1 antigen prediction(fliC):\\t"+highest_fliC+"\\n"+\n-              "H2 antigen prediction(fljB):\\t"+highest_fljB+"\\n"+\n-              "Predicted identification:\\t"+subspecies_ID_dir[ssp_pointer]+"\\n"+\n-              "Predicted antigenic profile:\\t"+predict_form+"\\n"+\n-              "Predicted serotype:\\t"+predict_sero+"\\n"+\n-              "Predicted serotype (SeqSero2 v1.3.2):\\t"+predict_sero_ss2+"\\n"+\n-              note+star_line+claim+antigen_note+"\\n")#+##\n-      else:\n-        print("Output directory:\\t"+make_dir+"\\n"+\n-              "Input files:\\t"+input_file+"\\n"+\n-              "O antigen prediction:\\t"+O_choice+"\\n"+\n-              "H1 antigen prediction(fliC):\\t"+highest_fliC+"\\n"+\n-              "H2 antigen prediction(fljB):\\t"+highest_fljB+"\\n"+\n-              "Predicted identification:\\t"+subspecies_ID_dir[ssp_pointer]+"\\n"+\n-              "Predicted antigenic profile:\\t"+predict_form+"\\n"+\n-              "Predicted serotype:\\t"+subspecies+\' \'+predict_form+"\\n"+ # add serotype output for "N/A" prediction, subspecies\n-              "Predicted 
serotype (SeqSero2 v1.3.2):\\t"+subspecies+\' \'+predict_form_ss2+"\\n"+\n-              note+NA_note+star_line+claim+antigen_note+"\\n")#+##\n-      ###MLST\n-      print("Sequence type: "+st)\n-      print("Number of ST"+st+" strains in EnteroBase: "+st_count)\n-      #print("Allele profile...")\n-      for k,v in sorted_alleles:\n-        print(k+\': \'+v)\n-      print(\'\\n\')\n-      ###\n-if __name__ == \'__main__\':\n-  main()\n'
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/bin/SeqSero2_update_kmer_database.py
--- a/SeqSero2S/bin/SeqSero2_update_kmer_database.py Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
@@ -1,113 +0,0 @@
-#!/usr/bin/env python3
-
-import argparse
-import os,subprocess
-import pickle
-
-### SeqSero Kmer
-def parse_args():
-    """Parse the command line and return the resulting namespace.
-
-    The parser defines no options of its own; it only carries the usage
-    text below, which argparse prints for '-h'.
-    """
-    usage_text = 'Just type "SeqSero2_update_kmer_database.py", it will update kmer database automatically'
-    cli = argparse.ArgumentParser(usage=usage_text)
-    return cli.parse_args()
-
-def reverse_complement(sequence):
-    """Return the reverse complement of an upper-case nucleotide string.
-
-    The lookup covers A, C, G, T, N and the ambiguity codes
-    M, R, W, S, Y, K, V, H, D, B. Any other character (lower-case
-    letters included) raises KeyError.
-    """
-    # Position i of the first string pairs with position i of the second.
-    pairing = dict(zip("ACGTNMRWSYKVHDB", "TGCANKYWSRMBDHV"))
-    flipped = []
-    for base in reversed(sequence):
-        flipped.append(pairing[base])
-    return "".join(flipped)
-
-def multifasta_dict(multifasta):
-    """Parse a multi-FASTA file into a ``{header: sequence}`` dictionary.
-
-    Args:
-        multifasta: path of the FASTA file to read.
-
-    Returns:
-        dict mapping each header (without the leading '>') to the
-        concatenation of its sequence lines. Lines are stripped and blank
-        lines ignored. A header that has no sequence lines gets no entry,
-        and sequence lines appearing before the first header are ignored.
-        If a header occurs more than once, the sequences of all its
-        records are concatenated in file order.
-    """
-    chunks = {}
-    current = None
-    # Single pass: avoids the per-header list.index() rescan, which was
-    # quadratic and always resolved a repeated header to its first record.
-    with open(multifasta, 'r') as handle:
-        for raw_line in handle:
-            line = raw_line.strip()
-            if not line:
-                continue
-            if line[0] == '>':
-                current = line[1:]
-            elif current is not None:
-                chunks.setdefault(current, []).append(line)
-    return {header: "".join(parts) for header, parts in chunks.items()}
-
-def createKmerDict_reads(list_of_strings, kmer):
-    """Count k-mers on both strands across a list of sequences.
-
-    Each string has surrounding newlines stripped; every window of length
-    ``kmer`` is upper-cased and counted once, and its reverse complement
-    is counted once as well. Returns a dict of k-mer -> count.
-    """
-    counts = {}
-    for entry in list_of_strings:
-        seq = entry.strip('\n')
-        last_start = len(seq) - kmer
-        start = 0
-        while start <= last_start:
-            forward = seq[start:start + kmer].upper()
-            # Reverse complement is computed before either count is updated.
-            for key in (forward, reverse_complement(forward)):
-                counts[key] = counts.get(key, 0) + 1
-            start += 1
-    return counts
-
-def multifasta_to_kmers_dict(multifasta):
-    """Map every FASTA header in ``multifasta`` to the set of its 27-mers.
-
-    The k-mers come from createKmerDict_reads, so both the forward k-mers
-    and their reverse complements are included.
-    """
-    kmer_sets = {}
-    for header, seq in multifasta_dict(multifasta).items():
-        kmer_sets[header] = set(createKmerDict_reads([seq], 27))
-    return kmer_sets
-
-def get_salmid_invA_database(ex_dir):
-  """Load the pickled invA k-mer dictionary from ``ex_dir``.
-
-  Args:
-    ex_dir: directory containing the file 'invA_mers_dict'.
-
-  Returns:
-    The unpickled object with its 'version' entry removed when present.
-
-  Raises:
-    OSError if the file cannot be opened; unpickling errors propagate.
-  """
-  # NOTE: pickle.load can execute arbitrary code from the file; only use
-  # this on a database file from a trusted source.
-  with open(ex_dir + '/invA_mers_dict', 'rb') as handle:
-    invA_dict = pickle.load(handle)
-  try:
-    del invA_dict['version']
-  except (KeyError, TypeError):
-    # Best effort: nothing to strip if there is no 'version' entry.
-    pass
-  return invA_dict
-
-def get_salmid_rpoB_database(ex_dir):
-  """Load the pickled rpoB k-mer dictionary from ``ex_dir``.
-
-  Args:
-    ex_dir: directory containing the file 'rpoB_mers_dict'.
-
-  Returns:
-    The unpickled object with its 'version' entry removed when present.
-
-  Raises:
-    OSError if the file cannot be opened; unpickling errors propagate.
-  """
-  # NOTE: pickle.load can execute arbitrary code from the file; only use
-  # this on a database file from a trusted source.
-  with open(ex_dir + '/rpoB_mers_dict', 'rb') as handle:
-    rpoB_dict = pickle.load(handle)
-  try:
-    del rpoB_dict['version']
-  except (KeyError, TypeError):
-    # Best effort: nothing to strip if there is no 'version' entry.
-    pass
-  return rpoB_dict
-
-def main():
-  """Rebuild 'antigens.pickle' from the FASTA library and the invA k-mers.
-
-  Builds the per-header k-mer sets from 'H_and_O_and_specific_genes.fasta',
-  merges in the invA dictionary, and pickles the result. All three files
-  are resolved in the directory that contains this script.
-  """
-  # Parsed only so that '-h' prints the usage text; no options are read.
-  parse_args()
-  # NOTE(review): inputs and output are looked up beside this script --
-  # confirm that is where the database files are installed.
-  ex_dir = os.path.dirname(os.path.realpath(__file__))
-  lib_dict = multifasta_to_kmers_dict(ex_dir + '/H_and_O_and_specific_genes.fasta')
-  invA_dict = get_salmid_invA_database(ex_dir)
-  #rpoB_dict=get_salmid_rpoB_database(ex_dir)
-  lib_dict_new = lib_dict.copy()
-  lib_dict_new.update(invA_dict)
-  #lib_dict_new.update(rpoB_dict)
-  # 'with' closes the output file even if pickling fails part-way.
-  with open(ex_dir + '/antigens.pickle', "wb") as f:
-    pickle.dump(lib_dict_new, f)
-
-if __name__ == '__main__':
-  main()
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/bin/deinterleave_fastq.sh
--- a/SeqSero2S/bin/deinterleave_fastq.sh Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
@@ -1,30 +0,0 @@
-#!/bin/bash
-# Usage: deinterleave_fastq.sh < interleaved.fastq f.fastq r.fastq [compress]
-# 
-# Deinterleaves a FASTQ file of paired reads into two FASTQ
-# files specified on the command line. Optionally GZip compresses the output
-# FASTQ files using pigz if the 3rd command line argument is the word "compress"
-# 
-# Can deinterleave 100 million paired reads (200 million total
-# reads; a 43Gbyte file), in memory (/dev/shm), in 4m15s (255s)
-# 
-# Latest code: https://gist.github.com/3521724
-# Also see my interleaving script: https://gist.github.com/4544979
-# 
-# Inspired by Torsten Seemann's blog post:
-# http://thegenomefactory.blogspot.com.au/2012/05/cool-use-of-unix-paste-with-ngs.html
-
-# Set up some defaults
-GZIP_OUTPUT=0
-PIGZ_COMPRESSION_THREADS=10
-
-# If the third argument is the word "compress" then we'll compress the output using pigz
-if [[ "$3" == "compress" ]]; then
-  GZIP_OUTPUT=1
-fi
-# Output paths are quoted so names with spaces or glob characters are handled.
-if [[ ${GZIP_OUTPUT} == 0 ]]; then
-  paste - - - - - - - -  | tee >(cut -f 1-4 | tr "\t" "\n" > "$1") | cut -f 5-8 | tr "\t" "\n" > "$2"
-else
-  paste - - - - - - - -  | tee >(cut -f 1-4 | tr "\t" "\n" | pigz --best --processes ${PIGZ_COMPRESSION_THREADS} > "$1") | cut -f 5-8 | tr "\t" "\n" | pigz --best --processes ${PIGZ_COMPRESSION_THREADS} > "$2"
-fi
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/seqsero2s_db/H_and_O_and_specific_genes.fasta
--- a/SeqSero2S/seqsero2s_db/H_and_O_and_specific_genes.fasta Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,6923 +0,0 @@\n->fliC_g,m_Enteritidisstr_AKFY01000033_g,m__1506\n-ATGGCACAAGTCATTAATACAAACAGCCTGTCGCTGTTGACCCAGAATAACCTGAACAAATCTCAGTCCTCACTGAGTTC\n-CGCTATTGAGCGTCTGTCCTCTGGTCTGCGTATCAACAGCGCGAAAGACGATGCGGCAGGCCAGGCGATTGCTAACCGCT\n-TCACTTCTAATATCAAAGGTCTGACTCAGGCTTCCCGTAACGCTAACGACGGCATTTCTATTGCGCAGACCACTGAAGGT\n-GCGCTGAATGAAATCAACAACAACCTGCAGCGTGTGCGTGAGTTGTCTGTTCAGGCCACTAACGGGACTAACTCTGATTC\n-CGATCTGAAATCTATCCAGGATGAAATTCAGCAACGTCTGGAAGAAATCGATCGCGTTTCTAATCAGACTCAATTTAACG\n-GTGTTAAAGTCCTGTCTCAGGACAACCAGATGAAAATCCAGGTTGGTGCTAACGATGGTGAAACCATTACCATCGATCTG\n-CAAAAAATTGATGTGAAAAGCCTTGGCCTTGATGGGTTCAATGTTAATGGGCCAAAAGAAGCGACAGTGGGTGATCTGAA\n-ATCCAGCTTCAAGAATGTTACGGGTTACGACACCTATGCAGCGGGTGCCGATAAATATCGTGTAGATATTAATTCCGGTG\n-CTGTAGTGACTGATGCAGCAGCACCGGATAAAGTATATGTAAATGCAGCAAACGGTCAGTTAACAACTGACGATGCGGAA\n-AATAACACTGCGGTTGATCTCTTTAAGACCACTAAATCTACTGCTGGTACCGCTGAAGCCAAAGCGATAGCTGGTGCCAT\n-TAAAGGTGGTAAGGAAGGAGATACCTTTGATTATAAAGGCGTGACTTTTACTATTGATACAAAAACTGGTGATGACGGTA\n-ATGGTAAGGTTTCTACTACCATCAATGGTGAAAAAGTTACGTTAACTGTCGCTGATATTGCCACTGGCGCGACGGATGTT\n-AATGCTGCTACCTTACAATCAAGCAAAAATGTTTATACATCTGTAGTGAACGGTCAGTTTACTTTTGATGATAAAACCAA\n-AAACGAGAGTGCGAAACTTTCTGATTTGGAAGCAAACAATGCTGTTAAGGGCGAAAGTAAAATTACAGTAAATGGGGCTG\n-AATATACTGCTAACGCCACGGGTGATAAGATCACCTTAGCTGGCAAAACCATGTTTATTGATAAAACAGCTTCTGGCGTA\n-AGTACATTAATCAATGAAGACGCTGCCGCAGCCAAGAAAAGTACCGCTAACCCACTGGCTTCAATTGATTCTGCATTGTC\n-AAAAGTGGACGCAGTTCGTTCTTCTCTGGGGGCAATTCAAAACCGTTTTGATTCAGCCATTACCAACCTTGGCAATACGG\n-TAACCAATCTGAACTCCGCGCGTAGCCGTATCGAAGATGCTGACTATGCAACGGAAGTTTCTAATATGTCTAAAGCGCAG\n-ATTCTGCAGCAGGCTGGTACTTCCGTTCTGGCGCAGGCTAACCAGGTTCCGCAAAACGTCCTCTCT\n->fliC_g,m,s_Montevideostr_AESV01000018_g,m__1506\n-ATGGCACAAGTCATTAATACAAACAGCCTGTCGCTGTTGACCCAGAATAACCTGAACAAATCTCAGTCCTCACTGAGTTC\n-CGCTATTGAGCGTCTGTCTTCCGGTCTGCGTATCAACAGCGCGAAAGACGATGCGGCAGGCCAGGCGATTGCTAACCGCT\n-TCACTTCTAATATCAAAGGTCTGACTCAGGCTTCCCGTAACGCTAACGACGGCATTTCTATTGCGCAGACCACTGAAGGC\n-GCGCTGAATGAAATCAACAACAACCTGCAGCGTGTGCGTGAGTTGTCTGTTCAGGCCACTAACG
GGACTAACTCTGATTC\n-CGATCTGAAATCTATCCAGGATGAAATTCAGCAACGTCTGGAAGAAATCGATCGCGTTTCTAATCAGACTCAATTTAACG\n-GTGTTAAAGTCCTGTCTCAGGACAACCAGATGAAAATCCAGGTTGGTGCTAACGATGGTGAAACCATTACCATCGATCTG\n-CAAAAAATTGATGTGAAAAGCCTTGGCCTTGATGGGTTCAATGTTAATGGGCCAAAAGAAGCGACAGTGGGTGATCTGAA\n-ATCCAGCTTCAAGAATGTTACGGGTTATGACACCTATGCAGCGGGTGCCAATAAATATCGTGTAGATATTAATTCAGGTG\n-CTGTAGTAACTGATGATGCAGCACCGGATAAAGTATATGTAAATGCAGCAAATGGTCAGTTGACAACTGACGATGCGGAA\n-AATAACACTGCGGTTAACCTATTCAAGACGACTAAATCTGCTGCTGGTACCGATGAAGCCAAAGCGATAGCTGGTGCCAT\n-TAAGGGTGGTAAGGAAGGAGATACCTTTGATTATAAAGGCGTGACTTTTACTATTGATACAAAAACTGGTGATGACGGTA\n-ATGGTAAGGTTTCTACTACCATCAATGGTGAAAAAGTTACGTTAACTGTCGCTGATATTGCCACTGGCGCGACGGATGTT\n-AATGCTGCTACCTTACAATCAAGCAAAAATGTTTATACATCTGTAGTGAACGGTCAGTTTACTTTTGATGATAAAACCAA\n-AAACGAGAGTGCGAAACTTTCTGATTTGGAAGCAAACAATGCTGTTAAGGGCGAAAGTAAAATTACAGTAAATGGGGCTG\n-AATATACTGCTAACGCCGCGGGTGATAAGGTCACCTTAGCTGGCAAAACCATGTTTATTGATAAAACAGCTTCTGGCGTT\n-AGTACATTAATCAATGAAGACGCTGCCGCAGCCAAGAAAAGTACCGCTAACCCACTGGCTTCAATTGATTCTGCATTGTC\n-AAAAGTGGACGCAGTTCGTTCTTCTCTGGGGGCAATTCAAAACCGTTTTGATTCAGCCATTACCAACCTTGGCAATACGG\n-TAACCAATCTGAACTCCGCGCGTAGCCGTATCGAAGATGCTGACTATGCAACGGAAGTTTCTAATATGTCTAAAGCGCAG\n-ATTCTGCAGCAGGCTGGTACTTCCGTTCTGGCGCAGGCTAACCAGGTTCCGCAAAACGTCCTCTCT\n->fljB_1,2_Salmonella.enterica_Stanley_AY353267_1__1521\n-ATGGCACAAGTAATCAACACTAACAGTCTGTCGCTGCTGACCCAGAATAACCTGAACAAATCCCAGTCCGCACTGGGCAC\n-CGCTATCGAGCGTCTGTCTTCTGGTCTGCGTATCAACAGCGCGAAAGACGATGCGGCAGGTCAGGCGATTGCTAACCGTT\n-TTACCGCGAACATCAAAGGTCTGACTCAGGCTTCCCGTAACGCTAACGACGGTATCTCCATTGCGCAGACCACTGAAGGC\n-GCGCTGAACGAAATCAACAACAACCTGCAGCGTGTGCGTGAACTGGCGGTTCAGTCTGCTAACAGCACTAACTCCCAGTC\n-TGACCTCGACTCTATCCAGGCTGAAATTACCCAGCGTCTGAACGAAATCGACCGTGTATCCGGCCAGACTCAGTTCAACG\n-GCGTGAAAGTCCTGGCGCAGGACAACACCCTGACCATCCAGGTTGGTGCCAACGACGGTGAAACTATCGATATCGATCTG\n-AAGCAGATCAACTCTCAGACCCTGGGTCTGGACTCACTGAACGTGCAGAAAGCGTATGATGTGAAAGATACAGCAGTAAC\n-AACGAAAGCTTATGCCAATAATGGTACTACACTGGATGTATCGGGTCTTGATGATGCAGCTATTAAAGCGGCTACGGGTG\n-GTACGAATGGTACGGCTTCTGTAACCGGT
GGTGCGGTTAAATTTGACGCAGATAATAACAAGTACTTTGTTACTATTGGT'..b'CGGTGACAATGACCGCAAATAAATCAACAGTAACTGGGGCCGG\n-CACAGTTACCAAAAACCAAATTGTAGACGCTGTTACTCCGGCACCAGTTGATACAGTCGCAGCAGCTACTGCATTGACCA\n-ATGCAGGTGTGACAGGTGCGACAGGTAATACCAGCTTGGTTAAAATGTCATTTGAAGATAAAAATGGCAAAGTTACTGAT\n-GCGGGTTACGCGCTTAAAGTTGGAAATGATTATTATGCCGCTGATTACGATGAAAAGACTGGTGAGATAAAAGCTAAGAC\n-TGTAAATTATACTGACGCTACTGGTGCAACAAAAACTGGTGCTGTGAAATTTGGCGGCGCGAATGGTAAAACTGAAGTTG\n-TGACTACAGTTGATGGTAATACTTATCAGGCTAGTGATGTGAAAGGGCATAATTTCCAGAGTGGTGGCGCTTTAAGTGAG\n-GCTGTGACTACTAAAACTGAAAACCCGCTGGCTAAAATTGATGCCGCGCTGGCGCAGGTTGATGCGCTGCGTTCTGACCT\n-GGGTGCGGTTCAGAACCGTTTCAACTCCGCTATCACCAATCTGGGCAATACCGTAAACAACTTGTCTGAAGCGCGTAGCC\n-GTATCGAAGATTCCGACTACGCGACCGAAGTCTCCAACATGTCTCGCGCGCAGATTCTGCAGCAGGCCGGTACTTCCGTT\n-CTGGCGCAGGCTAACCAGGTTCCGCAAAACGTCCTCTCTTTACTGCGTTAA\n->fliC_1,5,7_Salmonella.enterica_from-cdc-Stk1778_1,5,7__1521\n-ATGGCACAAGTCATTAATACAAACAGCCTGTCGCTGTTGACCCAGAATAACCTGAACAAATCCCAGTCCGCACTGGGCAC\n-TGCTATTGAGCGTCTGTCTTCCGGTCTGCGTATCAACAGCGCGAAAGACGATGCGGCAGGTCAGGCGATTGCTAACCGTT\n-TCACCGCGAACATCAAAGGCCTGACGCAGGCTTCCCGTAACGCTAACGACGGTATTTCTATTGCGCAGACCACTGAAGGC\n-GCGCTGAACGAAATCAACAACAACCTGCAGCGTGTGCGTGAACTGGCGGTTCAGTCTGCTAACAGCACCAACTCCCAGTC\n-TGACCTCGACTCCATCCAGGCTGAAATCACCCAGCGTCTGAACGAAATCGACCGTGTATCCGGCCAGACTCAGTTCAACG\n-GCGTGAAAGTCCTGGCGCAGGACAACACCCTGACCATCCAGGTTGGCGCGAACGACGGTGAAACTATTGATATCGATCTG\n-AAGCAGATCAACTCGCAGACCCTGGGCCTGGATTCACTGAACGTGCAGAAAGCGTATGATGTGAAAGATACAGCAGTAAC\n-AACGACAGCTTATGCCGATAACGGTACTACATTGAATGTCTCAGGCCTTGATGATGCAGCTATCAAAGCGGCTACGGGGG\n-GTACGACTGGTGCACCTACTGTAACAGGTGGTGCGGTTAAATTTGACGCAGATAATAACAAGTACTTTGTTACTATTGGG\n-GGCTTTACTGGTGGTGATCTCGCCAAAAATGGCGATTATGAAGTTAACGTTGCTACTGACGGTACAGTAACACTTGCGCC\n-TGGTGCAACTAAAACCACAATGCCTGCTGGTGCGACAACTAAAACAGAAGTACAGGAGTTAAAAACTACACCGGTAGCTG\n-CTTCAGCAGATGCTAAAAATGCCTTAATCGCTGGCGGCGTTGACACTACCGATGCTAATGGCGCTGAGTTGGTCAAAATG\n-TCTTATACCGATAAAAATGGTAAGACAATTGAAGGCGGCTATGCGCTTAAAGCTGGCGATAAGTATTACGCCGCAGATTA\n-CGACGAAACGACAGGGGCAATTAAAGCTAAAACCACAA
GTTATACTGCTGCTGACGGTACTACCAAAACAGCGGCTAACC\n-AACTGGGTGGCGCAGACGGTAAAACCGAAGTTGTTACTATCGACGGTAAAACCTACAATGCCAGCAAAGCCGCTGGTCAT\n-GATTTCAAAGCACAGCCAGAGCTGGCGGAAGCGGCTGCTAAAACCACTGAAAACCCGCTGGCTAAAATTGATGCCGCGCT\n-GGCGCAGGTGGATGCACTGCGTTCTGACCTGGGTGCGGTTCAGAACCGTTTCAACTCCGCTATCACCAACCTGGGCAATA\n-CCGTAAATAACCTGTCTTCTGCCCGTAGCCGTATCGAAGATTCCGACTACGCGACCGAAGTCTCCAACATGTCTCGCGCG\n-CAGATTCTGCAGCAGGCCGGTACCTCCGTTCTGGCGCAGGCTAACCAGGTTCCGCAAAACGTCCTCTCTTTACTGCGTTA\n-A\n->fliC_1,2,7_Salmonella.enterica_from-cdc-Stk2293_1,2,7__1521\n-ATGGCACAAGTCATTAACACAAACAGCCTGTCGCTGTTGACCCAGAATAACCTGAACAAATCCCAGTCCGCACTGGGCAC\n-TGCTATTGAGCGTCTGTCTTCCGGTCTGCGTATCAACAGCGCGAAAGACGATGCGGCAGGTCAGGCGATTGCTAACCGTT\n-TCACCGCGAACATCAAAGGCCTGACTCAGGCTTCCCGTAACGCTAACGACGGTATTTCTATTGCGCAGACCACTGAAGGC\n-GCGCTGAACGAAATCAACAACAACCTGCAGCGTGTGCGTGAACTGGCGGTTCAGTCTGCTAACAGCACCAACTCCCAGTC\n-TGACCTCGACTCCATCCAGGCTGAAATCACCCAGCGTCTGAACGAAATCGACCGTGTATCCGGCCAGACTCAGTTCAACG\n-GCGTGAAAGTCCTGGCGCAGGACAACACCCTGACCATCCAGGTTGGCGCCAACGACGGTGAAACTATCGATATCGATCTG\n-AAGCAGATCAACTCTCAGACCCTGGGTCTGGATTCACTGAACGTGCAGAAAGCGTATGATGTGAAAGATACAGCAGTAAC\n-AACGAAAGCTTATGCCAATAATGGTACTACACTGGATGTATCGGGTCTTACTGATGCAGCTATTAAAACGGCTACGGGTG\n-GTACGAATGGTGCACCTGCTGTAACAGGTGGTGCGGTTAAATTTGACGCAGATAATAACAAGTACTTTGTTACTATTGGT\n-GGCTTTACTGGTGCTGATGCCGCCAAAAATGGCGATTATGAAGTTAACGTTGCTACTGACGGTACAGTAACACTTGCGCC\n-TGGTGCAACTAAAACCACAATGCCTGCTGGTGCGACAACTAAAACAGAAGTACAGGAGTTAAAAGCTACACCGGTAGCTG\n-CTTCAGCAGATGCTAAAAATGCCTTAATCGCTGGCGGCGTTGACACTGCCGATGCTAATGGCGCTGAGTTGGTCAAAATG\n-TCTTATACCGATAAAAATGGTAAGACAATTGAAGGCGGCTATGCGCTTAAAGCTGGCGATAAGTATTACGCCGCAGATTA\n-CGACGAAACGACAGGGGCAATTAAAGCTAAAACCACAAGTTATACTGCTGCTGACGGTACTACCAAAACAGCGGCTAACC\n-AACTGGGTGGCGCAGACGGTAAAACTGAAGTCGTTTCTATCGACGGTAAAACCTACAATGCCAGCAAAGCCGAAGGTCAC\n-AACTTCAAAGCACAGCCAGAGCTGGCTGAAGTAGCTACTAAAACCACCGAAAACCCGCTGCAGAAAATTGATGCTGCGCT\n-GGCACAGGTTGACACGTTACGTTCTGACCTGGGTGCGGTACAAAACCGTTTCAACTCCGCTATCACCAACCTGGGCAATA\n-CCGTAAATAACCTGTCTTCTGCCCGTAGCCGTATCGAAGATTCCGACTACGCGACCGAAGTC
TCCAACATGTCTCGCGCG\n-CAGATTCTGCAGCAGGCCGGTACTTCCGTTCTGGCGCAGGCTAACCAGGTTCCGCAAAACGTCCTCTCTTTACTGCGTTA\n-A\n'
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/seqsero2s_db/antigens.pickle
b
Binary file SeqSero2S/seqsero2s_db/antigens.pickle has changed
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/seqsero2s_db/invA_mers_dict
b
Binary file SeqSero2S/seqsero2s_db/invA_mers_dict has changed
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/seqsero2s_db/kmer/salmonella.log
--- a/SeqSero2S/seqsero2s_db/kmer/salmonella.log Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
@@ -1,24 +0,0 @@
-06/26/2023 09:03:06 AM singleSampleTool : GDUTNS--Y1.R1.raw.fastq.gz and GDUTNS--Y1.R2.raw.fastq.gz
-06/26/2023 09:03:06 AM singleSampleTool : paired True
-06/26/2023 09:03:06 AM singleSampleTool : fastq1 start
-06/26/2023 09:03:06 AM singleFileTool :GDUTNS--Y1.R1.raw.fastq.gz
-06/26/2023 09:03:06 AM singleFileTool : fastq
-06/26/2023 09:03:06 AM fileExplorer :GDUTNS--Y1.R1.raw.fastq.gz
-06/26/2023 09:03:54 AM singleSampleTool : fastq1 done
-06/26/2023 09:03:54 AM singleSampleTool : fastq2 start
-06/26/2023 09:03:54 AM singleFileTool :GDUTNS--Y1.R2.raw.fastq.gz
-06/26/2023 09:03:54 AM singleFileTool : fastq
-06/26/2023 09:03:54 AM fileExplorer :GDUTNS--Y1.R2.raw.fastq.gz
-06/26/2023 09:04:48 AM singleSampleTool : fastq2 done
-06/26/2023 09:04:48 AM singleSampleTool : weightedProfile start
-06/26/2023 09:04:48 AM weightedProf
-06/26/2023 09:04:48 AM singleSampleTool : weightedProfile finished
-06/26/2023 09:04:48 AM singleSampleTool : getMaxCount start
-06/26/2023 09:04:48 AM getMaxCount
-06/26/2023 09:04:48 AM Max Support :GDUTNS--Y : {'purE': {'5': 54640}, 'dnaN': {'8': 75064}, 'thrA': {'15': 80816}, 'sucA': {'11': 61141}, 'hemD': {'11': 72516}, 'aroC': {'8': 77112}, 'hisD': {'11': 51911}}
-06/26/2023 09:04:48 AM Second Max Support :GDUTNS--Y : {'purE': {'4': 48207, '456': 48207}, 'dnaN': {'1': 58680, '492': 58680}, 'thrA': {'10': 63003}, 'sucA': {'9': 58437, '46': 58437, '109': 58437, '197': 58437, '413': 58437, '570': 58437, '925': 58437, '1060': 58437}, 'hemD': {'3': 65987}, 'aroC': {'7': 67451}, 'hisD': {'1': 40164, '353': 40164}}
-06/26/2023 09:04:48 AM singleSampleTool : getMaxCount end
-06/26/2023 09:04:48 AM singleSampleTool : findST start
-06/26/2023 09:04:48 AM findST
-06/26/2023 09:04:48 AM singleSampleTool : findST end
-06/26/2023 09:04:48 AM Command :['/home/shaoting/.conda/envs/seqsero2s/bin/stringMLST.py', '--predict', '-P', 'kmer/salmonella', '-1', 'GDUTNS--Y1.R1.raw.fastq.gz', '-2', 'GDUTNS--Y1.R2.raw.fastq.gz', '-o', 'GDUTNS--Y1_stringMLST.txt']
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/seqsero2s_db/kmer/salmonella_35.txt
--- a/SeqSero2S/seqsero2s_db/kmer/salmonella_35.txt Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
b'@@ -1,388076 +0,0 @@\n-GTTTTTCGCCCGGGACACGCGGATTACACCTATGA\taroC\t[1,305,511,512,529,530,531,532,698,1126,1173]\n-TCATAGGTGTAATCCGCGTGTCCCGGGCGAAAAAC\taroC\t[1,305,511,512,529,530,531,532,698,1126,1173]\n-TTTTTCGCCCGGGACACGCGGATTACACCTATGAG\taroC\t[1,305,511,512,529,530,531,532,698,1126,1173]\n-CTCATAGGTGTAATCCGCGTGTCCCGGGCGAAAAA\taroC\t[1,305,511,512,529,530,531,532,698,1126,1173]\n-TTTTCGCCCGGGACACGCGGATTACACCTATGAGC\taroC\t[1,305,511,512,529,530,531,532,698,1126,1173]\n-GCTCATAGGTGTAATCCGCGTGTCCCGGGCGAAAA\taroC\t[1,305,511,512,529,530,531,532,698,1126,1173]\n-TTTCGCCCGGGACACGCGGATTACACCTATGAGCA\taroC\t[1,305,511,512,529,530,531,532,698,1126,1173]\n-TGCTCATAGGTGTAATCCGCGTGTCCCGGGCGAAA\taroC\t[1,305,511,512,529,530,531,532,698,1126,1173]\n-TTCGCCCGGGACACGCGGATTACACCTATGAGCAG\taroC\t[1,305,511,512,529,530,531,532,698,1126,1173]\n-CTGCTCATAGGTGTAATCCGCGTGTCCCGGGCGAA\taroC\t[1,305,511,512,529,530,531,532,698,1126,1173]\n-TCGCCCGGGACACGCGGATTACACCTATGAGCAGA\taroC\t[1,305,511,512,529,530,531,532,698,1126,1173]\n-TCTGCTCATAGGTGTAATCCGCGTGTCCCGGGCGA\taroC\t[1,305,511,512,529,530,531,532,698,1126,1173]\n-CGCCCGGGACACGCGGATTACACCTATGAGCAGAA\taroC\t[1,305,511,512,529,530,531,532,698,1126,1173]\n-TTCTGCTCATAGGTGTAATCCGCGTGTCCCGGGCG\taroC\t[1,305,511,512,529,530,531,532,698,1126,1173]\n-GCCCGGGACACGCGGATTACACCTATGAGCAGAAA\taroC\t[1,305,511,512,529,530,531,532,698,1126,1173]\n-TTTCTGCTCATAGGTGTAATCCGCGTGTCCCGGGC\taroC\t[1,305,511,512,529,530,531,532,698,1126,1173]\n-CCCGGGACACGCGGATTACACCTATGAGCAGAAAT\taroC\t[1,305,511,512,529,530,531,532,698,1126,1173]\n-ATTTCTGCTCATAGGTGTAATCCGCGTGTCCCGGG\taroC\t[1,305,511,512,529,530,531,532,698,1126,1173]\n-CCGGGACACGCGGATTACACCTATGAGCAGAAATA\taroC\t[1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,20,21,22,23,27,28,29,30,31,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,50,51,52,53,56,59,60,61,62,63,65,67,68,69,70,72,75,76,77,78,79,80,81,82,87,88,89,90,92,93,94,98,99,100,101,102,103,105,106,107,108,110,111,112,113,114,115,116,117,118,119,12
0,121,122,123,124,128,129,130,131,136,137,140,141,142,143,144,147,148,150,152,153,154,155,156,158,159,160,161,162,163,164,165,168,169,170,172,175,178,179,182,183,184,185,186,187,189,193,194,195,196,197,198,199,200,201,202,203,208,209,210,213,214,215,218,221,222,225,230,231,232,233,234,244,250,254,255,256,261,262,270,277,279,282,289,290,291,294,296,297,298,299,302,303,304,305,306,307,308,310,312,313,314,315,316,319,320,321,322,324,325,326,328,329,331,332,333,336,338,341,342,343,344,345,346,347,348,349,351,353,355,357,359,360,361,362,363,364,365,367,368,369,371,373,374,375,376,379,381,382,383,386,391,397,398,400,401,403,404,407,408,409,410,411,412,413,415,416,418,419,420,421,426,428,430,431,434,435,437,438,439,440,441,442,443,444,450,451,453,454,457,462,463,464,465,468,470,472,473,474,475,476,478,480,481,482,483,484,485,488,490,492,493,494,495,496,497,498,501,504,505,507,509,511,512,514,515,519,520,523,526,527,528,529,530,531,532,533,534,535,536,537,538,540,541,542,543,544,545,546,547,548,549,551,553,558,559,560,561,564,565,566,567,568,569,571,572,575,576,579,581,582,583,584,587,589,590,592,594,595,597,599,601,602,604,608,626,627,628,630,631,634,636,640,641,646,647,650,651,652,653,658,660,662,663,664,665,666,667,668,669,670,672,673,674,675,678,679,680,681,686,688,691,692,693,698,699,700,701,702,706,711,713,717,718,719,720,723,724,725,726,727,729,732,733,734,735,736,739,740,742,747,748,749,750,751,752,753,755,756,757,759,760,761,763,764,765,766,767,770,771,773,774,776,778,779,781,782,783,784,785,786,787,788,789,790,791,792,794,795,796,799,800,801,804,805,808,809,810,811,812,814,816,818,820,821,822,823,825,826,827,830,831,832,833,834,835,836,837,838,839,840,844,845,846,850,851,854,855,856,857,858,859,860,861,862,863,864,865,866,867,871,876,884,885,886,887,891,892,893,894,896,897,898,908,909,910,911,913,914,916,917,919,922,923,924,926,927,930,931,932,935,936,937,938,940,943,944,945,947,952,953,955,956,959,960,962,965,967,968,971,974,976,978,980,982,983,988,989,990,991,99
2,993,994,995,999,1000,1001,1002,1003,1004,1006,1007,1009,'..b'ATCCCCTGTCTGATTAA\tthrA\t[1618]\n-TTAATCAGACAGGGGATCTGGAACTGAGCAATGGG\tthrA\t[1618]\n-CCATTGCTCAGTTCCAGATCCCCTGTCTGATTAAA\tthrA\t[1618]\n-TTTAATCAGACAGGGGATCTGGAACTGAGCAATGG\tthrA\t[1618]\n-CATTGCTCAGTTCCAGATCCCCTGTCTGATTAAAA\tthrA\t[1618]\n-TTTTAATCAGACAGGGGATCTGGAACTGAGCAATG\tthrA\t[1618]\n-ATTGCTCAGTTCCAGATCCCCTGTCTGATTAAAAA\tthrA\t[1618]\n-TTTTTAATCAGACAGGGGATCTGGAACTGAGCAAT\tthrA\t[1618]\n-TTGCTCAGTTCCAGATCCCCTGTCTGATTAAAAAT\tthrA\t[1618]\n-ATTTTTAATCAGACAGGGGATCTGGAACTGAGCAA\tthrA\t[1618]\n-TGCTCAGTTCCAGATCCCCTGTCTGATTAAAAATA\tthrA\t[1618]\n-TATTTTTAATCAGACAGGGGATCTGGAACTGAGCA\tthrA\t[1618]\n-GCCGGACGCCAGGCTGTTGAAATCGATGTCCTACT\tthrA\t[1623]\n-AGTAGGACATCGATTTCAACAGCCTGGCGTCCGGC\tthrA\t[1623]\n-CCGGACGCCAGGCTGTTGAAATCGATGTCCTACTA\tthrA\t[1623]\n-TAGTAGGACATCGATTTCAACAGCCTGGCGTCCGG\tthrA\t[1623]\n-CGGACGCCAGGCTGTTGAAATCGATGTCCTACTAG\tthrA\t[1623]\n-CTAGTAGGACATCGATTTCAACAGCCTGGCGTCCG\tthrA\t[1623]\n-GGACGCCAGGCTGTTGAAATCGATGTCCTACTAGG\tthrA\t[1623]\n-CCTAGTAGGACATCGATTTCAACAGCCTGGCGTCC\tthrA\t[1623]\n-GACGCCAGGCTGTTGAAATCGATGTCCTACTAGGA\tthrA\t[1623]\n-TCCTAGTAGGACATCGATTTCAACAGCCTGGCGTC\tthrA\t[1623]\n-ACGCCAGGCTGTTGAAATCGATGTCCTACTAGGAA\tthrA\t[1623]\n-TTCCTAGTAGGACATCGATTTCAACAGCCTGGCGT\tthrA\t[1623]\n-CGCCAGGCTGTTGAAATCGATGTCCTACTAGGAAG\tthrA\t[1623]\n-CTTCCTAGTAGGACATCGATTTCAACAGCCTGGCG\tthrA\t[1623]\n-GCCAGGCTGTTGAAATCGATGTCCTACTAGGAAGC\tthrA\t[1623]\n-GCTTCCTAGTAGGACATCGATTTCAACAGCCTGGC\tthrA\t[1623]\n-CCAGGCTGTTGAAATCGATGTCCTACTAGGAAGCG\tthrA\t[1623]\n-CGCTTCCTAGTAGGACATCGATTTCAACAGCCTGG\tthrA\t[1623]\n-CAGGCTGTTGAAATCGATGTCCTACTAGGAAGCGA\tthrA\t[1623]\n-TCGCTTCCTAGTAGGACATCGATTTCAACAGCCTG\tthrA\t[1623]\n-AGGCTGTTGAAATCGATGTCCTACTAGGAAGCGAT\tthrA\t[1623]\n-ATCGCTTCCTAGTAGGACATCGATTTCAACAGCCT\tthrA\t[1623]\n-GGCTGTTGAAATCGATGTCCTACTAGGAAGCGATG\tthrA\t[1623]\n-CATCGCTTCCTAGTAGGACATCGATTTCAACAGCC\tthrA\t[1623]\n-GCTGTTGAAATCGATGTCCTACTAGGAAGCGATGG\tthrA\t[1623]\n-CCATCGCTTCCTAGTAGGACATCGATTTCAA
CAGC\tthrA\t[1623]\n-CTGTTGAAATCGATGTCCTACTAGGAAGCGATGGA\tthrA\t[1623]\n-TCCATCGCTTCCTAGTAGGACATCGATTTCAACAG\tthrA\t[1623]\n-TGTTGAAATCGATGTCCTACTAGGAAGCGATGGAG\tthrA\t[1623]\n-CTCCATCGCTTCCTAGTAGGACATCGATTTCAACA\tthrA\t[1623]\n-GTTGAAATCGATGTCCTACTAGGAAGCGATGGAGC\tthrA\t[1623]\n-GCTCCATCGCTTCCTAGTAGGACATCGATTTCAAC\tthrA\t[1623]\n-TTGAAATCGATGTCCTACTAGGAAGCGATGGAGCT\tthrA\t[1623]\n-AGCTCCATCGCTTCCTAGTAGGACATCGATTTCAA\tthrA\t[1623]\n-TGAAATCGATGTCCTACTAGGAAGCGATGGAGCTC\tthrA\t[1623]\n-GAGCTCCATCGCTTCCTAGTAGGACATCGATTTCA\tthrA\t[1623]\n-GAAATCGATGTCCTACTAGGAAGCGATGGAGCTCT\tthrA\t[1623]\n-AGAGCTCCATCGCTTCCTAGTAGGACATCGATTTC\tthrA\t[1623]\n-AAATCGATGTCCTACTAGGAAGCGATGGAGCTCTC\tthrA\t[1623]\n-GAGAGCTCCATCGCTTCCTAGTAGGACATCGATTT\tthrA\t[1623]\n-AATCGATGTCCTACTAGGAAGCGATGGAGCTCTCT\tthrA\t[1623]\n-AGAGAGCTCCATCGCTTCCTAGTAGGACATCGATT\tthrA\t[1623]\n-ATCGATGTCCTACTAGGAAGCGATGGAGCTCTCTT\tthrA\t[1623]\n-AAGAGAGCTCCATCGCTTCCTAGTAGGACATCGAT\tthrA\t[1623]\n-TCGATGTCCTACTAGGAAGCGATGGAGCTCTCTTA\tthrA\t[1623]\n-TAAGAGAGCTCCATCGCTTCCTAGTAGGACATCGA\tthrA\t[1623]\n-CGATGTCCTACTAGGAAGCGATGGAGCTCTCTTAC\tthrA\t[1623]\n-GTAAGAGAGCTCCATCGCTTCCTAGTAGGACATCG\tthrA\t[1623]\n-GATGTCCTACTAGGAAGCGATGGAGCTCTCTTACT\tthrA\t[1623]\n-AGTAAGAGAGCTCCATCGCTTCCTAGTAGGACATC\tthrA\t[1623]\n-ATGTCCTACTAGGAAGCGATGGAGCTCTCTTACTT\tthrA\t[1623]\n-AAGTAAGAGAGCTCCATCGCTTCCTAGTAGGACAT\tthrA\t[1623]\n-TGTCCTACTAGGAAGCGATGGAGCTCTCTTACTTC\tthrA\t[1623]\n-GAAGTAAGAGAGCTCCATCGCTTCCTAGTAGGACA\tthrA\t[1623]\n-GTCCTACTAGGAAGCGATGGAGCTCTCTTACTTCG\tthrA\t[1623]\n-CGAAGTAAGAGAGCTCCATCGCTTCCTAGTAGGAC\tthrA\t[1623]\n-TCCTACTAGGAAGCGATGGAGCTCTCTTACTTCGG\tthrA\t[1623]\n-CCGAAGTAAGAGAGCTCCATCGCTTCCTAGTAGGA\tthrA\t[1623]\n-CCTACTAGGAAGCGATGGAGCTCTCTTACTTCGGC\tthrA\t[1623]\n-GCCGAAGTAAGAGAGCTCCATCGCTTCCTAGTAGG\tthrA\t[1623]\n-CTACTAGGAAGCGATGGAGCTCTCTTACTTCGGCG\tthrA\t[1623]\n-CGCCGAAGTAAGAGAGCTCCATCGCTTCCTAGTAG\tthrA\t[1623]\n-TACTAGGAAGCGATGGAGCTCTCTTACTTCGGCGC\tthrA\t[1623]\n-GCGCCGAAGTAAGAGAGCTCCATCGCTTCCTAGTA\tthrA\t[1623]\n-ACT
AGGAAGCGATGGAGCTCTCTTACTTCGGCGCT\tthrA\t[1623]\n-AGCGCCGAAGTAAGAGAGCTCCATCGCTTCCTAGT\tthrA\t[1623]\n-CTAGGAAGCGATGGAGCTCTCTTACTTCGGCGCTA\tthrA\t[1623]\n-TAGCGCCGAAGTAAGAGAGCTCCATCGCTTCCTAG\tthrA\t[1623]\n-TAGGAAGCGATGGAGCTCTCTTACTTCGGCGCTAA\tthrA\t[1623]\n-TTAGCGCCGAAGTAAGAGAGCTCCATCGCTTCCTA\tthrA\t[1623]\n'
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/seqsero2s_db/kmer/salmonella_aroC.tfa
--- a/SeqSero2S/seqsero2s_db/kmer/salmonella_aroC.tfa Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,2512 +0,0 @@\n->aroC_1\n-GTTTTTCGCCCGGGACACGCGGATTACACCTATGAGCAGAAATACGGCCTGCGCGATTACCGCGGCGGTGGACGTTCTTCCGCGCGTGAAACCGCGATGCGCGTAGCGGCAGGGGCGATCGCCAAGAAATACTTGGCGGAAAAGTTCGGCATCGAAATCCGCGGCTGCCTGACCCAGATGGGCGACATTCCGCTGGAGATTAAAGACTGGCGTCAGGTTGAGCTTAATCCGTTCTTTTGCCCCGATGCGGACAAACTTGACGCGCTGGACGAACTGATGCGCGCGCTGAAAAAAGAGGGTGACTCCATCGGCGCGAAAGTGACGGTGATGGCGAGCGGCGTGCCGGCAGGGCTTGGCGAACCGGTATTTGACCGACTGGATGCGGACATCGCCCATGCGCTGATGAGCATCAATGCGGTGAAAGGCGTGGAGATCGGCGAAGGATTTAACGTGGTGGCGCTGCGCGGCAGCCAGAATCGCGATGAAATCACGGCGCAGGGT\n->aroC_2\n-GTTTTTCGTCCGGGACACGCGGATTACACCTATGAGCAGAAATACGGCCTGCGCGATTACCGTGGCGGTGGACGTTCTTCCGCGCGTGAAACCGCGATGCGCGTAGCGGCAGGGGCGATCGCCAAGAAATACCTGGCGGAAAAGTTCGGCATCGAAATCCGCGGCTGCCTGACCCAGATGGGCGACATTCCGCTGGAGATTAAAGACTGGCGTCAGGTTGAGCTTAATCCGTTCTTTTGCCCCGATGCGGACAAACTTGACGCGCTGGACGAACTGATGCGCGCGCTGAAAAAAGAGGGTGACTCCATCGGCGCGAAAGTGACGGTGATGGCGAGCGGCGTGCCGGCAGGGCTTGGCGAACCGGTATTTGACCGACTGGATGCGGACATCGCCCATGCGCTGATGAGCATTAATGCGGTGAAAGGCGTGGAGATCGGCGAAGGATTTAACGTGGTGGCGCTGCGTGGCAGCCAGAATCGCGATGAAATCACGGCGCAGGGT\n->aroC_3\n-GTTTTTCGTCCGGGACACGCGGATTACACCTATGAGCAGAAATACGGCCTGCGTGATTACCGTGGCGGTGGACGTTCTTCCGCGCGTGAAACCGCGATGCGCGTAGCGGCAGGGGCGATTGCCAAGAAATACCTGGCGGAAAAGTTCGGCATCGAAATCCGCGGCTGCCTGACCCAGATGGGCGACATTCCGCTGGAGATTAAAGACTGGCGTCAGGTTGAGCTTAATCCGTTCTTTTGCCCCGATGCAGACAAACTTGACGCGCTGGACGAACTGATGCGCGCGCTGAAAAAAGAGGGTGACTCCATCGGCGCGAAAGTGACGGTGATGGCGAGCGGCGTGCCGGCAGGGCTTGGCGAACCGGTATTTGACCGACTGGATGCGGACATCGCCCATGCGCTGATGAGCATCAATGCGGTGAAAGGCGTGGAGATCGGCGAAGGATTTAACGTGGTGGCGCTGCGTGGCAGCCAGAATCGCGATGAAATCACGGCGCAGGGT\n->aroC_4\n-GTTTTTCGTCCGGGACACGCGGATTACACCTATGAGCAGAAATACGGCCTGCGCGATTACCGTGGCGGTGGACGTTCTTCCGCGCGTGAAACCGCGATGCGCGTAGCGGCAGGGGCGATCGCCAAGAAATACCTGGCGGAAAAGTTCGGCATCGAAATCCGCGGCTGCCTGACCCAGATGGGCGATATTCCGCTGGAGATTAAAGACTGGCGTCAGGTTGAGCTTAATCCGTTCTTTTGTCCCGATGCGGACAAACTTGACGCGCTGGACGAACTGATGCGCGCGCTGAAAAAAGAGGGTGACTCCATCGGCGCGAAAGTGACGGTGATGGCGAGCGGCGTGCCGGCAGGGCTTGGCGAACCGGTATTTGACCGACTGGATGCGGACATCGCCCATGCGCTGATGAGCATTAATGCGGTGAAAGG
CGTGGAGATCGGCGAAGGATTTAACGTGGTGGCGCTGCGCGGCAGCCAGAATCGCGATGAAATCACGGCGCAGGGT\n->aroC_5\n-GTTTTTCGTCCGGGACACGCGGATTACACCTATGAGCAGAAATACGGCCTGCGCGATTACCGTGGCGGTGGACGTTCTTCCGCGCGTGAAACCGCGATGCGCGTAGCGGCAGGGGCGATCGCCAAGAAATACCTGGCGGAAAAGTTCGGCATCGAAATCCGCGGCTGCCTGACCCAGATGGGCGATATTCCGCTGGAGATTAAAGACTGGCGTCAGGTTGAGCTTAATCCGTTCTTTTGTCCCGATGCGGACAAACTTGACGCGCTGGACGAACTGATGCGCGCGCTGAAAAAAGAGGGCGACTCCATCGGCGCGAAAGTGACGGTGATGGCGAGCGGCGTGCCGGCAGGGCTTGGCGAACCGGTTTTTGACCGACTGGATGCGGACATCGCCCATGCGCTGATGAGCATCAATGCGGTGAAAGGCGTGGAGATCGGCGAAGGATTTAACGTGGTGGCGCTGCGCGGCAGCCAGAATCGCGATGAAATCACGGCGCAGGGT\n->aroC_6\n-GTTTTTCGTCCGGGACACGCGGATTACACCTATGAGCAGAAATACGGCCTGCGCGATTACCGTGGCGGTGGACGTTCTTCCGCGCGTGAAACCGCGATGCGCGTAGCGGCAGGGGCGATCGCCAAGAAATACCTGGCGGAAAAGTTCGGTATCGAAATCCGCGGCTGCCTGACCCAGATGGGCGACATTCCGCTGGAGATTAAAGACTGGCGTCAGGTTGAGCTTAATCCGTTCTTTTGCCCCGATGCAGACAAACTTGACGCGCTGGACGAACTGATGCGCGCGCTGAAAAAAGAGGGTGACTCCATCGGCGCGAAAGTGACGGTGATGGCGAGCGGCGTGCCGGCAGGGCTTGGCGAACCGGTATTTGACCGACTGGATGCGGACATCGCCCATGCGCTGATGAGCATTAATGCGGTGAAAGGCGTGGAGATCGGCGAAGGATTTAACGTGGTGGCGCTGCGTGGCAGCCAGAATCGCGATGAAATCACGGCGCAGGGT\n->aroC_7\n-GTTTTTCGTCCGGGACACGCGGATTACACCTATGAGCAGAAATACGGCCTGCGCGATTACCGTGGCGGTGGACGTTCTTCCGCGCGTGAAACCGCGATGCGCGTAGCGGCAGGGGCGATCGCCAAGAAATACCTGGCGGAAAAGTTCGGCATCGAAATCCGCGGCTGCCTGACCCAGATGGGCGATATTCCGCTGGAGATTAAAGACTGGCGTCAGGTTGAGCTTAATCCGTTCTTTTGTCCCGATGCGGACAAACTTGACGCGCTGGACGAACTGATGCGCGCGCTGAAAAAAGAGGGTGACTCCATCGGCGCGAAAGTGACGGTGATGGCGAGCGGCGTGCCGGCAGGGCTTGGCGAACCGGTATTTGACCGACTGGATGCGGACATCGCCCATGCGCTGATGAGCATCAATGCGGTGAAAGGCGTGGAGATCGGCGAAGGATTTAACGTGGTGGCGCTGCGCGGCAGCCAGAATCGCGATGAAATCACGGCGCAGGGT\n->aroC_8\n-GTTTTTCGTCCGGGACACGCGGATTACACCTATGAGCAGAAATACGGCCTGCGCGATTACCGTGGCGGTGGACGTTCTTCCGCGCGTGAAACCGCGATGCGCGTAGCGGCAGGGGCGATCGCCAAGAAATACCTGGCGGAAAAGTTCGGCATCGAAATCCGCGGCTGCCTGACCCAGATGGGCGATATTCCGCTGGAGATTAAAGACTGGCGTCAGGTTGAGCTTAATCCGTTCTTTTGTCCCGATGCGGACAAACTTGACGCGCTGGACGAATTGATGCGCGCGCTGAAAAAAGAGGGTGACTCCATCGGCGCGAAAGTGACGGTGATGGCGAGCGGCGTGCCGGCAGGGCTTGGCGAACCGGTATTT
GACCGACTGGATGCGGA'..b'GCAGGGGCGATCGCTAAGAAATACCTGGCGGAAAAGTTCGGTATCGAAATCCGCGGTTGTCTGACCCAGATGGGCGACATTCCGCTGGAGATTAAAGACTGGCAACAGGTTGAGCGTAATCCGTTCTTTTGCCCCGATGCGGATAAACTTGACGCGCTGGACGAACTGATGCGCGCGCTGAAAAAAGAGGGCGACTCTATCGGCGCGAAAGTGACGGTGATAGCGAGCGGCGTGCCGGCAGGTCTTGGCGAACCGGTATTTGATCGGCTGGATGCGGATATCGCCCATGCGCTGATGAGCATCAATGCGGTGAAAGGCGTGGAGATCGGCGAAGGATTTAAGGTGGTGGCGCTACGCGGCAGCCAGAATCGCGATGAAATCACGGCGCAGGGT\n->aroC_1565\n-GTTTTTCGTCCGGGACACGCGGATTACACCTATGAGCAGAAATACGGCCTGCGCGATTACCGTGGCGGTGGACGTTCTTCCGCGCGTGAAACCGCGATGCGCGTAGCGGCAGGGGCGATCGCCAAGAAATACCTGGCGAAAAAGTTCGGTATCGAAATCCGTGGCTGCCTGACCAAGATGGGCGACATTCCGCTGGAGATTAAAGACTGGCGTCAGGTTGAACTTAATCCGTTCTTTTGCCCCGATGCGGACAAACTTGATGCGCTGGACGAACTGATGCGCGCGCTGAAAAAAGAGGGTGACTCCATCGGCGCGAAAGTGACGGTGATGGCAAGCGGCGTGCCGGCAGGTCTTGGCGAACCAGTATTTGACCGACTGGACGCGGACATCGCCCATGCGCTGATGAGCATCAATGCGGTGAAAGGTGTGGAGATCGGCGAAGGATTTAACGTGGTGGCGCTGCGCGGCAGTCAGAATCGCGATGAAATCACGGCACAGGGT\n->aroC_1567\n-GTCTTTCGTCCGGGACACGCGGATTACACCTATGAGCAGAAATACGGCCTGCGCGATTACCGTGGCGGTGGACGTTCTTCCGCGCGTGAAACCACGATGCGCGTAGCGGCAGGGGCGATCGCCAAGAAATACCTAGCGGAAAAGTTCGGTATCGAAATCCGCGGCTGCCTGACCCAGATGGGCGACATTCCGCTGGAGATTAAAGACTGGCGTCAGGTTGAGCTTAATCCGTTCTTTTGTCCCGATGCGGACAAACTTGACGCGCTGGACGAACTGATGCGCGCGCTGAAAAAAGAGGGCGACTCCATCGGCGCGAAAGTGACGGTGATGGCGAGCGGCGTGCCGGCAGGGCTTGGCGAACCGGTGTTTGACCGACTGGATGCGGACATCGCCCATGCGCTGATGAGCATCAATGCGGTGAAAGGCGTGGAGATCGGCGAAGGATTTAACGTGGTGGCGCTGCGCGGCAGCCAGAATCGCGATGAAATCACGGCGCAGGGT\n->aroC_1568\n-GTTTTTCGTCCGGGACACGCGGATTATACCTATGAGCAGAAATACGGCCTGCGCGATTACCGTGGCGGTGGACGTTCTTCCGCGCGTGAAACCGCGATGCGCGTAGCGGCAGGGGCGATTGCCAAGAAATACCTGGCGGAAAAGTTCGGCATCGAAATCCGCGGCTGCCTGACCCAGATGGGCGACATTCCGCTGGAGATTAAAGACTGGCGTCAGGTTGAGCTTAATCCGTTCTTTTGTCCCGATGCGGACAAACTTGACGCGCTGGACGAACTGATGCGCGCGCTGAAAAAAGAGGGTGACTCCATCGGCGCGAAAGTGACGGTGATGGCGAGCGGTGTGCCGGCAGGGCTTGGCGAACCGGTATTTGACCGACTGGATGCGGACATCGCCCATGCGCTGATGAGCATTAATGCGGTGAAAGGCGTGGAGATCGGCGAAGGATTTAACGTGGTGGCGCTGCGCGGCAGCCAGAATCGCGATGAAATCACGGCGCAGGGT\n->aroC_1569\n-GTTTTTCGTCCGGGACAC
GCGGATTACACCTATGAGCAGAAATACGGCCTGCGCGATTACCGTGGCGGTGGACGTTCTTCCGCGCGTGAAACCGCGATGCGCGTAGCGGCAGGGGCGATCGCCAAGAAATACCTGGCGGAAAAGTTCGGCATCGAAATCCGCGGCTGCCTGACCCAGATGGGCGACATTCCGCTGGAGATTAAAGACTGGCGTCAGGTTGAGCTTAATCCGTTCTTTTGTCCCGATGCGGACAAACTTGACGCGCTGGACGAACTGATGCGCGCGCTGAAAAAAGAGGGTGACTCCATCGGCGCGAAAGTGACGGTGATGGCGAGTGGCGTGCCGGCAGGGCTTGGCGAACCGGTTTTTGACCGACTGGATGCGGACATCGCCCATGCGCTGATGAGCATCAATGCGGTGAAAGGCGTGGAGATCGGCGAAGGATTTAACGTGGTGGCGCTGCGTGGCAGCCAGAATCGCGATGAAATCACGGCGCAGGGT\n->aroC_1571\n-GTTTTTCGTCCGGGACACGCGGATTACACCTATGAGCAGAAATACGGCCTGCGCGATTACCGTGGCGGTGGACGTTCTTCCGCGCGTGAAACCGCGATGCGCGTAGCGGCAGGGGCGATTGCCAAGAAATACCTAGCGGAAAAGTTCGGCATCGAAATCCGCGGCTGCCTGACCCAGATGGGCGATATTCCGCTGGAGATTAAAGACTGGCGTCAGGTTGAGCTTAATCCGTTCTTTTGCCCCGATGCAGACAAACTTGACGCGCTGGACGAACTGATGCGCGCGCTGAAAAAAGAGGGCGACTCCATCGGCGCGAAAGTGACGGTGATGGCGAGCGGCGTGCCGGCAGGGCTTGGCGAACCGGTTTTTGACCGACTGGATGCGGACATCGCCCATGGGCTGATGAGCATCAATGCGGTGAAAGGCGTGGAGATCGGCGAAGGATTTAACGTGGTGGCGCTGCGTGGCAGCCAGAATCGCGATGAAATCACGGCGCAGGGT\n->aroC_1572\n-GTTTTTCGTCCGGGACACGCGGATTACACCTATGAGCAGAAATACGGCCTGCGTGATTACCGTGGCGGTGGACGTTCTTCCGCGCGTGAAACCGCGATGCGCGTAGCGGCAGGGGCGATTGCCAAGAAATACCTGGCGGAAAAGTTCGGCATCGAAATCCGCGGCTGCCTGACCCAGATGGGCGATATTCCGCTGGAGATTAAAGACTGGCGTCAGGTTGAGCTTAATCCGTTCTTTTGCCCCGATGCAGACAAACTTGACGCGCTGGACGAACTGATGCGCGCGCTGAAAAAAGAGGGTGACTCCATCGGCGCGAAAGTGACGGTGATGGCGAGCGGCGTGCCGGCAGGGCTTGGCGAACCGGTATTTGACCGACTGGATGCGGACATCGCCCATGCGCTGATGAGCATTAATGCGGTGAAAGGCGTGGAGATCGGCGAAGGATTTAACGTGGTGGCGCTGCGCGGCAGCCAGAATCGCGATGGAATCACGGCGCAGGGT\n->aroC_1573\n-GTTTTTCGTCCGGGACACGCGGATTACACCTATGAGCAGAAATACGGCCTGCGCGATTACCGTGGCGGTGGACGTTCTTCCGCGCGTGAAACCGCGATGCGCGTAGCGGCAGGGGCGATCGCCAAGAAATACCTGGCGGAAAAGTTCGGTATCGAAATCCGCGGCTGCCTGACCCAGATGGGCGACATTCCGCTGGAGATTAAAGACTGGCGTCAGGTTGAGCTTAATCCGTTCTTTTGCCCCGATGCAGACAAACTTGACGCGCTGGACGAACTGATGCGCGCGCTGAAAAAAGAGGGTGACTCCATCGGCGCGAAAGTGACGGTGATGGCGAGCGGCGTGCCGGCAGGGCTTGGCGAACCGGTATTTGACCGACTGGATGCGGACATCGCCCATGCGCTGATGAGCATTAATGCGGTGAAAGGCGTGGAGATCGGCGAAGGATTTAACGTGGTGGCGCTGCGCGG
CAGCCAGAATCGCGATGAAATCACGGCGCAGGGT\n'
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/seqsero2s_db/kmer/salmonella_config.txt
--- a/SeqSero2S/seqsero2s_db/kmer/salmonella_config.txt Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
@@ -1,10 +0,0 @@
-[loci]
-aroC kmer/salmonella_aroC.tfa
-dnaN kmer/salmonella_dnaN.tfa
-hemD kmer/salmonella_hemD.tfa
-hisD kmer/salmonella_hisD.tfa
-purE kmer/salmonella_purE.tfa
-sucA kmer/salmonella_sucA.tfa
-thrA kmer/salmonella_thrA.tfa
-[profile]
-profile kmer/salmonella_profile.txt
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/seqsero2s_db/kmer/salmonella_dnaN.tfa
--- a/SeqSero2S/seqsero2s_db/kmer/salmonella_dnaN.tfa Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,2440 +0,0 @@\n->dnaN_1\n-ATGGAGATGGTCGCGCGCGTTACGCTTTCTCAGCCGCATGAGCCAGGCGCCACTACCGTGCCGGCGCGGAAATTCTTTGATATCTGCCGCGGCCTGCCGGAGGGCGCGGAGATTGCCGTTCAGTTGGAAGGCGATCGGATGCTGGTGCGTTCTGGCCGTAGCCGCTTCTCGCTGTCTACGCTGCCTGCCGCCGATTTCCCGAATCTTGACGACTGGCAAAGCGAAGTTGAATTTACGCTGCCGCAGGCCACGATGAAGCGCCTGATTGAAGCGACCCAGTTTTCGATGGCCCATCAGGATGTGCGCTACTACTTAAACGGTATGCTGTTTGAAACGGAAGGTAGCGAACTGCGCACTGTTGCGACCGACGGCCACCGTCTGGCGGTGTGCTCAATGCCGCTGGAGGCGTCTTTACCTAGCCACTCGGTGATTGTGCCGCGTAAAGGCGTGATTGAACTGATGCGTATGCTCGACGGTGGCGAAAACCCGCTGCGCGTGCAG\n->dnaN_2\n-ATGGAGATGGTCGCGCGCGTTACGCTTTCTCAGCCGCATGAGCCGGGCGCCACTACCGTGCCGGCGCGGAAATTCTTTGATATCTGCCGCGGCCTGCCGGAGGGCGCGGAGATTGCCGTTCAGTTGGAAGGCGATCGGATGCTGGTGCGTTCTGGCCGTAGCCGCTTCTCGCTGTCTACGCTGCCTGCCGCCGATTTCCCGAATCTTGACGACTGGCAAAGCGAAGTTGAATTTACGCTGCCGCAGGCCACGATGAAGCGCCTGATTGAAGCGACCCAGTTTTCGATGGCTCATCAGGATGTGCGCTACTACTTAAACGGTATGCTGTTTGAAACGGAAGGTAGCGAACTGCGCACTGTCGCGACCGACGGCCACCGCCTGGCGGTGTGCTCAATGCCGCTGGAAGCGTCTTTACCCAGCCACTCGGTGATTGTGCCGCGTAAAGGCGTGATTGAACTGATGCGTATGCTCGACGGCGGTGAAAACCCGCTGCGCGTGCAG\n->dnaN_3\n-ATGGAGATGGTCGCGCGCGTTACGCTTTCTCAGCCGCATGAGCCAGGCGCCACTACCGTGCCGGCGCGGAAATTCTTTGATATCTGCCGCGGCCTGCCGGAGGGCGCGGAGATTGCCGTTCAGTTGGAAGGCGATCGGATGTTGGTGCGTTCTGGCCGTAGCCGCTTCTCGCTGTCTACGCTGCCTGCCGCCGATTTCCCGAATCTTGACGACTGGCAAAGCGAAGTTGAATTTACGCTGCCGCAGGCCACGATGAAGCGCCTGATTGAAGCGACCCAGTTTTCGATGGCCCATCAGGATGTGCGCTACTACTTAAACGGTATGCTGTTTGAAACGGAAGGTAGCGAACTGCGCACTGTCGCGACCGACGGCCACCGTCTGGCGGTGTGCTCAATGCCGCTGGAAGCGTCTTTACCCAGCCACTCGGTGATTGTGCCGCGTAAAGGCGTGATTGAACTGATGCGTATGCTCGACGGCGGCGAAAACCCGCTGCGCGTGCAG\n->dnaN_4\n-ATGGAGATGGTCGCGCGCGTTACGCTTTCTCAGCCGCATGAGCCGGGCGCCACTACCGTGCCGGCGCGGAAATTCTTTGATATCTGCCGCGGCCTGCCGGAGGGCGCGGAGATTGCCGTTCAGTTGGAAGGCGATCGGATGCTGGTGCGTTCTGGCCGTAGCCGCTTCTCGCTGTCTACGCTGCCTGCCGCCGATTTCCCGAATCTTGACGACTGGCAAAGCGAAGTTGAATTTACGCTGCCGCAGGCCACGATGAAGCGCCTGATTGAAGCGACCCAGTTTTCGATGGCTCATCAGGATGTGCGCTACTACTTAAACGGTATGCTGTTTGAAACGGAAGGTAGCGAACTGCGCACTGTCGCGACCGACGGCCACCGCCTGGCGGTGTGCTCAATGCCGCTGGAAGCGTCTTTACCCAGCCACTC
GGTGATTGTGCCGCGTAAAGGCGTGATTGAACTGATGCGTATGCTCGACGGCGGCGAAAACCCGCTGCGCGTGCAG\n->dnaN_5\n-ATGGAGATGGTCGCGCGCGTTACGCTTTCTCAGCCGCATGAGCCGGGCGCCACTACCGTGCCGGCGCGGAAATTCTTTGATATCTGCCGCGGCCTGCCGGAGGGCGCGGAGATTGCCGTTCAGTTGGAAGGCGATCGGATGCTGGTGCGTTCTGGCCGTAGCCGCTTCTCGCTGTCCACGCTTCCTGCCGCCGATTTCCCGAATCTTGACGACTGGCAAAGCGAAGTTGAATTTACGCTGCCGCAGGCCACGATGAAGCGCCTGATTGAAGCGACCCAGTTTTCGATGGCTCATCAGGATGTGCGCTACTACTTAAACGGTATGCTGTTTGAAACGGAAGGTAGCGAACTGCGCACTGTCGCGACCGACGGCCACCGCCTGGCGGTGTGCTCAATGCCGCTGGAAGCGTCTTTACCCAGCCACTCGGTGATTGTGCCGCGTAAAGGCGTGATTGAACTGATGCGTATGCTCGACGGCGGCGAAAACCCGCTGCGCGTGCAG\n->dnaN_6\n-ATGGAGATGGTCGCGCGCGTTACGCTTTCTCAGCCGCATGAGCCAGGCGCCACTACCGTGCCGGCGCGGAAATTCTTTGATATCTGCCGCGGCCTGCCGGAGGGCGCGGAGATTGCCGTTCAGTTGGAAGGCGATCGGATGCTGGTGCGTTCTGGCCGTAGCCGCTTCTCGCTGTCTACGCTGCCTGCCGCCGATTTCCCGAATCTTGACGACTGGCAAAGCGAAGTTGAATTTACGCTGCCGCAGGCCACGATGAAGCGCCTGATTGAAGCGACCCAGTTTTCGATGGCCCATCAGGATGTGCGCTACTACTTAAACGGTATGCTGTTTGAAACGGAAGGTAGCGAACTGCGTACTGTCGCGACCGACGGCCACCGCCTGGCGGTGTGCTCAATGCCGCTGGAAGCGTCTTTACCCAGCCACTCGGTGATTGTGCCGCGTAAAGGCGTGATTGAACTGATGCGTATGCTCGACGGCGGCGAAAACCCGCTGCGCGTGCAG\n->dnaN_7\n-ATGGAGATGGTCGCGCGCGTTACGCTTTCTCAGCCGCATGAGCCAGGCGCCACTACCGTGCCGGCGCGGAAATTCTTTGATATCTGCCGCGGCCTGCCGGAGGGCGCGGAGATTGCCGTTCAGTTGGAAGGCGATCGGATGCTGGTGCGTTCTGGCCGTAGCCGCTTCTCGCTGTCTACGCTGCCTGCCGCCGATTTCCCGAATCTTGACGACTGGCAAAGCGAAGTTGAATTTACGCTGCCGCAGGCCACGATGAAGCGCCTGATTGAATCGACCCAGTTTTCGATGGCCCATCAGGATGTGCGCTACTACTTAAACGGTATGCTGTTTGAAACGGAAGGTAGCGAACTGCGCACTGTCGCGACCGACGGCCACCGTCTGGCGGTGTGCTCAATGCCGCTGGAAGCGTCTTTACCCAGCCACTCGGTGATTGTGCCGCGTAAAGGCGTGATTGAACTGATGCGTATGCTCGACGGCGGCGAAAACCCGCTGCGCGTGCAG\n->dnaN_8\n-ATGGAGATGGTCGCGCGCGTTACGCTTTCTCAGCCGCATGAGCCGGGTGCTACTACCGTGCCGGCGCGGAAATTCTTTGATATCTGCCGCGGCCTGCCGGAGGGCGCGGAGATTGCCGTTCAGTTGGAAGGCGATCGGATGCTGGTGCGTTCTGGCCGTAGCCGCTTCTCGCTGTCTACACTGCCTGCCGCCGATTTCCCGAATCTTGACGACTGGCAAAGCGAAGTTGAATTTACGCTGCCGCAGGCCACGATGAAGCGCCTGATTGAAGCGACCCAGTTTTCGATGGCCCATCAGGATGTGCGCTACTACTTAAACGGTATGCTGTTTGAAACGGAAGGCAGCGAACTGCGCACTGTTGCGACCGAC
GGCCACCGTCTGGCGGT'..b'GAGATTGCCGTTCAGTTGGAAGGCGATCGGATGCTGGTGCGTTCTGGCCGTAGCCGCTTCTCGCTGTCTACGCTGCCTGCCGCCGATTTCCCGAATCTTGACGACTGGCAAAGCGAAGTTGAATTTACGCTGCCGCAGGCCACGATGAAGCGCCTGATTGAAGCGACCCAGTTTTCGATGGCCCATCAGGATGTGCGCTACTACTTAAACGGTATGCTGTTTGAAACGGAAGGTAGCGAACTGCGCACTGTCGCGACCGACGGCCACCGCCTGGCGGTGTGCTCAATGCCGCTGGAAGCGTCTTTACCCAGCCACTCGGTGATTGTGCCGCGTAAAGGCGTGATTGAACTGATGCGTATGCTCGACGGCGGCGAAAACCCGCTGCGCGTGCAG\n->dnaN_1326\n-ATGGAGATGGTCGCGCGCGTTACGCTTTCTCAGCCGCATGAGCCGGGCGCCACTACCGTGCCGGCGCGGAAATTCTTTGATATCTGCCGCGGCCTGCCGGAGGGCGCGGAGATTGCCGTTCAGTTGGAAGGCGATCGGATGCTGGTGCGTTCTGGCCGTAGCCGCTTCTCGCTGTCTACGCTGCCTGCCGCCGATTTCCCGAATCTTGACGACTGGCAAAGCGAAGTTGAATTTACGCTGCCGCAGGCTACGATGAAGCGCCTGATTGAAGCGACCCAGTTTTCGATGGCCCATCAGGATGTGCGCTACTACTTAAACGGTATGCTGTTTGAAACGGAAGGCAGCGAACTGCGCACTGTTGCGACCGACGGCCACCGCCTGGCGGTGTGCTCAATGCCGCTGGAAGCGTCTTTACCCAGCCATTCGGTGATTGTGCCGCGTAAAGGCGTGATTGAACTGATGCGTATGCTCGACGGTGGCGAAAACCCGCTGCGCGTGCAG\n->dnaN_1328\n-ATGGAGATGGTCGCGCGCGTTACGCTTTCTCAGCCGCATGAGCCGGGCGCCACTACCGTGCCGGCGCGGAAATTCTTTGATATCTGCCGCGGCCTGCCGGAGGGCGCGGAGATTGCCGTTCAGTTGGAAGGCGATCGGATGCTGGTGCGTTCTGGCCGTAGCCGCTTCTCGCTGTCTACGCTGCCTGCCGCCGATTTCCCGAATCTTGACGACTGGCAAAGCGAAGTTGAATTTACGCTGCCGCAGGCCACGATGAAGCGCCTGATTGAAGCGACCCAGTTTTCGATGGCTCATCAGGATGTGCGCTACTACTTAAACGGTATGCTGTTTGAAACGGAAGGTAACGAACTGCGCACTGTCGCGACCGACGGCCACCGCCTGGCGGTGTGCTCAATGCCGCTGGAAGCGTCTTTACCCAGCCACTCGGTGATTGTGCCGCGTAAAGGCGTGATTGAACTGATGCGTATGCTCGACGGCGGTGAAAACCCGCTGCGCGTGCAG\n->dnaN_1329\n-ATGGAGATGGTCGCGCGCGTTACGCTTTCTCAGCCGCATGAGCCAGGCGCCACTACCGTGCCGGCGCGGAAATTCTTTGATATCTGCCGCGGCCTGCCGGAGGGCGCGGAGATTGCCGTTCAGTTGGAAGGCGATCGGATGCTGGTGCGTTCTGGCCGTAGCCGCTTCTCGCTGTCTACACTGCCTGCCGCCGATTTCCCGAATCTTGACGACTGGCAAAGCGAAGTTGAATTTACGCTGCCGCAGGCCACGATGAAGCGCCTGATTGAAGCGACCCAGTTTTCGATGGCCCATCAGGATGTGCGCTACTACTTAAACGGTATGCTGTTTGAAACGGAAAGTAGCGAACTGCGCACTGTCGCGACCGACGGCCACCGTCTGGCGGTGTGCTCAATGCCGCTGGAAGCGTCTTTACCCAGCCACTCGGTGATTGTGCCGCGTAAAGGCGTGATTGAACTGATGCGTATGCTCGACGGCGGCGAAAACCCGCTGCGCGTGCAG\n->dnaN_1330\n-ATGGAGATGGTCGCGCGC
GTTACGCTTTCTCAGCCGCATGAGCCGGGCGCTACTACCGTGCCGGCGCGGAAATTCTTTGATATCTGCCGCGGCCTGCCGGAGGGCGCGGAGATTGCCGTTCAGTTGGAAGGCGATCGGATGCTGGTGCGTTCTGGCCGTAGCCGCTTCTCGCTGTCTACGCTGCCTGCCGCCGATTTCCCGAATCTTGACGACTGGCAAAGCGAAGTTGAATTTACGCTGCCGCAGGCCACGATGAAGCGCTTAATTGAAGCGACCCAGTTTTCGATGGCTCATCAGGATGTGCGCTACTACTTAAACGGTATGCTGTTTGAAACGGAAGGTAGCGAACTGCGCACTGTCGCGACCGACGGCCACCGTCTGGCGGTGTGTTCAATGCCGCTGGAAGCGTCTTTACCCAGCCACTCGGTGATTGTGCCGCGTAAAGGCGTGATTGAACTGATGCGTATGCTCGACGGCGGCGAAAACCCGCTGCGCGTGCAG\n->dnaN_1331\n-ATGGAGATGGTCGCGCGCGTTACGCTTTCTCAGCCGCATGAGCCGGGTGCTACTACCGTGCCGGCGCGGAAATTCTTTGATATCTGCCGCGGCCTGCCGGAGGGCGCGGAGATTGCCGTTCAGTTGGAAGGCGATCGGATGCTGGTGCGTTCTGGCCGTAGCCGCTTCTCGCTGTCTACGCTGCCTGCCGCCGATTTCCCGAATCTTGACGACTGGCAAAGCGAAGTTGAATTTACGCTGCCGCAGGCCACGATGAAGCGCCTGATTGAAGCGACCCAGTTTTCGATGGCTCATCAGGACGTGCGCTACTACTTAAACGGTATGCTGTTTGAAACGGAAGGTAGCGAACTGCGCACTGTCGCGACCGACGGCCACCGTCTGGCGGTGTGCTCAATGCCGCTGGAAGCGTCTTTACCCAGCCACTCGGTGATTGTGCCGCGTAAAGGCGTGATTGAACTGATGCGTATGCTCGACGGCGGCGAAAACCCGCTGCGCGTGCAG\n->dnaN_1333\n-ATGGAGATGGTCGCGCGCGTTACGCTTTCTCAGCCGCATGAGCCGGGTGCTACTACCGTGCCGGCGCGGAAATTCTTTGATATCTGCCGCGGCCTGCCGGAGGGCGCGGAGATTGTCGTTCAGTTGGAAGGCGATCGGATGTTGGTGCGTTCTGGCCGTAGCCGCTTCTCGCTGTCTACGCTGCCTGCCGCCGATTTCCCGAATCTTGACGACTGGCAAAGCGAAGTTGAATTTACGCTGCCGCAGGCCACGATGAAGCGCCTGATTGAAGCGACCCAGTTTTCGATGGCCCATCAGGATGTGCGCTACTACTTAAACGGTATGCTGTTTGAAACGGAAGGTAGCGAACTGCGCACTGTCGCGACCGACGGCCACCGTCTGGCGGTGTGCTCAATGCCGCTGGAAGCGTCTTTACCCAGCCACTCGGTGATTGTGCCGCGTAAAGGCGTGATTGAACTGATGCGTATGCTCGACGGCGGCGAAAACCCGCTGCGCGTGCAG\n->dnaN_1334\n-ATGGAGATGGTCGCGCGCGTTACGCTTTCTCAGCCGCATGAGCCAGGCGCCACTACCGTGCCGGCGCGGAAATTCTTTGATATCTGCCGCGGCCTGCCGGAGGGCGCGGAGATTGCCGTTCAGTTGGAAGGCGATCGGATGTTGGTGCGTTCTGGCCGTAGCCGCTTCTCGCTGTCTACGCTGCCTGCCGCCGATTTCCCGAATCTTGACGACTGGCAAAGCGAAGTTGAATTTACGCTGCCACAGGCCACGATGAAGCGCCTGATTGAAGCGACCCAGTTTTCGATGGCCCATCAGGATGTGCGCTACTACTTAAACGGTATGCTGTTTGAAACGGAAGGTAGCGAACTGCGCACTGTCGCGACCGACGGCCACCGTCTGGCGGTGTGCTCAATGCCGCTGGAAGCGTCTTTACCCAGCCACTCGGTGATTGTGCCGCGTAAAGGCGTGATTGAACTGATGCGTAT
GCTCGACGGCGGCGAAAACCCGCTGCGCGTGCAG\n'
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/seqsero2s_db/kmer/salmonella_hemD.tfa
--- a/SeqSero2S/seqsero2s_db/kmer/salmonella_hemD.tfa Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,2326 +0,0 @@\n->hemD_1\n-GCAACGCTGACGGAAAACGATCTGGTTTTTGCCCTTTCACAGCACTCCGTCGCCTTTGCTCACGCCCAGCTCCAGCGGGATGGACGAAACTGGCCTGCGTCGCCGCGCTATTTCTCGATTGGCCGCACTACGGCGCTCGCCCTTCATACCGTTAGCGGGTTCGATATTCGTTATCCATTGGATCGGGAAATCAGCGAAGCCTTGCTACAATTACCTGAATTACAAAATATTGCGGGCAAACGCGCGCTGATTTTGCGTGGCAATGGCGGCCGCGAACTGCTGGGCGAAACCCTGACAGTTCGCGGAGCCGAAGTCAGTTTTTGTGAATGTTATCAACGATGTGCGAAACATTACGATGGCGCGGAAGAAGCGATGCGCTGGCATACTCGCGGCGTAACAACGCTTGTTGTTACCAGCGGCGAGATGTTGCAA\n->hemD_2\n-GCAACGCTGACGGAAAACGATCTGGTTTTTGCCCTTTCACAGCACTCCGTCGCCTTTGCTCACGCCCAGCTCCAGCGGGATGGACGAAACTGGCCTGCGTCGCCGCGCTATTTCTCGATTGGCCGCACCACGGCGCTCGCCCTTCATACCGTTAGCGGGTTCGATATTCGTTATCCATTGGATCGGGAAATCAGCGAAGCCTTGCTACAATTACCTGAATTACAAAATATTGCGGGCAAACGCGCGCTGATTTTGCGTGGCAATGGCGGCCGCGAACTGCTGGGCGAAACCCTGACAGTTCGCGGAGCCGAAGTCAGTTTTTGTGAATGTTATCAACGATGTGCGAAACATTACGATGGCGCGGAAGAAGCGATGCGCTGGCATACTCGCGGCGTAACAACGCTTGTTGTTACCAGCGGCGAGATGTTGCAA\n->hemD_3\n-GCGACACTGACGGAAAACGATCTGGTTTTTGCCCTTTCACAGCACGCCGTCGCCTTTGCTCACGCCCAGCTCCAGCGGGATGGCCGAAACTGGCCTGCGTCGCCGCGCTATTTCGCGATTGGCCGCACCACGGCGCTCGCCCTTCATACCGTTAGCGGGTTCGATATTCGTTATCCATTGGATCGGGAAATCAGCGAAGCCTTGCTACAATTACCTGAATTACAAAATATTGCGGGCAAACGCGCGCTGATTTTGCGTGGCAATGGCGGCCGCGAACTGCTGGGCGAAACCCTGACAGCTCGCGGAGCCGAAGTCAGTTTTTGTGAATGTTATCAACGATGTGCGAAACATTACGATGGCGCGGAAGAAGCGATGCGCTGGCATACTCGCGGCGTAACAACGCTTGTTGTTACCAGCGGCGAGATGTTGCAA\n->hemD_4\n-GCGACGCTGACGGAAAACGATCTGGTTTTTGCCCTTTCACAGCACGCCGTCGCCTTTGCTCACGCCCAGCTCCAGCGGGATGGCCGAAACTGGCCTGCGCCGCCGCGCTATTTCGCGATTGGCCGCACCACGGCGCTCGCCCTTCATACCGTTAGCGGGTTCGATATTCGTTATCCATTGGATCGGGAAATCAGCGAAGCCTTGCTACAATTACCTGAATTACAAAATATTGCGGGCAAACGCGCGCTGATTTTGCGTGGCAATGGCGGCCGCGAACTGCTGGGCGAAACCCTGACAGCTCGCGGAGCCGAAGTCAGTTTTTGTGAATGTTATCAACGATGTGCGAAACATTACGATGGCGCGGAAGAAGCGATGCGCTGGCATACTCGCGGCGTAACAACGCTTGTTGTTACCAGCGGCGAGATGTTGCAA\n->hemD_5\n-GCGACACTGACGGAAAACGATCTGGTTTTTGCCCTTTCACAGCACGCCGTCGCCTTTGCTCACGCCCAGCTCCAGCGGGATGGCCGAAACTGGCCTGCGTCGCCGCGCTATTTCGCGATTGGCCGCACCACGGCGCTCGCCCTTCATACCGTTAGCGGGTTCGATATTCGTTATCCATTGGATCGGG
AAATCAGCGAAGCCTTGCTACAATTACCTGAATTACAAAATATTGCGGGCAAACGCGCGCTAATTTTGCGTGGCAATGGCGGCCGCGAACTGCTGGGCGAAACCCTGACAGCTCGCGGAGCCGAAGTCAGTTTTTGTGAATGTTATCAACGATGTGCGAAACATTACGATGGCGCGGAAGAAGCGATGCGCTGGCATACTCGCGGCGTAACAACGCTTGTTGTTACCAGCGGCGAGATGTTGCAA\n->hemD_6\n-GCGACGCTCGCGGAAAACGATCTGGTTTTTGCCCTTTCACAGCACGCTGTCGCCTTTGCTCACGCCCAGCTCCAGCGGGATGGTCGAAACTGGCCTGCGTCGCCGCGCTATTTCGCGATTGGCCGCACCACGGCGCTCGCCCTTCATACCGTTAGCGGGTTCGATATTCGTTATCCATTGGATCGGGAAATCAGCGAAGCCTTGCTACAATTACCTGAATTACAAAATATTGCGGGCAAACGCGCGCTGATTTTGCGTGGCAATGGCGGCCGCGAACTGCTGGGCGAAACCCTGACAGCGCGCGGAGCCGAAGTCAGTTTTTGTGAATGTTATCAACGATGTGCGAAACATTACGATGGCGCGGAAGAAGCGATGCGCTGGCATACTCGCGGCGTAACAACGCTTGTTGTTACCAGCGGCGAAATGTTGCAA\n->hemD_7\n-GCGACGCTGACGGAAAACGATCTGGTTTTTGCCCTTTCACAGCACGCCGTCGCCTTTGCTCACGCCCAGCTCCAGCGGGATGGCCGAAACTGGCCTGCGTCGCCGCGCTATTTCGCGATTGGCCGCACCACGGCGCTCGCCCTTCATACCGTTAGCGGGTTCGATATTCGTTATCCATTGGATCGGGAAATCAGCGAAGCCTTGCTACAATTACCTGAATTACAAAATATTGCGGGCAAACGCGCGCTAATTTTGCGTGGCAATGGCGGCCGCGAACTGCTGGGCGAAACCCTGACAGCTCGCGGAGCCGAAGTCAGTTTTTGTGAATGTTATCAACGATGTGCGAAACATTACGATGGCGCGGAAGAAGCGATGCGCTGGCATACTCGCGGCGTAACAACGCTTGTTGTTACCAGCGGCGAGATGTTGCAA\n->hemD_8\n-GCGACGCTGACGGAAAACGATCTGGTTTTTGCCCTTTCACAGCACGCCGTCGCCTTTGCTCACGCCCAGCTCCAGCGGGATGGCCGAAACTGGCCTGCGTCGCCGCGCTATTTCGCGATTGGCCGCACCACGGCGCTCGCCCTTCATACCGTTAGCGGGTTCGATATTCGTTATCCATTGGATCGGGAAATCAGCGAAGCCTTGCTACAATTACCTGAATTACAAAATATTGCGGGCAAACGCGCGCTGATTTTGCGTGGCAATGGCGGCCGCGAACTGCTGGGCGAAACCCTGACAGCTCGCGGAGCCGAAGTCAGTTTTTGTGAATGTTATCAACGATGTGCGAAACATTACGATGGCGCGGAAGAAGCGATGCGCTGGCATACTCGCGGCGTAACAACGCTTGTTGTTACCAGCGGCGAGATGTTGCAA\n->hemD_9\n-GCGACGCTGACGAAAAACGATCTGGTTTTTGCCCTTTCACAGCACGCCGTCGCCTTTGCTCACGCCCAGCTCCAGCGGGATGGCCGACACTGGCCTGCGTCGCCGCGCTATTTCGCGATTGGCCGCACCACGGCGCTCGCCCTTCATACCGTTAGCGGGTTCGATATTCGTTATCCATTGGATCGGGAAATCAGCGAAGCCTTGCTACAATTACCTGAATTACAAAATATTGCGGGCAAACGCGCGCTGATTTTGCGTGGCAATGGCGGCCGCGAACTGCTGGGCGAAACCCTGACAGCTCGCGGAGCCGAAGTCAGTTTTTGTGAATGTTATCAACGATGTGCGAAACATTACGATGGCGCGGAAGAAGCGATGCGCTGGCATACTCGCGGCGTAACAACGCTTGT
TGTTACCAGCGGCGAGATG'..b'GACGTTGACGGAAAACGATCTGGTTTTTGCCCTTTCACAGCACGCCGTCGCCTTTGCCCACGCCCAACTCCAGCGAGATGGTCGAAACTGGCCTGCGTCGCCGCGCTATTTCGCGATTGGTCGCACCACGGCGCTCGCCCTTCATACCGTTAGCGGGTTCGATATTCGTTATCCATTGGATCGGGAAATCAGCGAAGTCTTGCTACAATTACCTGAATTACAAAATATTGCGGGCAAACGCGCGCTGATTTTGCGTGGCAATGGCGGTCGCGAACTGCTGGGCGAAACCCTGACAGCTCACGGAGCCGAAGTCAGTTTTTGTGAATGTTATCAACGAAGTGCGAAACATTACGATGGCGCAGAAGAGGCGATGCGCTGGCATACTCGCGGCGTAACGACGCTTGTTGTCACCAGCGGCGAGATGTTGCAA\n->hemD_1265\n-GCGACTCTGACGGAAAACGATCTGGTTTTTGCCCTTTCACAGCACGCCGTCGCCTTTGCTCACGCCCAGCTCCAGCGGGATGGTCGAAACTGGCCTGCGTCGCCGCGCTATTTCGCGATTGGCCGCACCACGGCGCTCGCCCTTCATACCGTTAGCGGGTTCGATATTCGTTATCCATTGGATCGGGAAATCAGCGAAGCCTTGCTACAATTACCTGAATTACAAAATATTGCGGGCAAACGCGCGCTGATTTTGCGTGGCAATGGCGGCCGCGAACTGCTGGGCGAAACCCTGACAGCTCGCGGAGCCGAAGTCAGTTTTTGTGAATGTTATCAACGATGTGCGAAACATTACGATGGCTCGGAAGAAGCGATGCGCTGGCATACTCGCGGCGTAACAACACTTGTTGTTACCAGCGGCGAGATGTTGCAA\n->hemD_1268\n-GCGACGCTGACGGAAAACGATCTGGTTTTTGCCCTTTCACAGCACGCTGTCGCCTTTGCTCACGCCCAGCTCCAGCGGGATGGTCGAAACTGGCCTGTGGCGCCGCGCTATTTTGCGATTGGCCGCACCACGGCGCTCGCCCTTCATACCGTTAGCGGGTTCGATATTCGTTATCCATTGGATCGGGAAATCAGCGAAGCCTTGCTACAATTACCTGAATTACAAAATATTGCGGGCAAACGCGCGCTGATTTTGCGTGGCAATGGCGGCCGCGAACTGCTGGGCGAAACCCTGACAGCGCGCGGAGCCGAAGTCAGTTTTTGTGAATGTTATCAACGATGTGCGAAACATTACGATGGCGCGGAAGAAGCGATGCGCTGGCATACTCGCGGCGTAACAACGCTTGTTGTTACCAGCGGCGAGATGTTGCAA\n->hemD_1269\n-GCGACGCTGACGGAAAACGATCTGGTTTTTGCCCTTTCACAGCACGCTGTCGCCTTTGCTCACGCCCAGCTCCAGCGGGATGGTCGAAACTGGCCTGTGGCGCCGCGCTATTTCGCGATTGGCCGCACCACGGCGCTCGCCCTTCATACCGTTAGCGGGTTCGATATTCGTTATCCATTGGATCGGGAAATCAGCGAAGCCTTGCTACAATTACCTGAATTACAAAATATTGCGGGCAAACGCGCGCTGATTTTGCGTGGCAATGGCGGCCGCGAACTGCTGGGCGAAACCCTGACAGCGCGCGGAGCCGAAGTCAGTTTTTGTGAATGTTATCAACGATGTGCGAAACATTACGATGGCGCGGAAGAAGCGATGCGCTGGCATACTCGCGGTGTAACAACGCTTGTTGTTACCAGCGGCGAGATGTTGCAA\n->hemD_1270\n-GCGACGCTGACGGAAAACGATCTGGTTTTTGCCCTTTCACAGCACGCCGTCGCCTTTGCCCACGCCCAGATCCAGCAGGATGGTCGAAACTGGCCTGCGTCGCCGCGCTATTTCGCGATTGGCCGCACCACGGCGCTCGCCCTTCATACCGTTAGCGGATTCGATATTCGTTATCCATTGGGTCGG
GAAATCAGCGAAGTCTTGCTACAATTACCTGAATTACAAAATATTGCGGGCAAACGCGCGCTGATTTTGCGTGGCAATGGCGGTCGCGAACTGCTGGGCGAAACCCTGACAGCTCGCGGAGCCGAAGTCAATTTTTGTGAATGTTATCAACGAAGTGCGAAACATTACGATGGCGCGGAAGAAGCGATGCGCTGGCATGCTCGCGGCATAACAACGCTTGTTGTCACCAGCGGCGAGATGTTGCAA\n->hemD_1271\n-GCGACGCTGACGGAAAACGATCTGGTTTTTGCCCTTTCACAGCACGCTGTCGCCTTTGCTCACGCCCAGCTCCAGCGGGATGGCCGAAACTGGCCTGTGGCGCCGCGCTATTTCGCGATTGGCCGCACCACGGCGCTCGCCCTTCATACCGTTAGCGGGTTCGATATTCGTTATCCATTGGATCGGGAAATCAGCGAAGCCTTGCTACAATTACCTGAATTACAAAATATTGCGGGCAAACGCGCGCTGATTTTGCGTGGCAATGGCGGCCGCGAACTGCTGGGCGAAACCCTGACAGCGCGCGGAGCCGAAGTCAGTTTTTGTGAATGTTATCAACGATGTGCGAAACATTACGATGGCGCGGAAGAAGCGATGCGCTGGCATACTCGCGGCGTAACAACGCTTGTTGTTACCAGCGGCGAGATGTTGCAA\n->hemD_1272\n-GCGACGCTGACGGAAAACGATCTGGTTTTTGCCCTTTCACAGCACGCCGTCGCCTTTGCTCACGCCCAGCTCCAGCGGGATGGTCGAAACTGGCCTGTGGCGCCGCGCTATTTCGCGATTGGCCGCACCACGGCGCTCGCCCTTCATACCGTTAGCGGGTTCGATATTCGTTATCCATTGGATCGGGAAATCAGCGAAGCCTTGCTACAATTACCTGAATTACAAAATATTGCGGGCAAACGCGCGCTGATTTTGCGTGGCAATGGCGGCCGCGAACTGCTGGGCGAAACCCTGACAGCTCGCGGAGCCGAAGTCAGTTTTTGTGAATGTTATCAACGATGTGCGAAACATTACGATGGCGCGGAAGAAGCGATGCGCTGGCATACTCGCGGCGTAACAACACTTGTTGTTACCAGCGGCGAGATGTTGCAA\n->hemD_1273\n-GCGAAGCTGACGGAAAAAGATCTGGTTTTTGCCCTTTCACAGCACGCCGTCGCCTTTGCTCACGCCCAGCTCCAGCGGGATGGTCGAAACTGGCCTGCGTCGCCGCGCTATTTCGCGATTGGCCGCACCACGGCGCTCGCCCTTCATACCGTTAGCGGGTTCGATATTCGTTATCCATTGGATCGGGAAATCAGCGAAGCCTTGCTACAATTACCTGAATTACAAAATATTGCGGGCAAACGCGCGCTGATTTTGCGTGGCAATGGCGGCCGCGAACTGCTGGGCAAAACCCTGACAGCTCGCGGAGCCGAAGTCAGTTTTTGTGAATGTTATCAACGATGTGCGAAACATTACGATGGCGCGGAAGAAGCGATGCGCTGGCATACTCGCGGCGTAACAACGCTTGTTGTTACCAGCGGCGAGATGTTGCAA\n->hemD_1275\n-GCGACGCTGACGGAAAACGATCTGGTTTTTGCCCTTTCACAGCACGCTGTCGCCTTTGCTCACACCCAGCTCCAGCGGGATGGTCGAAACTGGCCTGCGTCGCCGCGCTATTTCGCGATTGGCCGCACCACGGCGCTCGCCCTTCATACCGTTAGCGGGTTCGATATTCGTTATCCATTGGATCGGGAAATCAGCGAAGCCTTGCTACAATTACCTGAATTACAAAATATTGCGGGCAAACGCGCGCTGATTTTGCGTGGCAATGGCGGCCGCGAACTGCTGGGCGAAACCCTGACAGCTCGCGGAGCCGAAGTCAGTTTTTGTGAATGTTATCAACGATGTGCGAAACATTACGATGGCGCGGAAGAAGCGATGCGCTGGCATACTCGCGGCG
TAACAACGCTTGTTGTCACCAGCGGCGAGATGTTGCAA\n'
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/seqsero2s_db/kmer/salmonella_hisD.tfa
--- a/SeqSero2S/seqsero2s_db/kmer/salmonella_hisD.tfa Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,3420 +0,0 @@\n->hisD_1\n-ATTGCGGGATGCCAGAAGGTGGTTCTGTGCTCGCCGCCACCCATCGCTGATGAAATCCTCTATGCGGCGCAACTGTGTGGCGTGCAGGAAATCTTTAACGTCGGCGGCGCGCAGGCGATTGCCGCTCTGGCCTTCGGCAGCGAGTCCGTACCGAAAGTGGATAAAATTTTTGGCCCCGGCAACGCCTTTGTAACCGAAGCCAAGCGTCAGGTCAGCCAGCGTCTCGACGGCGCGGCTATCGATATGCCAGCCGGGCCGTCTGAAGTGCTGGTGATCGCCGACAGCGGCGCAACACCGGATTTCGTCGCTTCTGACCTGCTCTCCCAGGCTGAGCACGGCCCGGATTCCCAGGTGATCCTGCTGACGCCGGATGCTGACATTGCCCGCAAGGTGGCGGAGGCGGTAGAACGTCAACTGGCGGAACTGCCGCGCGCGGGCACCGCCCGGCAGGCCCTGAGCGCCAGTCGTCTGATTGTGACCAAAGATTTAGCGCAGTGCGTC\n->hisD_2\n-ATTGCAGGATGCCAGATCGTGGTTCTGTGCTCGCCACCGCCCATCGCTGATGAAATCCTCTATGCGGCGCAACTGTGTGGCGTGCAGGAAATCTTTAACGTCGGCGGCGCGCAGGCGATTGCCGCTCTGGCCTTCGGCAGCGAGTCCGTACCGAAAGTGGATAAAATTTTTGGCCCCGGCAACGCCTTTGTAACCGAAGCCAAGCGTCAGGTCAGCCAGCGCCTCGACGGCGCGGCTATCGATATGCCAGCCGGGCCGTCTGAAGTACTGGTGATCGCCGACAGCGGCGCAACACCGGATTTCGTCGCGTCTGACCTGCTCTCCCAGGCTGAGCACGGTCCGGATTCGCAGGTGATCCTGCTGACGCCTGATGCTGACATTGCCCGCAAGGTGGCGGAGGCGGTAGAACGTCAACTGGCGGAACTGCCGCGCGCGGACACCGCCCGGCAGGCCCTGAGCGCCAGTCGTCTGATTGTGACCAAAGATTTAGCGCAGTGCGTC\n->hisD_3\n-ATTGCGGGATGCCAGAAGGTGGTTCTGTGCTCGCCGCCACCCATCGCTGATGAAATCCTCTATGCGGCGCAACTGTGTGGCGTGCAGGAAATCTTTAACGTCGGCGGCGCGCAGGCGATTGCCGCTCTGGCCTTCGGCAGCGAGTCCGTACCGAAAGTGGATAAAATTTTTGGCCCCGGCAACGCCTTTGTAACCGAAGCCAAGCGTCAGGTCAGCCAGCGTCTCGACGGCGCGGCTATCGATATGCCAGCCGGGCCGTCTGAAGTGCTGGTGATCGCCGACAGCGGCGCAATACCGGATTTCGTCGCTTCTGACCTGCTCTCCCAGGCTGAGCACGGCCCGGATTCCCAGGTGATCCTGCTGACGCCGGATGCTGACATTGCCCGCAAGGTGGCGGAGGCGGTAGAACGTCAACTGGCGGAACTGCCGCGCGCGGGCACCGCCCGGCAGGCCCTGAGCGCCAGTCGTCTGATTGTGACCAAAGATTTAGCGCAGTGCGTC\n->hisD_4\n-ATTGCGGGATGTCAGAACGTGGTTCTGTGCTCGCCGCCGCCCATCGCTGATGAAATCCTCTATGCGGCGCAACTGTGTGGCGTGCAGGAAATCTTTAACGTCGGCGGCGCGCAGGCGATTGCCGCTCTGGCCTTCGGCAGCGAGTCCGTACCGAAAGTGGATAAAATTTTTGGCCCCGGCAACGCCTTTGTAACCGAAGCCAAGCGTCAGGTCAGCCAGCGCCTCGACGGCGCGGCTATCGATATGCCTGCCGGGCCGTCTGAAGTACTGGTGATCGCCGACAGCGGCGCAACACCGGATTTCGTCGCTTCTGACCTGCTCTCCCAGGCTGAGCACGGTCCGGATTCCCAGGTGATTCTGCTGACGCCTGATGCTGACATTGCCCGCAAGGTGGCGGAGGCGGTAGAACGTCAACTGGCGGAGCT
GCCGCGCGCGGACACCGCCCGGCAGGCCCTGAGCGCCAGTCGTCTAATTGTGACCAAAGATTTAGCGCAGTGCGTC\n->hisD_5\n-ATTGCGGGATGTCAGAACGTGGTTCTGTGCTCGCCGCCGCCCATCGCTGATGAAATCCTCTATGCGGCGCAACTGTGTGGCGTGCAGGAAATCTTTAACGTCGGCGGCGCGCAGGCGATTGCCGCTCTGGCCTTCGGCAGCGAGTCCGTACCGAAAGTGGATAAAATTTTTGGCCCCGGCAACGCCTTTGTAACCGAAGCCAAGCGTCAGGTCAGCCAGCGTCTCGACGGCGCGGCTATCGATATGCCAGCCGGGCCGTCTGAAGTACTGGTGATCGCAGACAGCGGCGCAACACCGGATTTCGTCGCTTCTGACCTGCTCTCCCAGGCTGAGCACGGCCCGGATTCCCAGGTGATCCTACTGACGCCTGATGCTGACATTGCCCGCAAGGTGGCGGAGGCGGTAGAACGTCAACTGGCGGAACTGCCGCGCGCGGACACCGCCCGGCAGGCCCTGAGCGCCAGTCGTCTGATTGTGACCAAAGATTTAGCGCAGTGCGTC\n->hisD_6\n-ATTGCGGGATGCCAGAAGGTGGTTCTGTGCTCGCCGCCGCCCATCGCTGATGAAATCCTCTATGCGGCGCAACTGTGTGGCGTGCAGGAAATCTTTAACGTCGGCGGCGCGCAGGCGATTGCCGCTCTGGCCTTCGGCAGCGAGTCCGTACCGAAAGTGGATAAAATTTTTGGCCCCGGCAACGCCTTTGTAACCGAAGCCAAGCGTCAGGTCAGCCAGCGTCTCGACGGCGCGGCTATCGATATGCCAGCCGGGCCGTCTGAAGTACTGGTGATCGCAGACAGCGGCGCAACACCGGATTTCGTCGCTTCTGACCTGCTCTCCCAGGCTGAGCACGGCCCGGATTCCCAGATGATCCTGCTGACGCCTGATGCTGACATTGCCCGCAAGGTGGCGGAGGCGGTAGAACGTCAACTGGCGGAACTGCCGCGCGCGGACACCGCCCGGCAGGCCCTGAGCGCCAGTCGTCTGATTGTGACCAAAGATTTAGCGCAGTGCGTC\n->hisD_7\n-ATTGCGGGATGTCAGAACGTGGTTCTGTGCTCGCCGCCGCCCATCGCTGATGAAATCCTCTATGCGGCGCAACTGTGTGGCGTGCAGGAAATCTTTAACGTCGGCGGCGCGCAGGCGATTGCCGCTCTGGCCTTCGGCAGCGAGTCCGTACCGAAAGTGGATAAAATTTTTGGCCCCGGCAACGCCTTTGTAACCGAAGCCAAACGTCAGGTCAGCCAACGCCTCGACGGCGCGGCTATCGATATGCCAGCCGGGCCGTCTGAAGTACTGGTGATCGCCGACAGCGGCGCAACACCGGATTTCGTCGCTTCTGACCTGCTCTCCCAGGCTGAGCACGGTCCGGATTCGCAGGTGATTCTGCTGACGCCTGATGCTGACATTGCCTGCAAGGTGGCGGAGGCGGTAGAACGTCAACTGGCAGAACTGCCGCGCGCGGACACCGCCAGGCAGGCCCTGAGCGCCAGTCGTCTGATTGTGACCAAAGATTTAGCGCAGTGCGTC\n->hisD_8\n-ATTGCGGGATGTCAGAACGTGGTTCTGTGCTCGCCGCCGCCCATCGCTGATGAAATCCTCTATGCGGCGCAACTGTGTGGCGTGCAGGAAATCTTTAACGTCGGCGGCGCGCAGGCGATTGCCGCTCTGGCCTTCGGCAGCGAGTCCGTACCGAAAGTGGATAAAATTTTTGGCCCCGGCAACGCCTTTGTAACCGAAGCCAAGCGTCAGGTCAGCCAACGCCTCGACGGCGCGGCTATCGATATGCCTGCCGGGCCGTCTGAAGTGCTGGTGATCGCCGACAGCGGCGCAACACCGGATTTCGTCGCTTCTGACCTGCTCTCCCAGGCTGAGCACGGTCCGGATTCGCAGGTGATCCTGCTGACGCCG
GATGCTGACATTGCCCG'..b'GCGCAGGCGATTGCCGCTCTGGCCTTCGGCAGCGAATCCGTACCGAAAGTGGATAAAATTTTTGGCCCCGGCAACGCCTTCGTGACCGAAGCCAAACGTCAGGTCAGCCAGCGTCTCGACGGCGCGGCTATCGATATGCCTGCCGGGCCGTCTGAAGTACTGGTGATCGCCGACAGCGGCGCAACGCCGGATTTCGTCGCTTCTGACCTGCTTTCCCAGGCAGAACACGGCCCGGATTCACAGGTGATTCTTCTGACGCCGGATGCCGACATCGCCCGCAAGGTAGCGGAGGCGGTAGAACGTCAACTGGCTGAACTGCCGCGCGCGGAAACCGCCCGTCAGGCTTTGCGCGCCAGTCGTCTGATTGTGACCAAAGATTTAGCGCAGTGCGTC\n->hisD_1898\n-ATTGCGGGATGCCAGAACGTGGTTCTGTGCTCGCCGCCGCCCATCGCTGATGAAATCCTCTATGCGGCACAACTGTGTGGCGTGCAGGAAATCTTTAACGTCGGCGGCGCGCAGGCGATTGCCGCTCTGGCCTTCGGCAGCGAGTCCGTACCGAAAGTGGATAAAATTTTTGGCCCCGGCAACGCCTTTGTAACCGAAGCCAAGCGTCAGGTCAGCCAACGCCTCGACGGCGCGGCTATCGATATGCCAGCCGGGCCGTCTGAAGTACTGGTGATCGCCGACAGCGGCGCAACACCGGATTTCGTCGCGTCTGACCTGCTCTCCCAGGCTGAGCACGGTCCGGATTCGCAGGTGATCCTGCTGACGCCTGATGCTGACATTGCCCGCAAGGTGGCGGAGGCGGTAGAACGTCAACTTGCAGAACTGCCGCGCGCGGACACCGCCCGGCAGGCCCTGAGCGCCAGTCGTCTGATTGTGACCAAAGATTTAGCGCAGTGCGTC\n->hisD_1899\n-ATTGCGGGATGTCAGAAAGTGGTTCTGTGCTCGCCGCCGCCCATCGCCGATGAAATCCTCTATGCGGCACAACTGTGTGGCATACAGGAGATCTTTAACGTCGGCGGCTCGCAGGCGATTGCCGCTCTGGCCTTCGGCAGCGAATCCGTACCGAAAGTGGATAAAATTTTTGGCCCCGGCAATGCTTTTGTAACTGAAGCCAAGCGTCAGGTCAGTCAGCGTCTCGACGGCGCGGCTATCGATATGCCAGCCGGGCCGTCTGAAGTGCTGGTGATCGCCGACAGCGGCGCAACGCCGGACTTCGTCGCTTCTGACCTGCTCTCCCAGGCAGAACACGGCCCGGATTCCCAGGTGATCCTGCTGACGCCGGATGCTAACATCGCCCGCAGGGTGGCGGAGGCGGTAGAACGTCAACTGGCTGAACTGCCGCGCGCGGACACCGCCCGTCAGGCTTTGCGCGCCAGTCGTCTGATTGTGACCAAAGATTTAGCGCAGTGCGTC\n->hisD_1900\n-ATTGCGGGATGTCAGAACGTGGTTCTGTGCTCGCCGCCGCCCATCGCTGATGAAATCCTCTATGCGGCGCAACTGTGTGGCGTGCAGGAAATCTTTAACGTCGGCGGCGCGCAGGCGATTGCCGCTCTGGCCTTCGGCAGCGAGTCCGTACCGAAAGTGGATAAAATTTTTGGCCCCGGCAACGCCTTTGTAACCGAAGCCAAACGTCAGGTCAGCCAACGCCTCGACGGCGCGGCTATCGATATGCCAGCCGGGCCGTCTGAAGTACTGGTGATCGCCGACAGCGGCGCAACACCGGATTTCGTCGCTTCTGACCTGCTCTCCCAGGCTGAGCACGGTCCGGATTCGCAGGTGATTCTGCTGACGCCTGATGCTGACATTGCCTGCAAGGTGGCGGAGGCGGTAGAACGTCAACTGGCAGAACTGCCGCGTGCGGACACCGCCAGGCAGGCCCTGAGCGCCAGTCGTCTGATTGTGACCAAAGATTTAGCGCAGTGCGTC\n->hisD_1902\n-ATTGCGGGATGTCAGAAC
GTGGTTCTGTGCTCGCCGCCGCCCATCGCTGATGAAATCCTCTATGCGGCGCAACTGTGTGGCGTGCAGGAAATCTTTAACGTCGGCGGCGCGCAGGCGATTGCCGCTCTGGCCTTCGGCAGCGAGTCCGTACCGAAAGTGGATAAAATTTTTGGCCCCGGCAACGCCTTTGTAACCGAAGCCAAGCGTCAGGTCAGCCAACGCCTCGACGGCGCGGCTATCGATATGCCTGCCGGGCCGTCTGAAGTGCTGGTGATCGCCGACAGCGGCGCAACACCGGATTTCGTCGCGTCTGACCTGCTCTCCCAGGCAGAACACGGTCCGGATTCGCAGGTGATCCTGCTGACGCCTGATGCTCACATTGCCCGCAAGGTGGCGGAGGCGGTAGAACGTCAACTGGCGGAACTGCCGCGCGCGGACACCGCCCGGCAGGCCCTGAGCGCCAGTCGTCTGATTGTGACCAAAGATTTAGCGCAGTGCGTC\n->hisD_1903\n-ATTGCGGGATGCCAGAACGTGGTTCTGTGCTCGCCGCCGCCCATCGCTGATGAAATCCTCTATGCGGCGCAACTGTGTGGCGTGCAGGAAATCTTTAACGTCGGCGGCACGCAGGCGATTGCCGCTCTGGCCTTCGGCAGCGAGTCCGTACCGAAAGTGGATAAAATTTTTGGCCCCGGCAACGCCTTTGTAACCGAAGCCAAGCGTCAGGTCAGCCAACGCCTCGACGGCGCGGCTATCGATATGCCAGCCGGGCCGTCTGAAGTACTGGTGATCGCCGACAGCGGCGCAACACCGGATTTCGTCGCTTCTGACCTGCTCTCCCAGGCTGAGCACGGTCCGGATTCCCAGGTGATTCTGCTGACGCCTGATGCTGACATTGCCCGCAAGGTGGCGGAGGCGGTAGAACGTCAACTGGCGGAACTGCCGCGCGCGGACACCGCCCGGCAGGCCCTGAGCGCCAGTCGTCTGATTGTGACCAAAGATTTAGCGCAGTGCGTC\n->hisD_1904\n-ATTGCGGGATGTCAGAACGTGGTTCTGTGCTCGCCGCCGCCCATCGCTGATGAAATCCTCTATGCGGCGCAACTGTGTGGCGTGCGGGAAATCTTTAACGTCGGCGGCGCGCAGGCGATTGCCGCTCTGGCCTTCGGCAGCGAGTCCGTACCGAAAGTGGATAAAATTTTTGGCCCCGGCAACGCCTTTGTAACCGAAGCCAAGCGTCAGGTCAGCCAACGCCTCGACGGCGCGGCTATCGATATGCCTGCCGGGCCGTCTGAAGTGCTGGTGATCGCCGACAGCGGCGCAACACCGGATTTCGTCGCGTCTGACCTGCTCTCCCAAGCTGAGCACGGTCCGGATTCGCAGGTGATCCTGCTGACGCCGGATGCTGACATTGCCCGCAAGGTGGCGGAGGCGGTAGAACGTCAACTGGCGGAGCTGCCGCGCGCGGACACCGCCCGGCAGGCCCTGAGCGCCAGTCGTCTGATTGTGACCAAAGATTTAGCGCAGTGCGTC\n->hisD_1905\n-ATTGCGGGATGTCAGAACGTGGTTCTGTGCTCGCCGCCGCCCATCGCTGATGAAATCCTCTATGCGGCACAGCTATGTGGCGTGCAGGAAATCTTTAACGTCGGCGGCGCACAGGCGATTGCCGCTCTGGCCTTCGGCAGCGAATCCGTACCGAAAGTGGATAAAATTTTTGGCCCCGGCAATGCTTTTGTAACTGAAGCCAAGCGTCAGGTCAGTCAGCGTCTCGACGGCGTGGCTATCGATATGCCAGCCGGGCCGTCTGAAGTGCTGGTGATCGCCGACAGCGGCGCAACGCCGGACTTCGTCGCTTCTGACCTGCTCTCCCAGGCAGAACACGGCCCGGATTCCCAGGTGATCCTGCTGACGCCGGATGCTGACATCGCCCGCAGGGTGGCGGAGGCGGTAGAACGTCAACTGGCTGAACTGCCGCGCGCGGACACCGCCCGTCAGGCCCTGAGCGCCAGTCG
TCTGATTGTGACCAAAGATTTAGCGCAGTGCGTC\n'
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/seqsero2s_db/kmer/salmonella_profile.txt
--- a/SeqSero2S/seqsero2s_db/kmer/salmonella_profile.txt Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,9123 +0,0 @@\n-ST\taroC\tdnaN\themD\thisD\tpurE\tsucA\tthrA\n-1\t1\t1\t1\t1\t1\t1\t5\n-2\t1\t1\t2\t1\t1\t1\t5\n-3\t1\t1\t2\t1\t1\t1\t9\n-4\t43\t41\t16\t13\t34\t13\t4\n-5\t16\t43\t45\t43\t36\t39\t42\n-6\t4\t4\t4\t5\t4\t4\t8\n-7\t2\t2\t3\t2\t2\t2\t6\n-8\t1\t1\t2\t3\t1\t1\t5\n-9\t33\t26\t30\t55\t21\t87\t134\n-10\t5\t2\t3\t6\t5\t5\t10\n-11\t5\t2\t3\t7\t6\t6\t11\n-12\t6\t5\t6\t7\t5\t7\t12\n-13\t3\t3\t7\t4\t3\t3\t7\n-14\t7\t6\t8\t8\t7\t8\t13\n-15\t2\t7\t9\t9\t5\t9\t12\n-16\t6\t7\t10\t10\t8\t10\t14\n-17\t8\t8\t11\t11\t5\t11\t15\n-18\t9\t9\t6\t12\t9\t12\t2\n-19\t10\t7\t12\t9\t5\t9\t2\n-20\t11\t10\t13\t13\t10\t13\t4\n-21\t12\t2\t14\t14\t11\t14\t16\n-22\t12\t2\t15\t14\t11\t14\t16\n-23\t13\t11\t16\t15\t12\t15\t4\n-24\t13\t12\t17\t16\t13\t16\t4\n-25\t14\t13\t18\t12\t14\t17\t1\n-26\t14\t13\t18\t12\t14\t18\t1\n-27\t5\t14\t18\t9\t6\t12\t17\n-28\t15\t15\t19\t17\t5\t19\t18\n-29\t16\t16\t20\t18\t8\t12\t18\n-30\t10\t17\t21\t12\t15\t20\t18\n-31\t2\t2\t15\t14\t15\t20\t12\n-32\t17\t18\t22\t17\t5\t21\t19\n-33\t2\t5\t6\t7\t5\t7\t12\n-34\t10\t19\t12\t9\t5\t9\t2\n-35\t10\t7\t12\t9\t5\t9\t20\n-36\t18\t14\t12\t9\t5\t18\t21\n-37\t3\t3\t7\t19\t3\t3\t7\n-38\t2\t7\t10\t10\t8\t10\t14\n-39\t19\t20\t3\t20\t5\t2\t22\n-40\t19\t20\t3\t20\t5\t22\t22\n-41\t17\t18\t12\t17\t5\t21\t19\n-42\t20\t4\t23\t14\t16\t19\t18\n-43\t2\t14\t24\t14\t2\t19\t8\n-44\t9\t9\t6\t7\t9\t12\t2\n-45\t10\t7\t21\t14\t15\t12\t12\n-46\t10\t7\t21\t12\t15\t12\t12\n-47\t21\t11\t16\t15\t12\t15\t4\n-48\t22\t11\t25\t21\t10\t23\t23\n-49\t5\t14\t21\t9\t6\t12\t17\n-50\t5\t21\t18\t9\t6\t12\t17\n-51\t16\t16\t26\t18\t8\t12\t18\n-52\t23\t9\t15\t12\t17\t20\t12\n-53\t24\t22\t27\t22\t18\t24\t24\n-54\t25\t23\t27\t23\t19\t24\t25\n-55\t26\t24\t28\t24\t20\t25\t26\n-56\t27\t25\t29\t24\t20\t26\t27\n-57\t28\t26\t30\t25\t21\t27\t28\n-58\t29\t27\t30\t26\t21\t28\t28\n-59\t30\t28\t31\t27\t22\t29\t29\n-60\t31\t28\t32\t28\t23\t29\t30\n-61\t32\t29\t33\t29\t24\t30\t31\n-62\t32\t30\t34\t30\t24\t31\t32\n-63\t33\t26\t30\t26\t21\t32\t28\n-64\t10\t14\t15\t31\t25
\t20\t33\n-65\t11\t10\t13\t32\t10\t13\t4\n-66\t34\t31\t35\t14\t26\t6\t8\n-67\t35\t32\t36\t33\t27\t33\t3\n-68\t36\t31\t35\t14\t26\t34\t8\n-69\t37\t33\t37\t34\t6\t9\t34\n-70\t38\t34\t38\t35\t28\t35\t4\n-71\t39\t35\t8\t36\t29\t9\t36\n-72\t40\t36\t3\t37\t29\t9\t36\n-73\t5\t2\t3\t38\t5\t5\t10\n-74\t41\t4\t23\t14\t16\t19\t18\n-75\t14\t37\t39\t33\t30\t19\t37\n-76\t8\t38\t40\t12\t5\t9\t38\n-77\t10\t39\t41\t39\t5\t19\t39\n-78\t5\t2\t42\t7\t31\t6\t11\n-79\t11\t11\t17\t40\t32\t9\t40\n-80\t42\t40\t17\t41\t33\t36\t41\n-81\t43\t41\t16\t42\t35\t13\t4\n-82\t41\t42\t43\t12\t9\t12\t2\n-83\t41\t9\t21\t12\t8\t37\t17\n-84\t44\t14\t44\t14\t15\t38\t17\n-85\t45\t4\t8\t44\t27\t9\t8\n-86\t2\t14\t24\t14\t37\t19\t8\n-88\t46\t44\t46\t46\t38\t18\t34\n-89\t47\t45\t47\t47\t39\t9\t43\n-90\t48\t31\t35\t14\t26\t40\t44\n-91\t49\t11\t25\t15\t12\t15\t4\n-92\t5\t2\t3\t7\t31\t41\t11\n-93\t50\t10\t25\t13\t10\t13\t4\n-94\t42\t46\t48\t48\t40\t35\t4\n-95\t3\t36\t43\t38\t16\t42\t38\n-96\t43\t47\t49\t49\t41\t15\t3\n-97\t51\t48\t43\t50\t42\t43\t45\n-98\t10\t7\t50\t9\t5\t9\t2\n-99\t10\t7\t12\t9\t5\t9\t46\n-101\t52\t3\t40\t51\t44\t45\t3\n-102\t53\t49\t51\t52\t45\t46\t48\n-103\t54\t50\t27\t53\t46\t47\t49\n-104\t55\t51\t52\t54\t47\t48\t50\n-105\t33\t26\t30\t55\t21\t49\t28\n-106\t56\t25\t29\t56\t48\t50\t51\n-107\t57\t52\t31\t57\t22\t29\t30\n-108\t58\t29\t53\t29\t24\t30\t52\n-110\t2\t2\t24\t14\t2\t19\t8\n-111\t41\t42\t43\t12\t9\t12\t53\n-112\t41\t42\t43\t58\t9\t12\t2\n-113\t9\t9\t6\t59\t9\t12\t2\n-114\t48\t31\t35\t14\t26\t52\t8\n-115\t16\t2\t45\t43\t36\t12\t42\n-116\t10\t7\t21\t14\t15\t39\t12\n-117\t16\t2\t45\t43\t15\t12\t42\n-118\t16\t2\t45\t43\t36\t39\t42\n-119\t16\t2\t18\t43\t36\t12\t42\n-120\t16\t2\t40\t43\t36\t39\t42\n-121\t10\t7\t21\t14\t36\t12\t12\n-122\t16\t2\t45\t43\t15\t39\t42\n-123\t10\t2\t21\t43\t36\t12\t42\n-125\t10\t7\t21\t14\t15\t53\t12\n-126\t11\t10\t25\t13\t10\t35\t4\n-127\t46\t54\t46\t46\t38\t18\t34\n-128\t10\t7\t12\t9\t5\t55\t2\n-129\t45\t4\t8\t44\t27\t56\t8\n-130\t45\t4\t8\t44\t50\t9\t8\n-131\t10\t
56\t21\t14\t15\t12\t12\n-132\t2\t57\t15\t14\t15\t20\t12\n-133\t36\t31\t35\t14\t26\t6\t55\n-134\t45\t4\t8\t44\t53\t9\t8\n-135\t46\t55\t23\t14\t16\t54\t56\n-136\t5\t2\t3\t61\t6\t6\t11\n-137\t10\t7\t12\t9\t5\t57\t2\n-138\t11\t41\t55\t42\t34\t58\t4\n-139\t36\t31\t57\t14\t26\t34\t8\n-140\t13\t11\t17\t16\t13\t60\t4\n-141\t59\t58\t56\t62\t51\t59\t16\n-142\t2\t59\t23\t64\t38\t61\t12\n-143\t60\t12\t17\t63\t13\t16\t4\n-145\t36\t31\t35\t14\t26\t6\t8\n-146\t48\t31\t35\t14\t26\t40\t8\n-147\t48\t31\t35\t14\t26\t44\t47\n-148\t2\t59\t23\t64\t38\t62\t12\n-149\t2\t14\t24\t14\t49\t19\t8\n-150\t61\t12\t10\t65\t54\t63\t57\n-151\t62\t53\t54\t60\t5\t64\t54\n-152\t62\t53\t54\t60\t5\t53\t54\n-155\t10\t60\t58\t66\t6\t65\t16\n-156\t63\t14\t6\t12\t5\t14\t58\n-157\t10\t61\t21\t12\t15\t12\t12\n-158\t10\t62\t21\t67\t15\t12\t12\n-159\t10\t7\t12\t9\t5\t66\t2\n-160\t65\t25\t29\t69\t48\t26\t60\n-161\t33\t26\t30\t55\t56\t68\t61\n-162\t30\t28\t31\t57\t57\t69\t30\n-163\t16\t2\t60\t43\t36\t39\t42\n-164\t16\t2\t45\t70\t36\t39\t42\n-165\t10\t7\t21\t14\t58\t12\t12\n-166\t5\t14\t6\t12\t5\t14\t58\n-167\t16\t2\t61\t71\t36\t39\t42\n-168\t66\t2\t3\t7\t6\t6\t11\n-169\t50\t63\t25\t72\t59\t71\t62\n-170\t41\t42\t62\t58\t9\t12\t2\n-171\t67\t10\t17\t73\t9\t9\t4\n-172\t68\t2\t3\t7\t5\t6\t10\n-173\t69\t42\t43\t58\t9\t12\t2\n-174\t50\t63\t25\t72\t59\t71\t63\n-175\t13\t12\t63\t16\t13\t7'..b'\n-10466\t5\t2\t3\t7\t6\t6\t1606\n-10467\t5\t2\t3\t7\t1537\t6\t11\n-10470\t40\t194\t748\t36\t29\t8\t832\n-10471\t2\t4\t40\t43\t481\t2\t1608\n-10472\t16\t16\t20\t18\t1540\t12\t18\n-10474\t336\t118\t3\t196\t27\t128\t8\n-10475\t84\t1317\t38\t16\t12\t13\t4\n-10476\t33\t26\t30\t282\t229\t1135\t28\n-10477\t14\t865\t786\t38\t1541\t128\t579\n-10478\t10\t4\t3\t38\t4\t128\t8\n-10479\t483\t28\t31\t151\t57\t29\t81\n-10480\t313\t86\t97\t358\t76\t427\t1609\n-10481\t5\t2\t3\t7\t1542\t6\t11\n-10482\t14\t4\t4\t130\t529\t128\t8\n-10483\t1110\t28\t1264\t151\t22\t29\t30\n-10484\t11\t10\t25\t13\t10\t1404\t4\n-10485\t30\t1318\t31\t151\t22\t29\t300\n-10486\t
140\t105\t85\t93\t14\t10\t1610\n-10487\t561\t118\t3\t130\t4\t1405\t579\n-10488\t273\t176\t27\t22\t85\t24\t91\n-10489\t111\t47\t49\t16\t41\t15\t586\n-10490\t13\t140\t25\t526\t12\t13\t1611\n-10491\t99\t1319\t58\t11\t111\t9\t2\n-10492\t11\t83\t25\t1895\t1543\t35\t4\n-10493\t92\t1320\t7\t1868\t2\t113\t419\n-10494\t3\t1321\t7\t4\t3\t3\t7\n-10495\t7\t4\t8\t1240\t1206\t109\t210\n-10496\t805\t130\t40\t94\t346\t9\t95\n-10497\t289\t26\t30\t282\t21\t1406\t28\n-10498\t15\t70\t93\t78\t1544\t6\t68\n-10499\t137\t435\t8\t196\t526\t1407\t102\n-10500\t5\t2\t3\t7\t1545\t6\t11\n-10501\t43\t47\t1265\t16\t41\t15\t3\n-10502\t92\t107\t79\t156\t1547\t151\t87\n-10503\t76\t14\t3\t77\t1548\t64\t67\n-10504\t815\t10\t18\t1896\t6\t146\t1612\n-10505\t104\t7\t54\t78\t104\t9\t128\n-10506\t62\t442\t40\t20\t88\t117\t2\n-10507\t10\t1322\t12\t9\t5\t9\t2\n-10508\t72\t531\t49\t72\t33\t1189\t596\n-10509\t10\t7\t12\t9\t5\t500\t46\n-10513\t1561\t439\t350\t163\t84\t19\t124\n-10514\t189\t70\t68\t132\t175\t51\t172\n-10515\t101\t97\t78\t125\t84\t90\t192\n-10516\t438\t32\t323\t183\t139\t53\t41\n-10517\t33\t26\t1236\t26\t21\t32\t457\n-10518\t86\t176\t27\t22\t18\t24\t174\n-10519\t1562\t25\t28\t1897\t263\t26\t27\n-10520\t1265\t26\t514\t282\t131\t229\t28\n-10521\t255\t229\t30\t55\t21\t229\t658\n-10522\t25\t77\t27\t22\t250\t407\t169\n-10523\t296\t26\t30\t213\t21\t27\t264\n-10524\t33\t26\t30\t55\t229\t145\t134\n-10525\t33\t26\t30\t26\t283\t87\t132\n-10526\t382\t26\t30\t144\t283\t353\t625\n-10527\t29\t26\t30\t84\t21\t145\t28\n-10528\t33\t26\t30\t26\t229\t87\t28\n-10530\t1563\t1245\t25\t1898\t1551\t19\t4\n-10531\t65\t78\t28\t211\t48\t26\t51\n-10532\t262\t78\t29\t82\t129\t1408\t51\n-10533\t1564\t24\t28\t1899\t237\t26\t131\n-10534\t5\t2\t3\t7\t1552\t6\t11\n-10535\t14\t118\t3\t1318\t4\t128\t8\n-10536\t14\t118\t3\t1318\t27\t128\t8\n-10537\t84\t76\t38\t16\t1553\t13\t4\n-10538\t88\t26\t30\t26\t21\t87\t80\n-10539\t15\t70\t93\t78\t113\t1409\t68\n-10540\t25\t82\t27\t23\t18\t643\t25\n-10541\t1565\t26\t30\t87\t21\t87\t80\n-10542\t7
5\t14\t224\t545\t1554\t2\t314\n-10544\t10\t7\t1268\t9\t5\t9\t2\n-10545\t17\t18\t22\t17\t5\t21\t1613\n-10546\t229\t1323\t269\t341\t18\t85\t236\n-10547\t17\t347\t1255\t122\t1555\t109\t1614\n-10548\t16\t2\t45\t43\t36\t39\t1615\n-10549\t10\t19\t1269\t9\t5\t9\t2\n-10550\t1567\t384\t38\t16\t33\t35\t410\n-10551\t1044\t377\t168\t16\t248\t1410\t1616\n-10552\t45\t1091\t17\t384\t12\t179\t63\n-10553\t43\t41\t16\t85\t40\t58\t4\n-10554\t2\t4\t15\t1272\t8\t12\t303\n-10555\t1265\t1324\t30\t282\t21\t145\t28\n-10556\t5\t21\t18\t9\t6\t1411\t17\n-10557\t11\t1325\t55\t42\t34\t58\t4\n-10558\t84\t334\t123\t676\t76\t9\t161\n-10559\t417\t14\t79\t195\t3\t404\t2\n-10560\t372\t361\t10\t236\t8\t9\t22\n-10561\t1568\t73\t10\t130\t2\t112\t38\n-10562\t2\t188\t98\t205\t76\t2\t14\n-10563\t14\t419\t8\t20\t2\t405\t452\n-10564\t33\t26\t1270\t282\t21\t87\t28\n-10565\t30\t28\t31\t1371\t22\t29\t30\n-10566\t5\t1326\t18\t9\t6\t12\t17\n-10567\t2\t2\t9\t1900\t105\t19\t86\n-10568\t10\t7\t21\t12\t15\t1412\t12\n-10569\t5\t2\t3\t7\t1556\t6\t11\n-10570\t5\t2\t3\t7\t6\t6\t1617\n-10571\t5\t2\t3\t7\t1557\t6\t11\n-10572\t5\t2\t3\t7\t1558\t6\t11\n-10573\t5\t2\t3\t7\t1559\t6\t11\n-10574\t5\t2\t3\t7\t1560\t6\t11\n-10579\t1569\t4\t4\t130\t438\t1303\t1023\n-10580\t561\t118\t3\t196\t4\t128\t8\n-10581\t2\t1328\t45\t1660\t36\t12\t588\n-10582\t81\t5\t101\t12\t1562\t130\t17\n-10584\t10\t7\t1271\t9\t5\t9\t2\n-10585\t373\t356\t15\t467\t76\t9\t139\n-10586\t543\t498\t85\t11\t1563\t388\t506\n-10587\t92\t278\t16\t1902\t27\t427\t560\n-10588\t10\t19\t12\t9\t5\t9\t406\n-10589\t127\t90\t40\t1903\t150\t199\t95\n-10590\t5\t2\t3\t7\t1564\t6\t11\n-10591\t5\t2\t3\t7\t1565\t6\t11\n-10592\t5\t2\t3\t7\t1566\t6\t11\n-10593\t25\t77\t27\t22\t18\t24\t1618\n-10594\t11\t1329\t25\t13\t10\t35\t4\n-10597\t175\t169\t47\t402\t184\t9\t22\n-10598\t1571\t1330\t1272\t1904\t76\t9\t1621\n-10599\t1572\t295\t10\t100\t38\t9\t303\n-10600\t1568\t1331\t10\t130\t2\t112\t38\n-10601\t376\t288\t1273\t275\t566\t295\t1427\n-10603\t5\t1333\t87\t103\t29\t108\t102\n-10604\t1573
\t1334\t8\t204\t179\t1415\t307\n-10605\t95\t77\t27\t1905\t277\t24\t25\n-10606\t124\t115\t10\t162\t1458\t470\t1136\n-10607\t1\t1\t1\t1\t1\t1\t1623\n-10608\t863\t15\t1275\t1103\t36\t2\t936\n-10609\t84\t76\t38\t16\t1568\t13\t4\n-10610\t16\t16\t20\t18\t8\t1416\t18\n-10611\t52\t519\t54\t402\t1569\t35\t102\n-10612\t17\t14\t8\t796\t1570\t611\t428\n-10613\t5\t1132\t40\t115\t2\t75\t322\n-10614\t41\t73\t102\t4\t95\t1417\t1624\n'
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/seqsero2s_db/kmer/salmonella_purE.tfa
--- a/SeqSero2S/seqsero2s_db/kmer/salmonella_purE.tfa Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,2708 +0,0 @@\n->purE_1\n-AGCGACTGGGCTACCATGCAATTCGCCGCCGAAATTTTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCCCATCGCACCCCCGATAAACTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCGGCACACCTGCCGGGAATGATTGCGGCAAAAACGCTGGTCCCGGTACTCGGCGTGCCGGTACAAAGCGCTGCGCTCAGCGGCGTGGATAGCCTCTACTCCATCGTGCAGATGCCGCGCGGCATTCCGGTGGGTACGCTGGCGATCGGTAAAGCCGGGGCGGCGAACGCCGCACTGCTGGCAGCGCAAATTTTGGCTACGCATGATAGCGCGCTGCATCGGCGCATCGCCGAC\n->purE_2\n-AGCGACTGGGCTACCATGCAATTCGCCGCCGAAATTTTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCCCATCGCACCCCCGATAAACTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCGGCGCACCTGCCGGGAATGATTGCGGCAAAAACGCTGGTCCCGGTACTCGGCGTGCCGGTACAAAGCGCTGCGCTCAGCGGCGTGGATAGCCTCTACTCCATCGTGCAGATGCCGCGCGGCATTCCGGTGGGTACGCTGGCGATCGGTAAAGCCGGTGCCGCTAACGCCGCCCTGCTCGCCGCGCAGATTCTGGCGCAACACGACGCGGAACTGCATCAGCGCATCGCTGAC\n->purE_3\n-AGCGACTGGGCTACCATGCAATTCGCCGCCGAAATTTTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCCCATCGCACCCCCGATAAACTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCGGCGCACCTGCCGGGAATGATTGCGGCAAAAACGCTGGTCCCGGTACTCGGCGTGCCGGTACAAAGCGCTGCGCTCAGCGGCGTGGATAGCCTCTACTCCATCGTGCAGATGCCGCGCGGCATTCCGGTGGGTACACTGGCGATCGGTAAAGCCGGTGCCGCTAACGCCGCCCTGCTCGCCGCACAGATTCTGGCGCAACACGACGCGGAACTGCATCAGCGCATCGCCGAC\n->purE_4\n-AGCGACTGGGCTACCATGCAATTCGCCGCCGAAATTTTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCTCATCGCACCCCCGATAAGCTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCGGCGCACCTGCCGGGAATGATTGCGGCAAAAACGCTGGTCCCGGTACTCGGCGTGCCGGTACAAAGCGCTGCGCTAAGCGGCGTGGATAGCCTCTACTCCATCGTGCAGATGCCGCGCGGCATTCCGGTGGGTACGCTGGCGATCGGTAAAGCCGGTGCCGCTAACGCCGCCCTGCTCGCCGCGCAGATTCTGGCGCAACACGACGCGGAACTGCATCAGCGCATCGCTGAC\n->purE_5\n-AGCGACTGGGCTACCATGCAATTCGCCGCCGAAATTTTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCTCATCGCACCCCCGATAAACTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCGGCGCACCTGCCGGGAATGATTGCGGCAAAAACGCTGGTCCCGGTACTCGGCGTGCCGGTACAAAGCGCTGCGCTAAGCGGCGTGGATAGCCTCTACTCCATCGTGCAGATGCCGCGCGGCATTCCGGTGGGTACGCTGGCGATCGGTAAAG
CCGGTGCCGCTAACGCCGCCCTGCTCGCCGCGCAGATTCTGGCGCAACACGACGCGGAACTGCATCAGCGCATTGCCGAC\n->purE_6\n-AGCGACTGGGCTACCATGCAATTCGCCGCCGAAATTTTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCCCATCGCACCCCCGATAAACTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCGGCGCACCTGCCGGGAATGATTGCGGCAAAAACGCTGGTCCCGGTACTCGGCGTGCCGGTACAAAGCGCTGCGCTAAGCGGCGTGGATAGCCTCTACTCCATTGTGCAGATGCCGCGCGGCATTCCGGTGGGTACGCTGGCGATCGGTAAAGCCGGTGCCGCTAACGCCGCCCTGCTCGCCGCGCAGATTCTGGCGCAACACGACGCGGAACTGCATCAGCGCATTGCCGAC\n->purE_7\n-AGCGACTGGGCTACCATGCAATTCGCCGCCGAAATTTTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCCCATCGCACCCCCGATAAACTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCGGCGCACCTGCCGGGAATGATTGCGGCAAAAACGCTGGTCCCGGTACTCGGCGTGCCGGTACAAAGCGCTGCGCTCAGCGGCGTGGATAGCCTTTACTCCATCGTGCAGATGCCGCGCGGCATTCCGGTGGGTACGCTGGCGATCGGTAAAGCCGGTGCCGCTAACGCCGCCCTGCTCGCCGCGCAGATTCTGGCGCAACACGACGCGGAACTGCATCAGCGCATTGCCGAC\n->purE_8\n-AGCGACTGGGCTACCATGCAATTCGCCGCCGAAATTTTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCCCATCGCACCCCCGATAAACTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCGGCGCACCTGCCGGGAATGATTGCGGCAAAAACGCTGGTCCCGGTACTCGGCGTGCCGGTACAAAGCGCTGCGCTAAGCGGCGTGGATAGCCTCTACTCCATCGTGCAGATGCCGCGCGGCATTCCGGTGGGTACGCTGGCGATCGGTAAAGCCGGTGCCGCTAACGCCGCCCTGCTCGCCGCGCAGATTCTGGCGCAACACGACGCGGAACTGCATCAGCGCATTGCCGAC\n->purE_9\n-AGCGACTGGGCTACCATGCAATTCGCCGCCGAAATTTTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCTCATCGCACCCCCGATAAGCTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCGGCGCACCTGCCGGGAATGATTGCGGCAAAAACGCTGGTCCCGGTACTCGGCGTGCCGGTACAAAGCGCTGCGCTAAGCGGCGTGGATAGCCTTTACTCCATTGTGCAGATGCCGCGCGGCATTCCGGTGGGTACACTGGCGATCGGTAAAGCCGGTGCCGCTAACGCCGCCCTGCTCGCCGCGCAGATTCTGGCGCAACACGACGCGGAACTGCATCAGCGCATCGCTGAC\n->purE_10\n-AGCGACTGGGCTACCATGCAATTCGCCGCCGAAATTTTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCCCATCGCACCCCCGATAAGCTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCGGCACATCTGCCGGGAATGATTGCGGCAAAAACGCTGGTCCCGGTACTCGGCGTACCGGTACAAAGCGCTGCGCTAAGCGGTGTGGATAGC
CTCTACTCCATCGTGCAGATG'..b'TCGCACCCCCGATAAACTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCGGCGCACCTGCCGGGAATGATTGCGGCAAAAACGCTGGTCCCGGTACTCGGCGTGCCGGTACAAAGCGCTGCGCTAAGCGGCGTGGATAGCCTCTACTCCATTGTGCAGATGCCGCGCGGCATTCCGGTGGGTACGCTGGCGATCGGTAAAGCCGGTGCCGCTAACGCCGCCCTGCTCGCCGCGCAGATTCTGGCGCAACACGACGCGGAACTGCATCAGCGCATTGCCGAC\n->purE_1560\n-AGCGACTGGGCTACCATGCAATTCGCCGCCGAAATTTTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCCCATCGCACCCCCCGATAAACTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCGGCGCACCTGCCGGGAATGATTGCGGCAAAAACGCTGGTCCCGGTACTCGGCGTGCCGGTACAAAGCGCTGCGCTAAGCGGCGTGGATAGCCTCTACTCCATTGTGCAGATGCCGCGCGGCATTCCGGTGGGTACGCTGGCGATCGGTAAAGCCGGTGCCGCTAACGCCGCCCTGCTCGCCGCGCAGATTCTGGCGCAACACGACGCGGAACTGCATCAGCGCATTGCCGAC\n->purE_1562\n-AGCGACTGGGCTACCATGCAATTCGCCGCCGAAATTTTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCTCATCGCACCCCCGATAAGCTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCGGCGCACCTGCCGGGAATGATTGCGGCAAAAACGCTGGTGCCGGTACAAAGCGCTGCGCTCAGCGGCGTGGATAGCCTCTACTCCATCGTGCAGATGCCGCGCGGCATTCCGGTGGGTACGCTGGCGATCGGTAAAGCCGGGGCGGCGAACGCCGCACTGCTGGCAGCGCAAATTTTGGCTACGCATGATAGCGCGCTGCATCGGCGCATCGCCGAC\n->purE_1563\n-AGCGACTGGGCTACCATGCAATTCGCCGCCGAAATTTTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCCCATCGCACCCCCGATAAACTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCGGCGCACCTGCCGGGAATGATTGCGGCAAAAACGCTGGTCCCGGTACTCGGCGTGCCGGTACAAAGCGCTGCGCTAAGCGGCGTGGATAGCCTCTACTCCATCGTGCAGATGCCGCGCGGCATTCCAGTGGGTACGCTGGCGATCGGCAAAGCCGGTGCCGCGAACGCCGCCCTGCTCGCCGCGCAGATTCTGGCGCAACACGACGCGGAACTGCATCAGCGCATCGCCGAC\n->purE_1564\n-AGCGACTGGGCTACCATGCAATTCGCCGCCGAAATTTTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCCCATCGCACCCCCGATAAACTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCGGCGCACCTGCCGGGAATGATTGCGGCAAAAACGCTGGTCCCGGTACTCGGCGTGCCGGTACAAAGCGCTGCGCTAAGCGGCGTGGATAGCCTCTACTCCATTGTGCAGATGCCGCGCGGCATTCCGGTGGGTACGCAAGCCGGTGCCGCTAACGCCGCCCTGCTCGCCGCGCAGATTCTGGCGCAACACGACGCGGAACTGCATCAGCGCATTGCCGAC\n->purE_1565\n-AGCGACTG
GGCTACCATGCAATTCGCCGCCGAAATTTTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCCCATCGCACCCCCGATAAACTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCACCTGCCGGGAATGATTGCGGCAAAAACGCTGGTCCCGGTACTCGGCGTGCCGGTACAAAGCGCTGCGCTAAGCGGCGTGGATAGCCTCTACTCCATTGTGCAGATGCCGCGCGGCATTCCGGTGGGTACGCTGGCGATCGGTAAAGCCGGTGCCGCTAACGCCGCCCTGCTCGCCGCGCAGATTCTGGCGCAACACGACGCGGAACTGCATCAGCGCATTGCCGAC\n->purE_1566\n-AGCGACTGGGCTACCATGCAATTCGCCGCCGAAATTTTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCCCATCGCACCCCCGATAAACTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCGGCGCACCTGCCGGGAATGATTGCGGCAAAAACGCTGGTCCCGGTACTCGGCGTGCCGGTACAAAGCGCTGCGCTAAGCGGCGTGGATAGCCTCTACTCCATTGTGCAGATGCCGCGCGGCATTCCGGTACGCTGGCGATCGGTAAAGCCGGTGCCGCTAACGCCGCCCTGCTCGCCGCGCAGATTCTGGCGCAACACGACGCGGAACTGCATCAGCGCATTGCCGAC\n->purE_1568\n-AGCGACTGGGCTACCATGCAATTCGCCGCCGAAATTCTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCTCATCGCACCCCCGATAAGCTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCGGCGCACCTGCCGGGAATGATTGCGGCAAAAACGCTGGTCCCGGTACTCGGCGTGCCGGTACAAAGCGCTGCGCTAAGCGGCGTGGATAGCCTTTACTCCATTGTGCAGATGCCGCGCGGCATTCCGGTGGGTACGCTGGCGATCGGTAAAGCCGGTGCCGCTAACGCCGCCCTGCTCGCCGCGCAGATTCTGGCGCAACACGACGCGGAACTGCATCAGCGCATCGCTGAC\n->purE_1569\n-AGCGACTGGGCTACCATGCAATTCGCCGCCGAAATTTTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCCCATCGCACCCCCGATAAGCTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGCGCGGGCGGCGCGGCACACCTGCCGGGAATGATTGCGGCAAAAACTCTGGTCCCGGTACTCGGCGTACCGGTACAAAGCGCTGCGCTAAGCGGTGTGGATAGCCTCTACTCCATCGTGCAGATGCCGCGCGGCATTCCGGTGGGTACGCTGGCGATCGGTAAAGCCGGTGCCGCTAACGCCGCACTGCTGGCAGCGCAGATTCTGGCGCAACACGACGCGGAACTGCATCAGCGCATTGCCGAC\n->purE_1570\n-AGCGACTGGGCTACCATGCAATTCGCCGCCGAAATTTTTGAAATTCTGGATGTCCCGCACCATGTAGAAGTGGTTTCCGCCCATCGCACCCCCGATAAACTGTTCAGCTTCGCCGAAACGGCGGAAGAGAACGGATATCAAGTGATTATTGCCGGGGCGGGCGGCGCGGCACACCTGCCGGGAATGATTGCGGCAAAAACGCTGGTCCCGGTACTCGGCGTGCCGGTACAAAGCGCTGCGCTAAGCGGCGTGGATAGCCTCTACTCCATCGTGCAGATGCCGCGCGGCATTCCGGTGGGTACGCTGGCGATCGGTAAAGCCGGTGCCGCTAACGCCGCCCTGCTCGCCGCGCAGATT
CTGGCGCAACACGACGCGGAACTGCATCAGCGCATCGCTGAC\n'
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/seqsero2s_db/kmer/salmonella_sucA.tfa
--- a/SeqSero2S/seqsero2s_db/kmer/salmonella_sucA.tfa Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,2532 +0,0 @@\n->sucA_1\n-AAACGCTTCCTGAACGAACTGACCGCCGCTGAAGGGCTGGAACGTTATCTGGGCGCCAAATTCCCGGGTGCGAAACGTTTCTCGCTCGAGGGGGGAGATGCGCTGATACCTATGCTGAAAGAGATGGTTCGCCATGCGGGTAACAGCGGCACTCGCGAAGTGGTGCTGGGGATGGCGCACCGCGGTCGTCTGAACGTGCTGATCAACGTACTGGGTAAAAAACCGCAGGATCTGTTCGACGAGTTTGCCGGTAAACATAAAGAACATCTGGGTACCGGCGACGTGAAGTATCACATGGGCTTCTCGTCAGATATCGAAACTGAAGGCGGTCTGGTTCACCTGGCGCTGGCGTTTAACCCATCGCATCTGGAAATTGTGAGCCCGGTGGTGATGGGCTCCGTGCGCGCCCGTCTGGACCGACTGGACGAACCGAGCAGTAATAAAGTGCTGCCGATCACTATTCACGGCGACGCCGCGGTGACCGGCCAGGGCGTGGTTCAG\n->sucA_2\n-AAACGCTTCCTGAACGAACTGACCGCCGCTGAAGGGCTGGAACGTTATCTGGGCGCCAAATTCCCGGGTGCGAAACGTTTCTCGCTTGAGGGGGGAGATGCGCTGATACCCATGCTGAAAGAGATGGTTCGCCATGCGGGTAACAGCGGCACTCGCGAAGTGGTGCTGGGGATGGCGCACCGCGGTCGCCTGAACGTGCTGATCAACGTACTGGGTAAAAAACCGCAGGATCTGTTCGACGAATTTGCCGGTAAGCATAAAGAACATCTGGGTACCGGCGACGTGAAGTATCACATGGGCTTCTCGTCAGATATCGAAACCGAAGGCGGTCTGGTTCACCTGGCGCTGGCGTTTAACCCATCGCATCTGGAAATTGTGAGCCCGGTGGTGATGGGCTCCGTGCGCGCCCGTCTGGACAGACTGGACGAACCGAGCAGCAACAAAGTGCTGCCGATCACTATTCACGGCGACGCCGCGGTGACCGGCCAGGGCGTGGTTCAG\n->sucA_3\n-AAACGTTTCCTGAACGAACTGACCGCCGCTGAAGGGCTGGAACGTTATCTGGGCGCCAAATTCCCGGGTGCGAAACGTTTCTCGCTCGAGGGGGGAGATGCGCTGATACCCATGCTGAAAGAGATGGTTCGCCATGCGGGTAACAGCGGCACTCGCGAAGTGGTGCTGGGGATGGCGCACCGCGGTCGCCTGAACGTGCTGATCAACGTACTGGGTAAAAAACCGCAGGATCTGTTCGACGAATTTGCCGGTAAGCATAAAGAACATCTGGGTACCGGCGACGTGAAGTATCACATGGGCTTCTCGTCAGATATCGAAACCGAAGGCGGTCTGGTTCACCTGGCGCTGGCGTTTAACCCATCGCATCTGGAAATTGTGAGCCCGGTGGTGATGGGCTCCGTGCGCGCCCGTCTGGACAGACTGGACGAACCGAGCAGCAACAAAGTGTTGCCGATTACTATTCACGGCGACGCCGCGGTGACCGGCCAGGGCGTGGTTCAG\n->sucA_4\n-AAACGCTTCCTGAACGAACTGACCGCCGCTGAAGGGCTGGAACGTTATCTGGGCGCCAAATTCCCGGGTGCGAAACGTTTCTCGCTTGAGGGGGGAGATGCGCTGATACCCATGCTGAAAGAGATGGTTCGCCATGCGGGTAACAGCGGCACTCGCGAAGTGGTGCTGGGGATGGCGCACCGCGGTCGCCTGAACGTGCTGATCAACGTACTGGGTAAAAAACCGCAGGATCTGTTCGACGAATTTGCCGGTAAGCATAAAGAACATCTGGGTACTGGCGACGTGAAGTATCACATGGGCTTCTCGTCAGATATCGAAACCGAAGGCGGTCTGGTTCACCTGGCGCTGGCGTTTAACCCATCGCACCTGGAAATTGTGAGCCCGGTGGTGATGGGCTCCGTGCGTGCCCGTCTGGACCGACTGGA
CGAACCGAGCAGCAACAAAGTGTTGCCGATTACCATTCACGGCGACGCCGCGGTGACCGGCCAGGGCGTGGTTCAG\n->sucA_5\n-AAACGTTTCCTGAACGAACTGACCGCCGCTGAAGGGCTGGAACGTTATCTGGGTGCCAAATTCCCGGGTGCGAAACGTTTCTCGCTTGAGGGGGGAGATGCGCTGATACCCATGCTGAAAGAGATGGTTCGCCATGCGGGTAACAGCGGAACTCGCGAAGTGGTGCTGGGGATGGCGCACCGCGGTCGCCTGAACGTGCTGATCAACGTACTGGGTAAAAAACCGCAGGATCTGTTCGACGAGTTTGCCGGTAAACATAAAGAACATCTGGGTACCGGCGACGTGAAGTATCACATGGGCTTCTCGTCAGATATCGAAACCGAAGGCGGTCTGGTTCACCTGGCGCTGGCGTTTAACCCATCGCACCTGGAAATTGTGAGCCCGGTGGTGATGGGCTCCGTGCGTGCCCGTCTGGACCGACTGGACGAACCGAGCAGCAACAAAGTGTTGCCGATCACTATTCACGGCGACGCCGCGGTGACCGGCCAGGGCGTGGTTCAG\n->sucA_6\n-AAACGCTTCCTGAACGAACTGACCGCCGCTGAAGGGCTGGAACGTTATCTGGGTGCCAAATTCCCGGGTGCGAAACGTTTCTCGCTCGAGGGGGGAGATGCGCTGATACCCATGCTGAAAGAGATGGTTCGCCATGCGGGTAACAGCGGCACTCGCGAAGTGGTGCTGGGGATGGCGCACCGCGGTCGCCTGAACGTGCTGATCAACGTACTGGGTAAAAAACCGCAGGATCTGTTCGACGAATTTGCCGGTAAGCATAAAGAACATCTGGGTACCGGCGACGTGAAGTATCACATGGGCTTCTCGTCAGATATCGAAACCGAAGGCGGTCTGGTTCACCTGGCGCTGGCGTTTAACCCATCGCATCTGGAAATTGTGAGCCCGGTGGTGATGGGCTCCGTGCGCGCCCGTCTGGACAGACTGGACGAACCGAGCAGCAACAAAGTGTTGCCGATCACTATTCACGGCGACGCCGCGGTGACCGGCCAGGGCGTGGTTCAG\n->sucA_7\n-AAACGCTTCCTGAACGAACTGACCGCCGCTGAAGGGCTGGAACGTTATCTGGGCGCCAAATTCCCGGGTGCGAAACGTTTCTCGCTTGAGGGGGGAGATGCGCTGATACCCATGCTGAAAGAGATGGTTCGCCATGCGGGTAACAGCGGCACTCGCGAAGTGGTGCTGGGGATGGCGCACCGCGGTCGCCTGAACGTGCTGATCAACGTACTGGGTAAAAAACCGCAGGATCTGTTCGACGAATTTGCCGGTAAGCATAAAGAACATCTGGGTACCGGCGACGTGAAGTATCACATGGGCTTCTCGTCAGATATCGAAACCGAAGGCGGTCTGGTTCACCTGGCGCTGGCGTTTAACCCATCGCATCTGGAAATTGTGAGCCCGGTGGTGATGGGCTCCGTGCGCGCCCGTCTGGACAGACTGGACGAACCGAGCAGCAACAAAGTGTTGCCGATCACTATTCACGGCGACGCCGCGGTGACCGGCCAGGGCGTGGTTCAG\n->sucA_8\n-AAACGCTTCCTGAACGAACTGACCGCCGCTGAAGGGCTGGAACGTTATCTGGGTGCCAAATTCCCCGGTGCGAAACGTTTCTCGCTCGAGGGGGGAGATGCGCTGATACCCATGCTGAAAGAGATGGTTCGCCATGCGGGTAACAGCGGCACTCGCGAAGTGGTGCTGGGGATGGCGCACCGTGGTCGCCTGAACGTGCTGATCAACGTACTGGGTAAAAAACCGCAGGATCTGTTCGACGAATTTGCCGGTAAGCATAAAGAACATCTGGGTACTGGCGACGTGAAGTATCACATGGGCTTCTCGTCAGATATCGAAACCGAAGGCGGTCTGGTTCACCTGGCGCTGGCGTTTAACCCATCGCATCTG
GAAATTGTGAGCCCGGT'..b'CCGATGCTGAAAGAGATGGTTCGCCATGCGGGTAATAGCGGCACTCGCGAAGTGGTGCTGGGTATGGCGCACCGCGGTCGCCTGAACGTACTGATCAACGTACTGGGTAAAAAACCGCAGGATCTGTTCGACGAGTTTGCCGGTAAGCATAAAGAACATCTTGGCACCGGCGATGTGAAGTACCACATGGGCTTCTCGTCAGATATCGAAACGGAAGGCGGTCTGGTTCACCTGGCGCTGGCGTTTAACCCATCGCACCTGGAAATCGTGAGCCCGGTGGTGATGGGATCTGTGCGTGCGCGTTTGGATAGACTGGACGAACCGAGCAGCAACAAAGTGCTACCCATCACCATTCATGGCGATGCGGCAGTCACCGGCCAGGGCGTGGTTCAG\n->sucA_1409\n-AAACGCTTCCTGAACGAACTGACCGCCGCTGAAGGGCTGGAACGTTATCTGGGTGCCAAATTCCCGGGTGCGAAACGTTTCTCGCTCGAGGGGGGAGATGCGCTGATACCCATGCTGAAAGAGATGGTTCGCCATGCGGGTAACAGCGGCACTCGCGAAGTGGTGCTGGGGATGGCGCACCGCGGTCGCCTGAACGTGCTGATCAACGTACTGGGTAAAAAACCGCAGGATCTGTTCGACGAATTTGCCAGTAAGCATAAAGAACATCTGGGTACCGGCGACGTGAAGTATCACATGGGCTTCTCGTCAGATATCGAAACCGAAGGCGGTCTGGTTCACCTGGCGCTGGCGTTTAACCCATCGCATCTGGAAATTGTGAGCCCGGTGGTGATGGGCTCCGTGCGCGCCCGTCTGGACAGACTGGACGAACCGAGCAGCAACAAAGTGTTGCCGATCACTATTCACGGCGACGCCGCGGTGACCGGCCAGGGCGTGGTTCAG\n->sucA_1410\n-AAACGCTTTCTGAACGAACTAACCGCCGCTGAAGGGCTGGAACGTTATCTGGGCGCCAAATTCCCCGGTGCGAAACGTTTCTCGCTGGAGGGGGGAGATGCTCTGGTACCCATGTTGAAAGAGATGGTTCGCCATGCGGGTAACAGCGGCACTCGCGAAGTGGTGCTGGGGATGGCGCACCGCGGTCGCCTGAACGTGCTGGTCAACGTACTGGGTAAAAAACCGCAGGATCTGTTCGACGAGTTTGCCGGTAAGCATAAAGAACATCTTGGTACCGGCGACGTGAAGTATCACATGGGCTTCTCGTCAGATATCGAAACCGAAGGCGGCCTGGTTCACCTGGCGCTGGCGTTTAACCCATCGCACCTGGAAATTGTGAGCCCGGTGGTGATGGGCTCCGTGCGTGCTCGTCTGGACAGACTGGACGAGCCGAGCAGCAACAAAGTGTTGCCGATCACTATTCACGGCGACGCCGCGGTGACCGGCCAGGGCGTGGTTCAG\n->sucA_1411\n-AAACGTTTCCTAAACGAACTGACCGCCGCTGAAGGGCTGGAACGTTATCTGGGCGCCAAATTCCCGGGTGCGAAACGTTTCTCGCTTGAGGGGGGAGATGCGCTGATACCCATGCTGAAAGAGATGGTTCGCCATGCGGGTAACAGCGGCACTCGCGAAGTGGTGCTGGGGATGGCGCACCGCGGTCGCCTGAACGTGCTGATCAACGTACTGGGTAAAAAACCGCAGGATCTGTTCGACGAATTTGCCGGTAAGCATAAAGAACATCTGGGTACCGGCGACGTGAAGTATCACATGGGCTTCTCGTCAGATATCGAAACCGAAGGCGGTCTGGTTCACCTGGCGCTGGCGTTTAACCCATCGCATTTGGAAATTGTGAGCCCGGTGGTGATGGGCTCCGTGCGCGCCCGTCTGGACAGACTGGACGAACCGAGCAGCAACAAAGTGTTGCCGATCACTATTCACGGCGACGCCGCGGTGACCGGCCAGGGCGTGGTTCAG\n->sucA_1412\n-AAACGTTTCCTGAACGAA
CTGACCGCCGCTGAAGGGCTGGAACGTTATCTGGGCGCCAAATTCCCGGGTGCGAAACGTTTCTCGCTTGAGGGGGGAGATGCGCTGATACCCATGCTGAAAGAGATGGTTCGCCATGCGGGTAACAGCGGCACTCGCGAAGTGGTGCTGGGGATGGCGCACCGCGGTCGCCTGAACGTGCTGATCAACGTACTGGGTAAAAAACCGCAGGATCTGTTCGACGAATTTGCCGGTAAGCATAAAGAACATCTGGGTACCGGCGACGTGAAGTATCACATGGGCTTCTCGTCAGATATCGAAACCGAAGGCGGTCTGGTTCACCTGGCACTGGCGTTTAACCCATCGCATTTGGAAATTGTGAGCCCGGTGGTGATGGGCTCCGTGCGCGCCCGTCTGGACAGACTGGACGAACCGAGCAGCAACAAAGTGTTGCCGATCACTATTCACGGCGACGCCGCGGTGACCGGCCAGGGCGTGGTTCAG\n->sucA_1415\n-AAACGCTTCCTGAACGAACTGACCGCCGCTGAAGGGCTGGAACGTTATCTGGGTGCCAAATTCCCGGGTGCGAAACGTTTCTCGCTCGAGGGGGGAGATGCGCTGATACCCATGCTGAAAGAGATGGTTCGCCATGCGGGTAACAGCGGCACTCGCGAAGTGGTGCTGGGGATGGCGCACCGCGGTCGCCTGAACGTGCTGATCAACGTACTGGGTAAAAAACCGCAGGATCTGTTCGACGAATTTGCCGGTAAGCATAAAGAACATCTGGGTACCGGCGACGTGAAGTATCACATGGGCTTCTCGTCAGATATCGAAACCGAAGGCGGTCTGGTTCACCTGGCGCTGGCGTTTAACCCATCGCATTTGGAAATTGTGAGCCCGGTGGTGATGGGCTCCGTGCGTGCCCGTCTGGACCGACTGGACGAACCGAGCAGCAACAAAGTGTTGCCGATCACTATTCACGGCGACGCCGCGGTGACCGGCCAGGGCGTGGTTCAG\n->sucA_1416\n-AAACGTTTCCTGAACGAACTGACCGCCGCTGAAGGGCTGGAACGTTATCTGGGCGCCAAATTCCCGGGTGCGAAACGTTTCTCGCTTGAGGGGGGAGATGCGTTGATACCCATGCTGAAAGAGATGGTTCGCCATGCGGGTAACAGCGGCACTCGCGAAGTGGTGCTGGGGATGGCGCACCGCGGTCGCCTGAACGTGCTGATCAACGTACTGGGTAAAAAACCGCAGGATCTGTTCGACGAATTTGCCGGTAAGCATAAAGAACATCTGGGTACCGGCGACGTGAAGTATCACATGGGCTTCTCGTCAGATATCGAAACCGAAGGCGGTCTGGTTCACCTGGCGCTGGCGTTTAACCCATCGCATTTGGAAATTGTGAGCCCGGTGGTGATGGGCTCCGTGCGCGCCCGTCTGGACAGACTGGACGAACCGAGCAGCAACAAAGTGTTGCCGATCACTATTCACGGCGACGCCGCGGTGACCGGCCAGGGCGTGGTTCAG\n->sucA_1417\n-AAACGCTTCCTGAACGAACTGACCGCCGCTGAAGGGCTGGAACGTTATCTGGGTGCCAAATTCCCGGGTGCGAAACGTTTCTCGCTCGAGGGGGGAGATGCGCTGATACCCATGCTGAAAGAGATGGTTCGCCATGCGGGTAACAGCGGCACTCGCGAAGTGGTGCTGGGGATGGCGCACCGTGGTCGCCTGAACGTGCTGATCAACGTACTGGGTAAAAAACCGCAGGATCTGTTCGACGAATTTGCCGGTAAGCATAAAGAACATCTGGGTACTGGCGACGTGAAGTATCACATGGGCTTCTCGTCAGATATCGAAACCGAAGGCGGTCTGGTTCACCTGGCGCTGGCGTTTAACCCATCGCATCTGGAAATTGTGAGCCCGGTGGTGATGGGCTCCGTGCGCGCCCGTCTGGACCGACTGGACGAACCGAGCAGTAATAAAGTGCTGCCGATCACTATTCACGG
CGACGCCGCGGTGACCGGCCAGGGCGTGGTTCAG\n'
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/seqsero2s_db/kmer/salmonella_thrA.tfa
--- a/SeqSero2S/seqsero2s_db/kmer/salmonella_thrA.tfa Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,2946 +0,0 @@\n->thrA_1\n-GTGCTGGGCCGTAATGGTTCCGACTATTCCGCCGCCGTGCTGGCCGCCTGTTTACGCGCTGACTGCTGTGAAATCTGGACTGACGTCGATGGCGTGTATACCTGTGACCCGCGCCAGGTGCCGGACGCCAGACTGCTGAAATCGATGTCCTACCAGGAAGCGATGGAACTCTCTTACTTCGGCGCCAAAGTCCTTCACCCTCGCACCATAACGCCTATCGCCCAGTTCCAGATCCCCTGTCTGATTAAAAATACCGGTAATCCGCAGGCGCCAGGAACGCTGATCGGCGCGTCCAGCGACGATGATAATCTGCCGGTTAAAGGGATCTCTAACCTTAACAACATGGCGATGTTTAGCGTCTCCGGCCCGGGAATGAAAGGGATGATTGGGATGGCGGCGCGTGTTTTCGCCGCCATGTCTCGCGCCGGGATCTCGGTGGTGCTCATTACCCAGTCCTCCTCTGAGTACAGCATCAGCTTCTGTGTGCCGCAGAGTGACTGC\n->thrA_2\n-GTGCTGGGCCGTAATGGTTCCGACTATTCCGCCGCCGTGCTGGCCGCCTGTTTACGCGCTGACTGCTGTGAAATCTGGACTGACGTCGATGGCGTGTATACCTGTGACCCGCGCCAGGTGCCGGACGCCAGGCTGCTGAAATCGATGTCCTACCAGGAAGCGATGGAACTCTCTTACTTCGGCGCCAAAGTCCTTCACCCTCGCACCATTACGCCCATCGCCCAGTTCCAGATCCCCTGTCTGATTAAAAATACCGGTAATCCGCAGGCGCCAGGAACGCTGATCGGCGCGTCCAGCGACGATGATAACCTGCCGGTTAAAGGGATCTCTAACCTTAACAACATGGCGATGTTTAGCGTCTCCGGCCCGGGAATGAAAGGGATGATTGGGATGGCGGCGCGTGTTTTCGCCGCCATGTCTCGCGCCGGGATCTCGGTGGTGCTCATTACCCAGTCCTCCTCTGAGTACAGCATCAGTTTCTGTGTGCCGCAGAGTGACTGC\n->thrA_3\n-GTGCTGGGCCGTAATGGTTCCGACTATTCCGCCGCCGTGCTGGCCGCCTGTTTACGCGCTGACTGCTGTGAAATCTGGACTGACGTCGATGGCGTGTATACCTGTGACCCGCGCCAGGTGCCGGACGCCAGGCTGCTGAAATCGATGTCCTACCAGGAAGCGATGGAACTCTCTTACTTCGGCGCCAAAGTCCTTCACCCTCGCACCATAACGCCTATCGCCCAGTTCCAGATCCCCTGTCTGATTAAAAATACCGGCAATCCGCAGGCGCCAGGAACGCTGATCGGCGCATCCAGCGACGATGATAATCTGCCGGTTAAAGGGATCTCTAACCTTAACAACATGGCGATGTTTAGCGTCTCCGGCCCGGGAATGAAAGGGATGATTGGGATGGCGGCGCGTGTTTTCGCCGCCATGTCTCGCGCCGGGATCTCGGTGGTGCTCATTACCCAGTCCTCCTCTGAGTACAGCATCAGCTTCTGTGTGCCGCAGAGTGACTGC\n->thrA_4\n-GTGCTGGGCCGTAATGGTTCCGACTATTCCGCCGCCGTGCTGGCCGCCTGTTTACGCGCTGACTGCTGTGAAATCTGGACTGACGTCGATGGCGTGTATACCTGTGACCCACGTCAGGTGCCGGACGCCAGGCTGCTGAAATCGATGTCCTACCAGGAAGCGATGGAACTCTCTTACTTCGGCGCCAAAGTCCTTCACCCTCGCACCATTACGCCTATCGCCCAGTTCCAGATCCCCTGTCTGATTAAAAATACCGGCAATCCGCAGGCGCCAGGAACGCTGATCGGCGCATCCAGCGACGATGATAATCTGCCGGTTAAAGGGATCTCTAACCTTAACAACATGGCGATGTTTAGCGTCTCCGGCCCGGGAATGAAAGGGATGATTGGGATGGCGGCGCGTGTTTTCGCCGCCATGTCTCGCGC
CGGGATCTCGGTGGTGCTCATTACCCAGTCCTCCTCTGAGTACAGCATCAGCTTCTGTGTGCCGCAGAGTGACTGC\n->thrA_5\n-GTGCTGGGCCGTAATGGTTCCGACTATTCCGCCGCCGTGCTGGCCGCCTGTTTACGCGCTGACTGCTGTGAAATCTGGACTGACGTCGATGGCGTGTATACCTGTGACCCGCGCCAGGTGCCGGACGCCAGGCTGTTGAAATCGATGTCCTACCAGGAAGCGATGGAGCTCTCTTACTTCGGCGCTAAAGTCCTTCACCCTCGCACCATAACGCCTATCGCCCAGTTCCAGATCCCCTGTCTGATTAAAAATACCGGCAATCCGCAGGCGCCAGGAACGCTGATCGGCGCGTCCAGCGACGATGATAATCTGCCGGTTAAAGGGATCTCTAACCTTAACAACATGGCGATGTTTAGCGTCTCCGGCCCGGGAATGAAAGGGATGATTGGGATGGCGGCGCGTGTTTTCGCCGCCATGTCTCGCGCCGGGATCTCGGTGGTGCTCATTACCCAGTCCTCCTCTGAGTACAGCATCAGCTTCTGTGTGCCGCAGAGTGACTGC\n->thrA_6\n-GTGCTGGGGCGTAATGGCTCTGACTACTCTGCCGCCGTGCTGGCCGCCTGTTTACGCGCTGACTGCTGTGAAATCTGGACTGACGTCGATGGCGTGTATACCTGTGACCCGCGCCAGGTGCCGGACGCCAGACTGCTGAAATCGATGTCCTACCAGGAAGCGATGGAACTCTCTTACTTCGGCGCCAAAGTCCTTCACCCTCGCACCATAACGCCTATCGCCCAGTTCCAGATCCCCTGTCTGATTAAAAATACCGGTAATCCGCAGGCGCCAGGAACGCTGATCGGCGCGTCCAGCGACGATGATAATCTGCCGGTGAAAGGGATCTCTAACCTTAACAACATGGCGATGTTTAGCGTCTCCGGCCCGGGAATGAAAGGGATGATTGGGATGGCGGCGCGTGTTTTCGCCGCCATGTCTCGCGCTGGGATCTCGGTGGTGCTCATTACCCAGTCCTCCTCTGAGTACAGCATCAGCTTCTGTGTGCCGCAGAGTGACTGC\n->thrA_7\n-GTGCTGGGCCGTAATGGTTCCGACTATTCCGCCGCCGTGCTGGCCGCCTGTTTACGCGCTGACTGCTGTGAAATCTGGACTGACGTCGATGGCGTGTATACCTGTGACCCGCGCCAGGTGCCGGACGCCAGGCTGCTGAAATCGATGTCCTACCAGGAAGCGATGGAACTCTCTTACTTCGGCGCCAAAGTTCTTCACCCTCGCACCATAACGCCTATCGCCCAGTTCCAGATCCCCTGTCTGATTAAAAATACCGGCAATCCGCAGGCGCCAGGAACGCTGATCGGCGCGTCCAGCGACGATGATAATCTGCCGGTCAAAGGGATCTCTAACCTTAACAATATGGCGATGTTTAGCGTCTCCGGCCCTGGAATGAAAGGGATGATTGGGATGGCGGCGCGTGTTTTCGCCGCCATGTCTCGCGCCGGGATCTCGGTGGTGCTCATTACCCAGTCCTCCTCTGAGTACAGCATCAGTTTCTGTGTGCCGCAGAGTGACTGC\n->thrA_8\n-GTGCTGGGCCGTAATGGTTCCGACTATTCCGCCGCCGTGCTGGCCGCCTGTTTACGCGCTGACTGCTGTGAAATCTGGACTGACGTCGATGGCGTGTATACCTGTGACCCGCGCCAGGTGCCGGACGCCAGGCTGTTGAAATCGATGTCCTACCAGGAAGCGATGGAGCTCTCTTACTTCGGCGCCAAAGTCCTTCACCCTCGCACCATAACGCCTATCGCCCAGTTCCAGATCCCCTGTCTGATTAAAAATACCGGCAATCCGCAGGCGCCAGGAACGCTGATCGGCGCGTCCAGCGACGATGATAATCTGCCGGTTAAAGGGATCTCTAACCTTAACAACATGGCGATGTTTAGCGTCTCCGGCCCG
GGAATGAAAGGGATGAT'..b'CCGCGCCAGGTGCCGGACGCCAGGCTGCTGAAATCGATGTCCTACCAGGAAGCGATGGAACTCTCTTACTTCGGCGCCAAAGTCCTTCACCCTCGCACCATAACGCCTATCGCCCAGTTCCAGATCCCCTGTCTGATTAAAAATACCGGCAATCCGCAGGCGCCAGGAACGCTGATCGGCGCGTCCAGCGACGATGATAATCTGCCGGTTAAAGGGATCTCTAACCTTAACAACATGGCGATGTTTAGCGTCTCCGGCCCGGGAATGAAAGGGATGATTGGGATGGCGGCGCGTGTTTTCGCCGCCATGTCTCGCGCCGGGATCTCGGTGGTGCTCATTACCCAGTCCTCCTCTGAGTACAGCATCAGCTTCTGTGTGCCGCAGAGTGACTGC\n->thrA_1615\n-GTGCTTGGGCGTAATGGCTCTGACTACTCTGCCGCCGTGCTGGCCGCCTGTTTACGCGCTGACTGCTGTGAAATCTGGACTGACGTCGATGGCGTGTATACCTGTGACCCGCGCCAGGTGCCGGACGCCAGGCTGTTGAAATCGATGTCCTACCAGGAAGCGATGGAGCTCTCTTACTTCGGCGCCAAAGTCCTTCACCCTCGCACCATAACGCCTATCGCCCAGTTCCAGATCCCCTGTCTGATTAAAAATACCGGCAATCCGCAGGCGCCAGGAACGCTGATCGGCGCGTCCAGCGACGATGATAATCTGCCAGTTAAAGGGATCTCTAACCTTAACAACATGGCGATGTTTAGCGTCTCCGGCCCGGGAATGAAAGGGATGATTGGGATGGCGGCGCGTGTTTTCGCCGCCATGTCTCGCGCCGGGATCTCAGTGGTGCTCATTACCCAGTCCTCCTCTGAGTACAGCATCAGCTTCTGTGTGCCGCAGAGTGACTGC\n->thrA_1616\n-GTACTGGGCCGTAACGGTTCCGACTATTCCGCCGCCGTGCTGGCCGCGTGTTTACGTGCTGACTGCTGTGAAATCTGGACTGACGTCGATGGCGTGTATACCTGTGACCCGCGCCAGGTGCCGGACGCCAGGCTGCTGAAATCGATGTCCTACCAGGAAGCGATGGAACTCTCTTACTTCGGCGCCAAAGTCCTTCACCCTCGCACCATTACGCCCATCGCCCAGTTCCAGATCCCCTGTCTGATTAAAAATACCGGCAATCCGCAGGCGCCAGGAACGCTGATCGGCGCGTCCAGCGACGATGATGATCTGCCGGTTAAAGGGATCTCTAACCTTAACAACATGGCGATGTTTAGCGTCTCCGGTCCGGGAATGAAAGGGATGATTGGGATGGCGGCGCGTGTTTTCGCCGCCATGTCTCGCGCCGGGATCTCGGTGGTACTCATTACCCAGTCCTCCTCTGAGTACAGCATCAGTTTCTGTGTGCCGCAGAGTGACTGC\n->thrA_1617\n-GTGCTGGGCCGTAATGGTTCCGACTATTCCGCCGCCGTGCTGGCCGCCTGTTTACGCGCTGACTGCTGTGAAATCTGGACTGACGTCGATGGCGTGTATACCTGTGACCCGCGCCAGGTGCCGGACGCCAGGCTGCTGAAATCGATGTCCTACCAGGAAGCGATGGAACTCTCTTACTTCGGCGCCAAAGTTCTTCACCCTCGTACCATTACGCCCATCGCCCAGTTCCAGATCCCCTGTCTGATTAAAAATACCGGTAATCCGCAGGCGCCAGGAACGCTGATCGGCGCGTCCAGCGACGATGATAACCTGCCGGTTAAAGGGATCTCTAACCTTAACAACATGGCGATGTTTAGCGTCTCCGGCCCGGGAATGAAAGGGATGATTGGGATGGCGGCGCGTGTTTTCGCCGCCATGTCTCGCGCCGGGATCTCGGTGGTGCTCATTACCCAGTCCTCCTCTGAGTACAGCATCAGCTTCTGTGTGCCGCAGAGTGACTGC\n->thrA_1618\n-GTGCTGGGCCGTAATGGT
TCCGACTATTCTGCCGCCGTGCTGGCCGCCTGTTTACGCGCTGACTGCTGTGAAATCTGGACTGACGTCGATGGCGTGTATACCTGTGACCCGCGCCAGGTGCCGGACGCCAGGCTGCTGAAATCGATGTCCTACCAGGAAGCGATGGAACTCTCTTACTTCGGCGCCAAAGTCCTTCACCCTCGCACCATTACGCCCATTGCTCAGTTCCAGATCCCCTGTCTGATTAAAAATACCGGCAATCCGCAGGCGCCAGGAACGCTGATCGGCGCGTCCAGCGACGATGATAATCTGCCGGTTAAAGGGATCTCTAACCTTAACAACATGGCGATGTTTAGCGTCTCCGGCCCGGGAATGAAAGGGATGATTGGGATGGCGGCGCGTGTTTTCGCCGCCATGTCTCGCGCCGGGATCTCGGTGGTACTCATTACCCAGTCCTCCTCTGAGTACAGCATCAGCTTCTGTGTGCCGCAGAGTGACTGC\n->thrA_1621\n-GTGCTGGGGCGTAATGGCTCTGACTACTCTGCCGCCGTGCTGGCCGCCTGTTTACGCGCTGACTGCTGTGAAATCTGGACTGACGTCGATGGTGTGTATACCTGTGACCCGCGCCAGGTGCCGGACGCCAGGCTGCTGAAATCGATGTCCTACCAGGAAGCGATGGAACTCTCTTACTTCGGCGCCAAAGTCCTTCACCCTCGCACCATTACGCCCATCGCCCAGTTCCAGATCCCCTGTCTGATTAAAAATACCGGTAATCCGCAGGTGCCAGGAACGCTGATCGGCGCGTCCAGCGACGATGATAATCTGCCGGTTAAAGGGATCTCTAACCTTAACAACATGGCGATGTTTAGCGTCTCCGGCCCTGGAATGAAAGGGATGATTGGGATGGCGGCGCGTGTTTTCGCCGCCATGTCTCGCGCCGGGATCTCGGTGGTGCTCATTACCCAGTCCTCCTCTGAGTACAGCATCAGCTTCTGTGTGCCGCAGAGTGACTGC\n->thrA_1623\n-GTGCTGGGCCGTAATGGTTCCGACTATTCCGCCGCCGTGCTGGCCGCCTGTTTACGCGCTGACTGCTGTGAAATCTGGACTGACGTCGATGGCGTGTATACCTGTGACCCGCGCCAGGTGCCGGACGCCAGGCTGTTGAAATCGATGTCCTACTAGGAAGCGATGGAGCTCTCTTACTTCGGCGCTAAAGTCCTTCACCCTCGCACCATAACGCCTATCGCCCAGTTCCAGATCCCCTGTCTGATTAAAAATACCGGCAATCCGCAGGCGCCAGGAACGCTGATCGGCGCGTCCAGCGACGATGATAATCTGCCGGTTAAAGGGATCTCTAACCTTAACAACATGGCGATGTTTAGCGTCTCCGGCCCGGGAATGAAAGGGATGATTGGGATGGCGGCGCGTGTTTTCGCCGCCATGTCTCGCGCCGGGATCTCGGTGGTGCTCATTACCCAGTCCTCCTCTGAGTACAGCATCAGCTTCTGTGTGCCGCAGAGTGACTGC\n->thrA_1624\n-GTGCTGGGGCGTAATGGCTCTGACTACTCTGCCGCCGTGCTGGCCGCCTGTTTACGCGCTGACTGCTGTGAAATCTGGACTGACGTCGATGGTGTGTATACCTGTGACCCGCGCCAGGTGCCGGACGCCAGGCTGCTGAAATCGATGTCCTACCAGGAAGCGATGGAACTCTCTTACTTCGGCGCCAAAGTCCTTCACCCTCGCACCATTACGCCCATCGCCCAGTTCCAGATCCCCTGTCTGATTAAAAATACCGGTAATCCGCAGGCGCCAGGAACGCTGATCGGCGCGTCCAGCGACGATGATAATCTGCCGGTTAAAGGGATCTCTAACCTTAACAACATGGCGATGTTTAGCGTCTCCGGCCCGGGAATGAAAGGGATGATTGGGATGGCGGCGCGTGTTTTCGCCGCCATGTCTCGCGCCGGAATCTCGGTGGTGCTCATTACCCAGTCCTCCTCTGAGTA
CAGCATCAGCTTCTGTGTGCCGCAGAGTGACTGC\n'
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/seqsero2s_db/kmer/salmonella_weight.txt
--- a/SeqSero2S/seqsero2s_db/kmer/salmonella_weight.txt Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
@@ -1,9 +0,0 @@
-purE_631 0.7904408017272534
-purE_748 0.83309951166174
-purE_749 0.7904408017272534
-purE_781 0.8757582215962267
-purE_866 0.7904408017272534
-purE_868 0.8180434963907447
-purE_971 1.076505091876164
-purE_1502 0.83309951166174
-purE_1537 1.0539210689696712
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/seqsero2s_db/mlst.pickle
b
Binary file SeqSero2S/seqsero2s_db/mlst.pickle has changed
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/seqsero2s_db/special.pickle
b
Binary file SeqSero2S/seqsero2s_db/special.pickle has changed
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb SeqSero2S/setup.py
--- a/SeqSero2S/setup.py Fri May 15 17:55:16 2026 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
[
@@ -1,31 +0,0 @@
-import os, sys
-from distutils.core import setup
-from setuptools import find_packages
-
-def readme():
-    with open('README.md') as f:
-        return f.read()
-
-setup(name='SeqSero2S',
-    #version=open("version.py").readlines()[-1].split()[-1].strip("\"'"),
-    version='1.1.4',
-    description='Salmonella serotyping',
-    long_description=readme(),
-    classifiers=[
-        'Development Status :: 3 - Alpha',
-        'License :: OSI Approved :: GNU General Public License v2 (GPLv2)',
-        'Programming Language :: Python :: 3',
-        'Topic :: Text Processing :: Linguistic',
-        ],
-    keywords='Salmonella serotyping bioinformatics WGS',
-    url='https://github.com/denglab/SeqSero2S/',
-    author='Shaokang Zhang, Hendrik C Den-Bakker and Xiangyu Deng',
-    author_email='zskzsk@uga.edu, Hendrik.DenBakker@uga.edu, xdeng@uga.edu',
-    license='GPLv2',
-    scripts=["bin/deinterleave_fastq.sh","bin/Initial_Conditions_SS2S.py","bin/Initial_Conditions_SS2.py","bin/SeqSero2S.py","bin/SeqSero2_update_kmer_database.py"],
-    packages=[""],
-    include_package_data = True,
-    install_requires=['biopython~=1.73'],
-    data_files=[("seqsero2s_db",["seqsero2s_db/mlst.pickle","seqsero2s_db/antigens.pickle","seqsero2s_db/H_and_O_and_specific_genes.fasta","seqsero2s_db/invA_mers_dict","seqsero2s_db/special.pickle"]),("seqsero2s_db/kmer",["seqsero2s_db/kmer/salmonella_35.txt","seqsero2s_db/kmer/salmonella_config.txt","seqsero2s_db/kmer/salmonella_hemD.tfa","seqsero2s_db/kmer/salmonella.log","seqsero2s_db/kmer/salmonella_purE.tfa","seqsero2s_db/kmer/salmonella_thrA.tfa","seqsero2s_db/kmer/salmonella_aroC.tfa","seqsero2s_db/kmer/salmonella_dnaN.tfa","seqsero2s_db/kmer/salmonella_hisD.tfa","seqsero2s_db/kmer/salmonella_profile.txt","seqsero2s_db/kmer/salmonella_sucA.tfa","seqsero2s_db/kmer/salmonella_weight.txt"])],
-    zip_safe=False,
-)
b
diff -r 4dbbf92ff30a -r 6041d8f4eeeb seqsero2S.xml
--- a/seqsero2S.xml Fri May 15 17:55:16 2026 +0000
+++ b/seqsero2S.xml Fri May 15 19:51:16 2026 +0000
b
@@ -1,4 +1,4 @@
-<tool id="seqsero2s" name="SeqSero2S" version="1.1.4+galaxytrakr+1">
+<tool id="seqsero2s" name="SeqSero2S" version="1.1.4+galaxytrakr">
     <description>Simplified Salmonella serotype prediction</description>
     <requirements>
         <container type="docker">quay.io/galaxytrakr/seqsero2s:1.1.3</container>