diff --git a/Dockerfiles/anvio-main/Dockerfile b/Dockerfiles/anvio-main/Dockerfile
index 42fb74cfb9..af3d005871 100644
--- a/Dockerfiles/anvio-main/Dockerfile
+++ b/Dockerfiles/anvio-main/Dockerfile
@@ -12,7 +12,7 @@
 #
 
 FROM continuumio/miniconda3:4.11.0
-ENV ANVIO_VERSION "7.1_main_0522"
+ENV ANVIO_VERSION "8"
 
 SHELL ["/bin/bash", "--login", "-c"]
 
@@ -21,7 +21,7 @@ RUN conda config --env --add channels conda-forge
 
 # Create a conda environment for anvi'o, activate it, and make sure it will
 # always be activated
-RUN conda create -n anvioenv python=3.7
+RUN conda create -n anvioenv python=3.10
 RUN conda init bash
 RUN conda activate anvioenv
 RUN echo "conda activate anvioenv" >> ~/.bashrc
@@ -43,23 +43,29 @@ RUN conda install -y nano
 RUN conda install -y -c conda-forge mamba
 
 # Setup the environment
-RUN mamba install -y -c bioconda -c conda-forge python=3.7 \
-        sqlite prodigal idba mcl muscle=3.8.1551 hmmer diamond \
-        blast megahit spades bowtie2 tbb=2020.3 bwa graphviz \
-        "samtools >=1.9" trimal iqtree trnascan-se fasttree vmatch \
-        r-base r-tidyverse r-optparse r-stringi r-magrittr
+RUN mamba install -y -c conda-forge -c bioconda python=3.10 \
+        sqlite prodigal idba mcl muscle=3.8.1551 famsa hmmer diamond \
+        blast megahit spades bowtie2 bwa graphviz "samtools>=1.9" \
+        trimal iqtree trnascan-se fasttree vmatch r-base r-tidyverse \
+        r-optparse r-stringi r-magrittr bioconductor-qvalue meme ghostscript
 
 # try this, too. it may also fail to install. which is OK:
 RUN mamba install -y -c bioconda fastani
 
-# install qvalue
-RUN Rscript -e 'install.packages("BiocManager", repos="https://cran.rstudio.com"); BiocManager::install("qvalue")'
+RUN wget -qO- "https://cmake.org/files/v3.23/cmake-3.23.1-linux-"$(uname -m)".tar.gz" | tar --strip-components=1 -xz -C /usr/local
+
+# Install the GCC compiler and mono-mcs
+RUN apt-get update && \
+    apt-get -y install gcc mono-mcs && \
+    rm -rf /var/lib/apt/lists/*
 
 # Install anvi'o from pip
-RUN pip install git+https://github.com/merenlab/anvio.git
+RUN curl -L https://github.com/merenlab/anvio/releases/download/v8/anvio-8.tar.gz \
+        --output anvio-8.tar.gz
+RUN pip install anvio-8.tar.gz
 
-# Install METABAT and DAS_TOOL
-RUN conda install metabat2 das_tool
+# Install METABAT and DAS_TOOL (currently disabled)
+#RUN mamba install metabat2 das_tool
 
 # Install CONCOCT
 RUN apt-get update && apt-get install -qq build-essential libgsl0-dev bedtools mummer samtools perl libssl-dev
diff --git a/anvio/argparse.py b/anvio/argparse.py
index 3cadf630c7..20a97fcac9 100755
--- a/anvio/argparse.py
+++ b/anvio/argparse.py
@@ -59,7 +59,7 @@ def get_anvio_epilogue(self):
 
         version = anvio.anvio_version_for_help_docs
 
-        general_help = f"https://merenlab.org/software/anvio/help/{version}"
+        general_help = f"https://anvio.org/help/{version}"
         program_help = f"{general_help}/programs/{self.prog}"
 
         if os.path.exists(os.path.join(os.path.dirname(docs.__file__), f"programs/{self.prog}.md")):
diff --git a/anvio/biochemistry/reactionnetwork.py b/anvio/biochemistry/reactionnetwork.py
index 54ffc93c56..91d2081241 100644
--- a/anvio/biochemistry/reactionnetwork.py
+++ b/anvio/biochemistry/reactionnetwork.py
@@ -20,17 +20,18 @@
 import pandas as pd
 import multiprocessing as mp
 
+from argparse import Namespace
 from typing import Dict, List, Set, Tuple
 
 import anvio.utils as utils
+import anvio.dbinfo as dbinfo
 import anvio.tables as tables
 import anvio.terminal as terminal
 import anvio.filesnpaths as filesnpaths
 
 from anvio.errors import ConfigError
-from anvio.dbops import ContigsDatabase
-from anvio.dbops import ContigsSuperclass
 from anvio import DEBUG, __file__ as ANVIO_PATH, __version__ as VERSION
+from anvio.dbops import ContigsDatabase, PanDatabase, ContigsSuperclass, PanSuperclass
 
 
 __author__ = "Developers of anvi'o (see AUTHORS.txt)"
@@ -92,10 +93,13 @@ def __init__(self) -> None:
         self.e_values: List[float] = []
 
 class GeneCluster:
-    """Representation of a gene cluster."""
+    """Representation of a gene cluster in the metabolic network."""
     def __init__(self) -> None:
-        # genes in the gene cluster
-        self.genes: List[Gene] = []
+        self.gene_cluster_id: int = None
+        # Consensus KO among the genes in the cluster. The KO annotations of genes in genomes that
+        # underlie each consensus annotation are not tracked. This would require storing more data
+        # on the consensus annotations in `dbops.PanSuperclass.get_gene_cluster_function_summary`.
+        self.ko: KO = None
 
 class Bin:
     """Representation of a bin of genes or gene clusters."""
@@ -693,7 +697,7 @@ def export_json(
         overwrite: bool = False,
         objective: str = None,
         remove_missing_objective_metabolites: bool = False,
-        record_bins: tuple = ('gene', ),
+        # record_bins: tuple = ('gene', ),
         indent: int = 2,
         progress: terminal.Progress = terminal.Progress()
     ) -> None:
@@ -856,87 +860,87 @@ def export_json(
             json.dump(json_dict, f, indent=indent)
         progress.end()
 
-# class PangenomicNetwork(ReactionNetwork):
-#     """A reaction network predicted from KEGG KO and ModelSEED annotations of pangenomic gene clusters."""
-#     def __init__(self) -> None:
-#         # map gene cluster ID to gene cluster object
-#         self.gene_clusters: Dict[str, GeneCluster] = {}
-#         self.bins: Dict[str, GeneClusterBin] = {}
-#         self.collection: BinCollection = None
-#         super().__init__()
+class PangenomicNetwork(ReactionNetwork):
+    """A reaction network predicted from KEGG KO and ModelSEED annotations of pangenomic gene clusters."""
+    def __init__(self) -> None:
+        # map gene cluster ID to gene cluster object
+        self.gene_clusters: Dict[str, GeneCluster] = {}
+        self.bins: Dict[str, GeneClusterBin] = {}
+        self.collection: BinCollection = None
+        super().__init__()
 
-#     def export_json(
-#         self,
-#         path: str,
-#         annotate_genes: tuple = ('genome', 'bin', ),
-#         annotate_reactions: tuple = ('genome', 'bin', 'kegg_reaction', 'ec_number'),
-#         annotate_metabolites: tuple = ('genome', 'bin', 'kegg_compound'),
-#         run: terminal.Run = terminal.Run(),
-#         progress: terminal.Progress = terminal.Progress()
-#     ) -> None:
-#         """
-#         Export the network to a metabolic model file in JSON format. *Gene entries in this file
-#         represent gene clusters.* Optionally, gene, reaction, and metabolite entries in this file
-#         are annotated with the names of genomes and names of gene cluster bins in which they occur.
+    def export_json(
+        self,
+        path: str,
+        annotate_genes: tuple = ('genome', 'bin', ),
+        annotate_reactions: tuple = ('genome', 'bin', 'kegg_reaction', 'ec_number'),
+        annotate_metabolites: tuple = ('genome', 'bin', 'kegg_compound'),
+        run: terminal.Run = terminal.Run(),
+        progress: terminal.Progress = terminal.Progress()
+    ) -> None:
+        """
+        Export the network to a metabolic model file in JSON format. *Gene entries in this file
+        represent gene clusters.* Optionally, gene, reaction, and metabolite entries in this file
+        are annotated with the names of genomes and names of gene cluster bins in which they occur.
 
-#         Parameters
-#         ==========
-#         path : str
-#             output JSON file path
+        Parameters
+        ==========
+        path : str
+            output JSON file path
 
-#         annotate_genes : tuple, ('genome', 'bin', )
-#             Annotate gene (cluster) entries in the JSON file with additional data, selecting
-#             from the following:
+        annotate_genes : tuple, ('genome', 'bin', )
+            Annotate gene (cluster) entries in the JSON file with additional data, selecting
+            from the following:
 
-#             'genome' : genomes in which the genes of the cluster occur
+            'genome' : genomes in which the genes of the cluster occur
 
-#             'bin' : bins in which the gene cluster occurs
+            'bin' : bins in which the gene cluster occurs
 
-#             'all_ko' : all KOs associated with genes in the cluster, sorted in descending order of
-#                 the number of genes in the cluster that were associated with each KO and then mean
-#                 e-value of gene-KO assignments
+            'all_ko' : all KOs associated with genes in the cluster, sorted in descending order of
+                the number of genes in the cluster that were associated with each KO and then mean
+                e-value of gene-KO assignments
 
-#             'ko' : KOs associated with the gene cluster that yielded reactions in the network,
-#                 sorted in descending order of the number of genes in the cluster that were
-#                 associated with each KO and then mean e-value of gene-KO assignments
+            'ko' : KOs associated with the gene cluster that yielded reactions in the network,
+                sorted in descending order of the number of genes in the cluster that were
+                associated with each KO and then mean e-value of gene-KO assignments
 
-#             'ko_count' : number of genes in the cluster that were associated with each KO; if
-#                 'all_ko' is provided, then each value corresponds to a KO in 'all_ko', whereas if
-#                 only 'ko' is provided, then each value corresponds to a KO in 'ko'
+            'ko_count' : number of genes in the cluster that were associated with each KO; if
+                'all_ko' is provided, then each value corresponds to a KO in 'all_ko', whereas if
+                only 'ko' is provided, then each value corresponds to a KO in 'ko'
 
-#             'e_value' : mean scores of KO associations with genes in the cluster; if 'all_ko' is
-#                 provided, then each value corresponds to a KO in 'all_ko', whereas if only 'ko' is
-#                 provided, then each value corresponds to a KO in 'ko'
+            'e_value' : mean scores of KO associations with genes in the cluster; if 'all_ko' is
+                provided, then each value corresponds to a KO in 'all_ko', whereas if only 'ko' is
+                provided, then each value corresponds to a KO in 'ko'
 
-#         annotate_reactions : tuple, ('genome', 'bin', 'kegg_reaction', 'ec_number')
-#             Annotate reaction entries in the JSON file with additional data, selecting from the following:
+        annotate_reactions : tuple, ('genome', 'bin', 'kegg_reaction', 'ec_number')
+            Annotate reaction entries in the JSON file with additional data, selecting from the following:
 
-#             'genome' : genomes in which the reaction occurs
+            'genome' : genomes in which the reaction occurs
 
-#             'bin' : bins in which the reaction occurs
+            'bin' : bins in which the reaction occurs
 
-#             'kegg_reaction' : KO-associated KEGG reaction IDs yielding the ModelSEED reaction
+            'kegg_reaction' : KO-associated KEGG reaction IDs yielding the ModelSEED reaction
 
-#             'ec_number' : KO-associated EC numbers yielding the ModelSEED reaction
+            'ec_number' : KO-associated EC numbers yielding the ModelSEED reaction
 
-#             'ko' : KOs yielding the ModelSEED reaction
+            'ko' : KOs yielding the ModelSEED reaction
 
-#         annotate_metabolites : tuple, ('genome', 'bin', 'kegg_compound')
-#             Annotate metabolite entries in the JSON file with additional data, selecting from the following:
+        annotate_metabolites : tuple, ('genome', 'bin', 'kegg_compound')
+            Annotate metabolite entries in the JSON file with additional data, selecting from the following:
 
-#             'genome' : genomes in which the metabolite occurs
+            'genome' : genomes in which the metabolite occurs
 
-#             'bin' : bins in which the metabolite occurs
+            'bin' : bins in which the metabolite occurs
 
-#             'kegg_compound' : KEGG compound aliases of the ModelSEED compound
+            'kegg_compound' : KEGG compound aliases of the ModelSEED compound
 
-#             'ko' : KOs yielding the ModelSEED compound
+            'ko' : KOs yielding the ModelSEED compound
 
-#         run : terminal.Run, terminal.Run()
+        run : terminal.Run, terminal.Run()
 
-#         progress : terminal.Progress, terminal.Progress()
-#         """
-#         pass
+        progress : terminal.Progress, terminal.Progress()
+        """
+        pass
 
 class JSONStructure:
     """JSON structure of metabolic model file."""
@@ -1349,7 +1353,7 @@ class ModelSEEDDatabase:
     By default, the database is loaded from a default directory of ModelSEED files unless an
     alternative directory is provided.
     """
-    default_dir = os.path.join(os.path.dirname(ANVIO_PATH), 'data/MISC/ModelSEED')
+    default_dir = os.path.join(os.path.dirname(ANVIO_PATH), 'data/misc/MODELSEED')
 
     # Compounds are identified as cytosolic or extracellular in ModelSEED reactions.
     compartment_ids = {0: 'c', 1: 'e'}
@@ -1387,7 +1391,7 @@ def __init__(self, modelseed_dir: str = None) -> None:
         with open(sha_path) as f:
             self.sha = f.read().strip()
         reactions_table = pd.read_csv(reactions_path, sep='\t', header=0, low_memory=False)
-        self.compounds_table = pd.read_csv(compounds_path, sep='\t', header=0, index_col='id', low_memory=False)
+        self.compounds_table: pd.DataFrame = pd.read_csv(compounds_path, sep='\t', header=0, index_col='id', low_memory=False)
 
         # Facilitate lookup of reaction data by KEGG REACTION ID via a reorganized reactions table.
         # Remove reactions without KEGG aliases.
@@ -1646,7 +1650,7 @@ def load_contigs_database_network(
         # Check that the network stored in the contigs database was made from the same set of KEGG
         # KO gene annotations as currently in the database.
         stored_hash = contigs_super.a_meta['reaction_network_ko_annotations_hash']
-        current_hash = self.hash_ko_annotations(contigs_super.gene_function_calls_dict)
+        current_hash = self.hash_contigs_db_ko_annotations(contigs_super.gene_function_calls_dict)
         if check_gene_annotations:
             if stored_hash != current_hash:
                 ConfigError(
@@ -1901,10 +1905,12 @@ def load_contigs_database_network(
     def make_network(
         self,
         contigs_db: str = None,
-        genomes_storage_db: str = None,
         pan_db: str = None,
+        genomes_storage_db: str = None,
         store: bool = True,
-        overwrite_existing_network: bool = False
+        overwrite_existing_network: bool = False,
+        consensus_threshold: float = None,
+        discard_ties: bool = False
     ) -> ReactionNetwork:
         """
         Make a metabolic reaction network from KEGG Orthologs stored in an anvi'o database,
@@ -1918,15 +1924,15 @@ def make_network(
             gene KO annotations stored in the database. If 'store' is True, the network is saved in
             the database.
 
-        genomes_storage_db : str, None
-            Path to a genomes storage database. The pangenomic network is derived from gene KO
-            annotations stored in the database. 'pan_db' is also required.
-
         pan_db : str, None
             Path to a pan database. The pangenomic network is determined for gene clusters stored in
             the database. If 'store' is True, the network is saved in the database.
             'genomes_storage_db' is also required.
 
+        genomes_storage_db : str, None
+            Path to a genomes storage database. The pangenomic network is derived from gene KO
+            annotations stored in the database. 'pan_db' is also required.
+
         store : bool, True
             Save the network. A network constructed from a contigs database is stored in that
             database. A pangenomic network constructed from a genomes stroage database and pan
@@ -1935,22 +1941,51 @@ def make_network(
         overwrite_existing_network : bool, False
             Overwrite an existing network stored in the contigs or pan database. 'store' is also
             required.
+
+        consensus_threshold : float, None
+            This parameter applies to pangenomes. With the default of None, the protein annotation
+            most frequent among genes in a cluster is assigned to the cluster itself. If a
+            non-default argument is provided (a value on [0, 1]), at least this proportion of genes
+            in the cluster must have the most frequent annotation for the cluster to be annotated.
+
+        discard_ties : bool, False
+            This parameter applies to pangenomes. If multiple protein annotations are most frequent
+            among genes in a cluster, then do not assign an annotation to the cluster itself when
+            this argument is True. By default, this argument is False, so one of the most frequent
+            annotations would be arbitrarily chosen.
         """
-        if contigs_db:
+        if contigs_db and (pan_db or genomes_storage_db):
+            raise ConfigError(
+                "Either a contigs database OR both a pan database and genomes storage database are required "
+                "to make either a (meta)genomic reaction network or a pangenomic reaction network, respectively."
+            )
+        elif contigs_db:
             self.run.info_single(
                 "A reaction network will be made from protein orthology annotations in the contigs database."
             )
-            network = self.make_contigs_database_network(contigs_db, store=store, overwrite_existing_network=overwrite_existing_network)
+            network = self.make_contigs_database_network(
+                contigs_db,
+                store=store,
+                overwrite_existing_network=overwrite_existing_network
+            )
         elif genomes_storage_db or pan_db:
             self.run.info_single(
                 "A pangenomic reaction network will be made from protein orthology annotations "
                 "in the genomes storage database and gene clusters in the pan database."
             )
-            network = self.make_pangenomic_network(genomes_storage_db, pan_db, store=store, overwrite_existing_network=overwrite_existing_network)
+            network = self.make_pangenomic_network(
+                pan_db,
+                genomes_storage_db,
+                store=store,
+                overwrite_existing_network=overwrite_existing_network,
+                consensus_threshold=consensus_threshold,
+                discard_ties=discard_ties
+            )
         else:
             raise ConfigError(
-                "A reaction network cannot be made without a database source. "
-                "Either a contigs database or a genomes storage database and pan database are required."
+                "A reaction network cannot be made without a database source. Either a contigs database OR "
+                "a pan database and genomes storage database are required to make either a (meta)genomic "
+                "reaction network or a pangenomic reaction network, respectively."
             )
         return network
 
@@ -2036,14 +2071,13 @@ def make_contigs_database_network(
                 # with the KO were added to the network as well.
                 gene.kos.append(network.kos[ko_id])
                 continue
-            else:
-                ko = KO()
-                ko.id = ko_id
-                ko.name = ko_data[1]
-                gene.kos.append(ko)
-                # Add the KO to the network, regardless of whether it yields reactions. KOs not
-                # contributing to the network are removed later.
-                network.kos[ko_id] = ko
+            ko = KO()
+            ko.id = ko_id
+            ko.name = ko_data[1]
+            gene.kos.append(ko)
+            # Add the KO to the network, regardless of whether it yields reactions. KOs not
+            # contributing to the network are removed later.
+            network.kos[ko_id] = ko
 
             # Find KEGG reactions and EC numbers associated with the newly encountered KO.
             try:
@@ -2069,132 +2103,14 @@ def make_contigs_database_network(
                 # be associated with ModelSEED reactions.
                 continue
 
-            # If a KEGG reaction has already been encountered, then aliased ModelSEED reactions have
-            # been processed and added as ModelSEEDReaction objects to the network. Therefore, KEGG
-            # reactions that have already been encountered are treated differently than KEGG
-            # reactions encountered for the first time.
-            new_kegg_reaction_ids = []
-            for kegg_reaction_id in ko_kegg_reaction_ids:
-                try:
-                    # The KEGG reaction has already been encountered. Retrieve ModelSEED reactions
-                    # aliased by the KEGG reaction.
-                    modelseed_reaction_ids = network.kegg_modelseed_aliases[kegg_reaction_id]
-                except KeyError:
-                    new_kegg_reaction_ids.append(kegg_reaction_id)
-                    # The following list of ModelSEED reaction IDs associated with the KEGG reaction
-                    # is filled in later. If no ModelSEED reactions are associated with the KEGG
-                    # reaction, the entry in the dictionary will be removed.
-                    network.kegg_modelseed_aliases[kegg_reaction_id] = []
-                    continue
-                for modelseed_reaction_id in modelseed_reaction_ids:
-                    try:
-                        # Retrieve the existing ModelSEEDReaction object.
-                        reaction = network.reactions[modelseed_reaction_id]
-                    except KeyError:
-                        # The ModelSEED reaction associated with the EC number did not have valid
-                        # data: for example, when the 'stoichiometry' field is empty.
-                        continue
-                    # Associate the ModelSEED reaction with the newly encountered KO.
-                    ko.reactions[modelseed_reaction_id] = reaction
-                    # Record which KEGG REACTION IDs and EC numbers from the KO yield the ModelSEED reaction.
-                    ko.kegg_reaction_aliases[modelseed_reaction_id] = list(
-                        set(ko_kegg_reaction_ids).intersection(set(reaction.kegg_aliases))
-                    )
-                    ko.ec_number_aliases[modelseed_reaction_id] = list(
-                        set(ko_ec_numbers).intersection(set(reaction.ec_number_aliases))
-                    )
-
-            # As above with KEGG reactions, if an EC number has already been encountered, then
-            # aliased ModelSEED reactions have been processed and added as ModelSEEDReaction objects
-            # to the network. Therefore, EC numbers that have already been encountered are treated
-            # differently than EC numbers encountered for the first time.
-            new_ec_numbers = []
-            for ec_number in ko_ec_numbers:
-                try:
-                    # The EC number has already been encountered. Retrieve ModelSEED reactions
-                    # aliased by the EC number.
-                    modelseed_reaction_ids = network.ec_number_modelseed_aliases[ec_number]
-                except KeyError:
-                    new_ec_numbers.append(ec_number)
-                    # The following list of ModelSEED reaction IDs associated with the EC number is
-                    # filled in later. If no ModelSEED reactions are associated with the EC number,
-                    # the entry in the dictionary will be removed.
-                    network.ec_number_modelseed_aliases[ec_number] = []
-                    continue
-                for modelseed_reaction_id in modelseed_reaction_ids:
-                    try:
-                        # Retrieve the existing ModelSEEDReaction object.
-                        reaction = network.reactions[modelseed_reaction_id]
-                    except KeyError:
-                        # The ModelSEED reaction associated with the EC number did not have valid
-                        # data: for example, when the 'stoichiometry' field is empty.
-                        continue
-                    if modelseed_reaction_id in reaction.ec_number_aliases:
-                        # A KEGG reaction associated with the newly encountered KO was also
-                        # associated with the ModelSEED reaction. KO EC number aliases were
-                        # previously recorded along with KO KEGG reaction aliases. Redundant work
-                        # can be avoided here linking the ModelSEED reaction to the KO in the network.
-                        continue
-                    ko.reactions[modelseed_reaction_id] = reaction
-                    ko.kegg_reaction_aliases[modelseed_reaction_id] = list(
-                        set(ko_kegg_reaction_ids).intersection(set(reaction.kegg_aliases))
-                    )
-                    ko.ec_number_aliases[modelseed_reaction_id] = list(
-                        set(ko_ec_numbers).intersection(set(reaction.ec_number_aliases))
-                    )
-
+            new_kegg_reaction_ids = self._parse_ko_kegg_reaction_ids(network, ko, ko_kegg_reaction_ids, ko_ec_numbers)
+            new_ec_numbers = self._parse_ko_ec_numbers(network, ko, ko_ec_numbers, ko_kegg_reaction_ids)
             if not (new_kegg_reaction_ids or new_ec_numbers):
                 # All of the KEGG reactions and EC numbers associated with the KO have already been
                 # encountered in previously processed KOs and added to the network, so proceed to
                 # the next gene KO annotation.
                 continue
-
-            # Get data on ModelSEED reactions aliased by newly encountered KEGG REACTION IDs and EC numbers.
-            modelseed_reactions_data = {}
-            if new_kegg_reaction_ids:
-                # Each row of the table represents a unique KEGG reaction -> ModelSEED reaction mapping.
-                modelseed_kegg_reactions_dict: Dict[str, Dict] = modelseed_kegg_reactions_table[
-                    modelseed_kegg_reactions_table['KEGG_REACTION_ID'].isin(new_kegg_reaction_ids)
-                ].to_dict(orient='index')
-                for modelseed_reaction_data in modelseed_kegg_reactions_dict.values():
-                    kegg_reaction_id = modelseed_reaction_data['KEGG_REACTION_ID']
-                    modelseed_reaction_id = modelseed_reaction_data['id']
-                    # Record the association between the KEGG reaction and ModelSEED reaction in the
-                    # network, and vice versa.
-                    network.kegg_modelseed_aliases[kegg_reaction_id].append(modelseed_reaction_id)
-                    try:
-                        network.modelseed_kegg_aliases[modelseed_reaction_id].append(kegg_reaction_id)
-                    except KeyError:
-                        # This is the first time the ModelSEED reaction has been encountered.
-                        network.modelseed_kegg_aliases[modelseed_reaction_id] = [kegg_reaction_id]
-                        network.modelseed_ec_number_aliases[modelseed_reaction_id] = []
-                    if modelseed_reaction_id in modelseed_reactions_data:
-                        # One of the other newly encountered KEGG reactions also mapped to this
-                        # ModelSEED reaction, so do not record redundant ModelSEED reaction data.
-                        continue
-                    modelseed_reactions_data[modelseed_reaction_id] = modelseed_reaction_data
-            if new_ec_numbers:
-                # Each row of the table represents a unique EC number -> ModelSEED reaction mapping.
-                modelseed_ec_reactions_dict: Dict[str, Dict] = modelseed_ec_reactions_table[
-                    modelseed_ec_reactions_table['EC_number'].isin(new_ec_numbers)
-                ].to_dict(orient='index')
-                for modelseed_reaction_data in modelseed_ec_reactions_dict.values():
-                    ec_number = modelseed_reaction_data['EC_number']
-                    modelseed_reaction_id = modelseed_reaction_data['id']
-                    # Record the association between the EC number and ModelSEED reaction in the
-                    # network, and vice versa.
-                    network.ec_number_modelseed_aliases[ec_number].append(modelseed_reaction_id)
-                    try:
-                        network.modelseed_ec_number_aliases[modelseed_reaction_id].append(ec_number)
-                    except KeyError:
-                        # This is the first time the ModelSEED reaction has been encountered.
-                        network.modelseed_ec_number_aliases[modelseed_reaction_id] = [ec_number]
-                        network.modelseed_kegg_aliases[modelseed_reaction_id] = []
-                    if modelseed_reaction_id in modelseed_reactions_data:
-                        # One of the other newly encountered KEGG reactions or EC numbers also
-                        # mapped to this ModelSEED reaction, so do not record redundant ModelSEED reaction data.
-                        continue
-                    modelseed_reactions_data[modelseed_reaction_id] = modelseed_reaction_data
+            modelseed_reactions_data = self._get_modelseed_reactions_data(network, new_kegg_reaction_ids, new_ec_numbers, modelseed_kegg_reactions_table, modelseed_ec_reactions_table)
             if not modelseed_reactions_data:
                 # The newly encountered KEGG REACTION IDs and EC numbers do not map to ModelSEED
                 # reactions (are not in the table).
@@ -2216,42 +2132,7 @@ def make_contigs_database_network(
                     # 'kegg_modelseed_aliases', 'ec_number_modelseed_aliases',
                     # 'modelseed_kegg_aliases', and 'modelseed_ec_number_aliases'.
                     continue
-                ko.reactions[modelseed_reaction_id] = reaction
-                # Record which KEGG REACTION IDs and EC numbers from the KO yield the ModelSEED reaction.
-                ko.kegg_reaction_aliases[modelseed_reaction_id] = list(
-                    set(new_kegg_reaction_ids).intersection(set(reaction.kegg_aliases))
-                )
-                ko.ec_number_aliases[modelseed_reaction_id] = list(
-                    set(new_ec_numbers).intersection(set(reaction.ec_number_aliases))
-                )
-                network.reactions[modelseed_reaction_id] = reaction
-
-                # If the ModelSEED compound ID has been encountered in previously processed
-                # reactions, then there is already a ModelSEEDCompound object for it.
-                new_modelseed_compound_ids = []
-                reaction_compounds = []
-                for modelseed_compound_id in modelseed_compound_ids:
-                    if modelseed_compound_id in network.metabolites:
-                        reaction_compounds.append(network.metabolites[modelseed_compound_id])
-                    else:
-                        new_modelseed_compound_ids.append(modelseed_compound_id)
-
-                # Generate new metabolite objects in the network
-                for modelseed_compound_id in new_modelseed_compound_ids:
-                    try:
-                        modelseed_compound_series: pd.Series = modelseed_compounds_table.loc[modelseed_compound_id]
-                    except KeyError:
-                        raise ConfigError(
-                            f"A row for the ModelSEED compound ID, '{modelseed_compound_id}', was expected "
-                            "but not found in the ModelSEED compounds table. This ID was found in the equation "
-                            f"for the ModelSEED reaction, '{modelseed_reaction_id}'."
-                        )
-                    modelseed_compound_data = modelseed_compound_series.to_dict()
-                    modelseed_compound_data['id'] = modelseed_compound_id
-                    compound = self._get_modelseed_compound(modelseed_compound_data)
-                    reaction_compounds.append(compound)
-                    network.metabolites[modelseed_compound_id] = compound
-                reaction.compounds = tuple(reaction_compounds)
+                self._add_modelseed_reaction(network, ko, reaction, new_kegg_reaction_ids, new_ec_numbers, modelseed_compound_ids, modelseed_compounds_table)
 
         # List genes that do not contribute to the reaction network. Remove any trace of these genes
         # from the network.
@@ -2318,6 +2199,11 @@ def make_contigs_database_network(
                 f"Here are the unrecognized KO IDs from the contigs database: {', '.join(undefined_ko_ids)}"
             )
 
+        ko_dir = KODatabase.default_dir if self.ko_dir is None else self.ko_dir
+        modelseed_dir = ModelSEEDDatabase.default_dir if self.modelseed_dir is None else self.modelseed_dir
+        self.run.info("Reference KEGG KO database directory", ko_dir, nl_before=1)
+        self.run.info("Reference ModelSEED database directory", modelseed_dir)
+
         if store:
             if contigs_super.a_meta['reaction_network_ko_annotations_hash']:
                 self.run.warning("Deleting existing reaction network from contigs database")
@@ -2329,12 +2215,24 @@ def make_contigs_database_network(
 
             self.progress.new("Saving reaction network to contigs database")
             self.progress.update("Reactions table")
-            self._store_contigs_database_reactions(network, contigs_db)
+            reactions_table = self._get_database_reactions_table(network)
+            cdb = ContigsDatabase(contigs_db)
+            cdb.db._exec_many(
+                f'''INSERT INTO {tables.gene_function_reactions_table_name} VALUES ({','.join('?' * len(tables.gene_function_reactions_table_structure))})''',
+                reactions_table.values
+            )
+            cdb.disconnect()
             self.progress.update("Metabolites table")
-            self._store_contigs_database_metabolites(network, contigs_db)
+            metabolites_table = self._get_database_metabolites_table(network)
+            cdb = ContigsDatabase(contigs_db)
+            cdb.db._exec_many(
+                f'''INSERT INTO {tables.gene_function_metabolites_table_name} VALUES ({','.join('?' * len(tables.gene_function_metabolites_table_structure))})''',
+                metabolites_table.values
+            )
+            cdb.disconnect()
 
             self.progress.update("Metadata")
-            ko_annotations_hash = self.hash_ko_annotations(gene_function_calls_dict)
+            ko_annotations_hash = self.hash_contigs_db_ko_annotations(gene_function_calls_dict)
             cdb = ContigsDatabase(contigs_db)
             cdb.db.set_meta_value('reaction_network_ko_annotations_hash', ko_annotations_hash)
             cdb.db.set_meta_value('reaction_network_kegg_database_release', ko_db.release)
@@ -2366,6 +2264,7 @@ def make_contigs_database_network(
 
         self.progress.new("Counting reactions and KO sources")
         self.progress.update("...")
+        # This group of network statistics is found the same way for both contigs and pan databases.
 
         stats['Reactions in network'] = reaction_count = len(network.reactions)
         reaction_counts = []
@@ -2384,6 +2283,7 @@ def make_contigs_database_network(
 
         self.progress.new("Counting reactions from each alias source")
         self.progress.update("...")
+        # This group of network statistics is found the same way for both contigs and pan databases.
 
         kegg_reaction_source_count = 0
         ec_number_source_count = 0
@@ -2436,6 +2336,7 @@ def make_contigs_database_network(
 
         self.progress.new("Counting reactions and metabolites by property")
         self.progress.update("...")
+        # This group of network statistics is found the same way for both contigs and pan databases.
 
         reversible_count = 0
         irreversible_count = 0
@@ -2515,173 +2416,942 @@ def make_contigs_database_network(
 
         return network
 
-    def _get_modelseed_reaction(self, modelseed_reaction_data: Dict) -> Tuple[ModelSEEDReaction, List[str]]:
+    def make_pangenomic_network(
+        self,
+        pan_db: str,
+        genomes_storage_db: str,
+        store: bool = True,
+        overwrite_existing_network: bool = False,
+        consensus_threshold: float = None,
+        discard_ties: bool = False
+    ) -> PangenomicNetwork:
         """
-        Generate a ModelSEED reaction object and list of associated ModelSEED compound IDs from the
-        ModelSEED reaction table entry. The reaction object is not populated with metabolite objects
-        from the list of associated compound IDs.
+        Make a pangenomic metabolic reaction network from KEGG Orthologs stored in a genomes
+        storage database and gene clusters stored in a pan database.
 
         Parameters
         ==========
-        modelseed_reaction_data : Dict
-            A dictionary representation of a row for a reaction in the ModelSEED reaction table set
-            up by anvi'o.
-
-        Returns
-        =======
-        ModelSEEDReaction
-            An object representation of the ModelSEED reaction.
-
-        List[str]
-            ModelSEED compound IDs of reactants and products.
-        """
-        stoichiometry: str = modelseed_reaction_data['stoichiometry']
-        if pd.isna(stoichiometry):
-            # ignore any reaction lacking a chemical equation for some reason
-            return None, None
+        pan_db : str
+            Path to a pan database. The pangenomic network is determined for gene clusters stored in
+            the database.
 
-        reaction = ModelSEEDReaction()
+        genomes_storage_db : str
+            Path to a genomes storage database. The pangenomic network is derived from gene KO
+            annotations stored in the database.
 
-        modelseed_id = modelseed_reaction_data['id']
-        if pd.isna(modelseed_id):
-            raise ConfigError(
-                "The row for the reaction in the ModelSEED table does not but should have an ID. "
-                f"Here is the data in the row: '{modelseed_reaction_data}'"
-            )
-        reaction.modelseed_id = modelseed_id
+        store : bool, True
+            Save the network to the pan database.
 
-        modelseed_name = modelseed_reaction_data['name']
-        if pd.isna(modelseed_name):
-            reaction.modelseed_name = None
-        else:
-            reaction.modelseed_name = modelseed_name
+        overwrite_existing_network : bool, False
+            Overwrite an existing network stored in the pan database. 'store' is also required.
 
-        kegg_reaction_ids: str = modelseed_reaction_data['KEGG']
-        if pd.isna(kegg_reaction_ids):
-            reaction.kegg_aliases = tuple()
-        else:
-            reaction.kegg_aliases = tuple(kegg_reaction_ids.split('; '))
+        consensus_threshold : float, None
+            With the default of None, the protein annotation most frequent among genes in a cluster
+            is assigned to the cluster itself. If a non-default argument is provided (a value on [0,
+            1]), at least this proportion of genes in the cluster must have the most frequent
+            annotation for the cluster to be annotated.
 
-        ec_numbers: str = modelseed_reaction_data['ec_numbers']
-        if pd.isna(ec_numbers):
-            reaction.ec_number_aliases = []
-        else:
-            reaction.ec_number_aliases = ec_numbers.split('|')
+        discard_ties : bool, False
+            If multiple protein annotations are most frequent among genes in a cluster, then do not
+            assign an annotation to the cluster itself when this argument is True. By default, this
+            argument is False, so one of the most frequent annotations would be arbitrarily chosen.
 
-        reversibility = modelseed_reaction_data['reversibility']
-        if pd.isna(reversibility):
+        Returns
+        =======
+        PangenomicNetwork
+            The network derived from the pangenomic databases.
+        """
+        # Load the pan database.
+        args = Namespace()
+        args.pan_db = pan_db
+        args.genomes_storage = genomes_storage_db
+        args.discard_ties = discard_ties
+        args.consensus_threshold = consensus_threshold
+        pan_super = PanSuperclass(args, r=run_quiet)
+
+        if store and pan_super.p_meta['reaction_network_ko_annotations_hash'] and not overwrite_existing_network:
             raise ConfigError(
-                "The row for the reaction in the ModelSEED table was expected to have a 'reversibility' value. "
-                f"Here is the data in the row: '{modelseed_reaction_data}'"
+                "The existing reaction network in the pan database must be explicitly overwritten."
             )
-        if reversibility == '=' or reversibility == '?':
-            # Assume that reactions lacking data ('?') are reversible.
-            reaction.reversibility = True
-        else:
-            reaction.reversibility = False
 
-        decimal_reaction_coefficients = []
-        split_stoichiometry = stoichiometry.split(';')
-        modelseed_compound_ids = []
-        compartments = []
-        for entry in split_stoichiometry:
-            split_entry = entry.split(':')
-            decimal_reaction_coefficients.append(split_entry[0])
-            modelseed_compound_ids.append(split_entry[1])
-            compartments.append(ModelSEEDDatabase.compartment_ids[int(split_entry[2])])
-        reaction.compartments = tuple(compartments)
-        reaction_coefficients = self._to_lcm_denominator(decimal_reaction_coefficients)
-        direction = modelseed_reaction_data['direction']
-        if pd.isna(direction):
+        # Check that genome contigs databases were annotated with KOs before building the pan
+        # database. Unlike in contigs super, the initialization of functions by a method of pan
+        # super does not allow specification of particular functional annotation sources, with
+        # concomitant checks for their existence.
+        gs_info = dbinfo.GenomeStorageDBInfo(genomes_storage_db)
+        gs_sources: str = gs_info.get_self_table()['gene_function_sources']
+        if 'KOfam' not in [source.strip() for source in gs_sources.split(',')]:
             raise ConfigError(
-                "The row for the reaction in the ModelSEED table was expected to have a 'direction' value. "
-                f"Here is the data in the row: '{modelseed_reaction_data}'"
+                "The genomes of the pangenome were not annotated with KOs, which can be rectified by "
+                "running `anvi-run-kegg-kofams` on the genome contigs databases and remaking the pangenome."
             )
-        if (direction == '>' and reversibility == '<') or (direction == '<' and reversibility == '>'):
-            # The way the reaction is written is the opposite of the way the reaction proceeds.
-            reaction_coefficients = [-c for c in reaction_coefficients]
-        reaction.coefficients = tuple(reaction_coefficients)
-
-        return reaction, modelseed_compound_ids
-
-    def _to_lcm_denominator(self, floats: List[float]) -> Tuple[int]:
-        """
-        Convert a list of numbers to their lowest common integer multiples.
+        pan_super.init_gene_clusters()
+        pan_super.init_gene_clusters_functions()
+        pan_super.init_gene_clusters_functions_summary_dict()
 
-        Parameters
-        ==========
-        floats : List[float]
+        self.progress.new("Building reaction network")
+        self.progress.update("Loading reference databases")
 
-        Returns
-        =======
-        List[int]
-        """
-        def lcm(a, b):
-            return a * b // math.gcd(a, b)
-        rationals = [fractions.Fraction(f).limit_denominator() for f in floats]
-        lcm_denom = functools.reduce(lcm, [r.denominator for r in rationals])
-        return list(int(r.numerator * lcm_denom / r.denominator) for r in rationals)
+        # Load the required orthology reference databases set up by anvi'o.
+        ko_db = KODatabase(self.ko_dir)
+        modelseed_db = ModelSEEDDatabase(self.modelseed_dir)
 
-    def _get_modelseed_compound(self, modelseed_compound_data: Dict) -> ModelSEEDCompound:
-        """
-        Generate a ModelSEED compound object from its entry in the ModelSEED table.
+        network = PangenomicNetwork()
 
-        Parameters
-        ==========
-        modelseed_compound_data : Dict
-            A dictionary representation of a row for a compound in the ModelSEED compound table set
-            up by anvi'o.
+        modelseed_kegg_reactions_table = modelseed_db.kegg_reactions_table
+        modelseed_ec_reactions_table = modelseed_db.ec_reactions_table
+        modelseed_compounds_table = modelseed_db.compounds_table
 
-        Returns
-        =======
-        ModelSEEDCompound
-            An object representation of the ModelSEED compound.
-        """
-        compound = ModelSEEDCompound()
-        compound.modelseed_id = modelseed_compound_data['id']
+        # List KOs that annotated gene clusters in the pan database but for some reason are not
+        # found in the KO database.
+        undefined_ko_ids = []
 
-        modelseed_name = modelseed_compound_data['name']
-        if pd.isna(modelseed_name):
-            compound.modelseed_name = None
-        else:
-            compound.modelseed_name = modelseed_name
+        # Parse gene clusters.
+        gene_clusters_functions_summary_dict: Dict = pan_super.gene_clusters_functions_summary_dict
+        total_gene_clusters = len(pan_super.gene_clusters)
+        num_gene_clusters_parsed = -1
+        for gene_cluster_id, gene_cluster_functions_data in gene_clusters_functions_summary_dict.items():
+            num_gene_clusters_parsed += 1
+            self.progress.update(f"Gene clusters parsed: {num_gene_clusters_parsed} / {total_gene_clusters}")
+            # Retrieve the consensus KO across genes in the cluster. Parameterization of the method
+            # used to select consensus KOs occurred in pan super initialization.
+            gene_cluster_ko_data = gene_cluster_functions_data['KOfam']
+            if gene_cluster_ko_data == {'function': None, 'accession': None}:
+                # No KO was assigned to the cluster.
+                continue
+            ko_id = gene_cluster_ko_data['accession']
 
-        kegg_aliases: str = modelseed_compound_data['KEGG']
-        if pd.isna(kegg_aliases):
-            compound.kegg_aliases = tuple()
-        else:
-            compound.kegg_aliases = tuple(kegg_aliases.split('; '))
+            gene_cluster = GeneCluster()
+            gene_cluster.gene_cluster_id = gene_cluster_id
+            # Add the gene cluster to the network, regardless of whether it yields reactions. Gene
+            # clusters not contributing to the reaction network are removed later.
+            network.gene_clusters[gene_cluster_id] = gene_cluster
 
-        formula = modelseed_compound_data['formula']
-        if pd.isna(formula):
-            compound.formula = None
-            # compounds without formulas have a nominal charge of 10000000 in compounds.tsv
-            compound.charge = None
-        else:
-            compound.formula = formula
-            charge = modelseed_compound_data['charge']
-            if pd.isna(charge):
-                raise ConfigError(
-                    f"The charge of a ModelSEED compound, '{compound.modelseed_id}', was not recorded "
-                    "in 'compounds.tsv' but is expected to be present as an integer. Here is the data "
-                    f"in the row for the compound: '{modelseed_compound_data}'"
-                )
-            compound.charge = charge
+            if ko_id in network.kos:
+                # The KO was assigned to another gene cluster that was already processed and added
+                # to the network. Objects representing ModelSEED reactions and metabolites and other
+                # data associated with the KO were added to the network in addition to a KO object.
+                gene_cluster.ko = network.kos[ko_id]
+                continue
+            ko = KO()
+            ko.id = ko_id
+            ko.name = gene_cluster_ko_data['function']
+            gene_cluster.ko = ko
+            # Add the newly encountered KO to the network, regardless of whether it yields
+            # reactions. KOs not contributing to the network are removed later.
+            network.kos[ko_id] = ko
 
-        return compound
+            # Find KEGG reactions and EC numbers associated with the newly encountered KO.
+            try:
+                ko_info = ko_db.ko_table.loc[ko.id]
+            except KeyError:
+                undefined_ko_ids.append(ko_id)
+                continue
+            ko_kegg_reaction_info: str = ko_info.loc['reactions']
+            if pd.isna(ko_kegg_reaction_info):
+                # The KO is not associated with KEGG reactions.
+                ko_kegg_reaction_ids = []
+            else:
+                ko_kegg_reaction_ids = ko_kegg_reaction_info.split()
+            ko_ec_number_info: str = ko_info.loc['ec_numbers']
+            if pd.isna(ko_ec_number_info):
+                # The KO is not associated with EC numbers.
+                ko_ec_numbers = []
+            else:
+                ko_ec_numbers = ko_ec_number_info.split()
 
-    def _store_contigs_database_reactions(self, network: GenomicNetwork, contigs_db: str) -> None:
-        """
-        Store reaction data in the relevant contigs database table.
+            if not (ko_kegg_reaction_ids or ko_ec_numbers):
+                # The KO is not associated with any KEGG reactions or EC numbers, and thereby cannot
+                # be associated with ModelSEED reactions.
+                continue
 
-        Parameters
-        ==========
-        network : GenomicNetwork
-            The reaction network generated from gene KO annotations in the contigs database.
+            new_kegg_reaction_ids = self._parse_ko_kegg_reaction_ids(network, ko, ko_kegg_reaction_ids, ko_ec_numbers)
+            new_ec_numbers = self._parse_ko_ec_numbers(network, ko, ko_ec_numbers, ko_kegg_reaction_ids)
+            if not (new_kegg_reaction_ids or new_ec_numbers):
+                # All of the KEGG reactions and EC numbers associated with the KO have already been
+                # encountered in previously processed KOs and added to the network, so proceed to
+                # the next gene cluster.
+                continue
+            modelseed_reactions_data = self._get_modelseed_reactions_data(network, new_kegg_reaction_ids, new_ec_numbers, modelseed_kegg_reactions_table, modelseed_ec_reactions_table)
+            if not modelseed_reactions_data:
+                # The newly encountered KEGG REACTION IDs and EC numbers do not map to ModelSEED
+                # reactions (are not in the ModelSEED table).
+                continue
+
+            # Process the ModelSEED reactions aliased by newly encountered KEGG reactions and EC numbers.
+            for modelseed_reaction_id, modelseed_reaction_data in modelseed_reactions_data.items():
+                if modelseed_reaction_id in network.reactions:
+                    # The ModelSEED reaction is aliased by previously encountered KEGG reactions and
+                    # EC numbers, and so has already been added to the network.
+                    continue
+                # Make a new reaction object for the ModelSEED ID. This object does not yet have
+                # metabolite objects (for the ModelSEED compound IDs) added to it.
+                reaction, modelseed_compound_ids = self._get_modelseed_reaction(modelseed_reaction_data)
+                if reaction is None:
+                    # For some reason, the reaction does not have an equation in the ModelSEED
+                    # database. Associations between such reactions without equations and sourcing
+                    # KEGG reactions and EC numbers are later removed from the network attributes,
+                    # 'kegg_modelseed_aliases', 'ec_number_modelseed_aliases',
+                    # 'modelseed_kegg_aliases', and 'modelseed_ec_number_aliases'.
+                    continue
+                self._add_modelseed_reaction(network, ko, reaction, new_kegg_reaction_ids, new_ec_numbers, modelseed_compound_ids, modelseed_compounds_table)
+
+        # List gene clusters and KOs that do not contribute to the reaction network. Remove any
+        # trace of these gene clusters and KOs from the network.
+        unnetworked_gene_cluster_ids = []
+        unnetworked_ko_ids = []
+        for gene_cluster_id, gene_cluster in network.gene_clusters.items():
+            ko = gene_cluster.ko
+            if ko.reactions:
+                break
+            unnetworked_gene_cluster_ids.append(gene_cluster_id)
+            unnetworked_ko_ids.append(ko.id)
+        for gene_cluster_id in unnetworked_gene_cluster_ids:
+            network.gene_clusters.pop(gene_cluster_id)
+        for ko_id in unnetworked_ko_ids:
+            network.kos.pop(ko_id)
+
+        # List KO KEGG reactions that do not map to ModelSEED reactions. Remove any trace of these
+        # KEGG reactions from the network.
+        unnetworked_kegg_reaction_ids = []
+        for kegg_reaction_id, modelseed_reaction_ids in network.kegg_modelseed_aliases.items():
+            if not modelseed_reaction_ids:
+                unnetworked_kegg_reaction_ids.append(kegg_reaction_id)
+        for kegg_reaction_id in unnetworked_kegg_reaction_ids:
+            network.kegg_modelseed_aliases.pop(kegg_reaction_id)
+
+        # List KO EC numbers that do not map to ModelSEED reactions. Remove any trace of these EC
+        # numbers from the network.
+        unnetworked_ec_numbers = []
+        for ec_number, modelseed_reaction_ids in network.ec_number_modelseed_aliases.items():
+            if not modelseed_reaction_ids:
+                unnetworked_ec_numbers.append(ec_number)
+        for ec_number in unnetworked_ec_numbers:
+            network.ec_number_modelseed_aliases.pop(ec_number)
+
+        # List aliased ModelSEED reactions that did not yield a ModelSEEDReaction object due to the
+        # lack of an equation for the reaction in the ModelSEED database. Remove any trace of these
+        # reactions from the network.
+        undefined_modelseed_reaction_ids = list(
+            set(network.modelseed_kegg_aliases).difference(set(network.reactions))
+        )
+        for modelseed_reaction_id in undefined_modelseed_reaction_ids:
+            network.modelseed_kegg_aliases.pop(modelseed_reaction_id)
+            network.modelseed_ec_number_aliases.pop(modelseed_reaction_id)
+        self.progress.end()
+
+        if DEBUG:
+            self.run.info_single(
+                "The following ModelSEED reactions would have been added to the reaction network "
+                "had there been a chemical equation in the ModelSEED database; perhaps it is worth "
+                "investigating the ModelSEED reactions table to understand why this is not the case: "
+                f"{', '.join(undefined_modelseed_reaction_ids)}"
+            )
+
+        if undefined_ko_ids:
+            self.run.info_single(
+                "Certain gene clusters were assigned consensus KOs that were not found in the KO "
+                "database. It could be that the KOfams used to annotate gene clusters were not from "
+                "the same KEGG database version as the KO files. Here are the unrecognized KO IDs "
+                f"from the pan database: {', '.join(undefined_ko_ids)}"
+            )
+
+        ko_dir = KODatabase.default_dir if self.ko_dir is None else self.ko_dir
+        modelseed_dir = ModelSEEDDatabase.default_dir if self.modelseed_dir is None else self.modelseed_dir
+        self.run.info("Reference KEGG KO database directory", ko_dir, nl_before=1)
+        self.run.info("Reference ModelSEED database directory", modelseed_dir)
+
+        if store:
+            if pan_super.p_meta['reaction_network_ko_annotations_hash']:
+                self.run.warning("Deleting existing reaction network from pan database")
+                pdb = PanDatabase(pan_db)
+                pdb.db._exec(f'''DELETE from {tables.pan_gene_cluster_function_reactions_table_name}''')
+                pdb.db._exec(f'''DELETE from {tables.pan_gene_cluster_function_metabolites_table_name}''')
+                pdb.disconnect()
+                self.run.info_single("Deleted data in gene cluster function reactions and metabolites tables", nl_after=1)
+
+            self.progress.new("Saving reaction network to pan database")
+            self.progress.update("Reactions table")
+            reactions_table = self._get_database_reactions_table(network)
+            pdb = PanDatabase(pan_db)
+            pdb.db._exec_many(
+                f'''INSERT INTO {tables.pan_gene_cluster_function_reactions_table_name} VALUES ({','.join('?' * len(tables.pan_gene_cluster_function_reactions_table_structure))})''',
+                reactions_table.values
+            )
+            pdb.disconnect()
+            self.progress.update("Metabolites table")
+            metabolites_table = self._get_database_metabolites_table(network)
+            pdb = PanDatabase(pan_db)
+            pdb.db._exec_many(
+                f'''INSERT INTO {tables.pan_gene_cluster_function_metabolites_table_name} VALUES ({','.join('?' * len(tables.gene_function_metabolites_table_structure))})''',
+                metabolites_table.values
+            )
+            pdb.disconnect()
+
+            self.progress.update("Metadata")
+            ko_annotations_hash = self.hash_pan_db_ko_annotations(genomes_storage_db, gene_clusters_functions_summary_dict, consensus_threshold=consensus_threshold, discard_ties=discard_ties)
+            pdb = PanDatabase(pan_db)
+            pdb.db.set_meta_value('reaction_network_ko_annotations_hash', ko_annotations_hash)
+            pdb.db.set_meta_value('reaction_network_kegg_database_release', ko_db.release)
+            pdb.db.set_meta_value('reaction_network_modelseed_database_sha', modelseed_db.sha)
+            pdb.db.set_meta_value('reaction_network_consensus_threshold', consensus_threshold)
+            pdb.db.set_meta_value('reaction_network_discard_ties', int(discard_ties))
+            pdb.disconnect()
+            self.progress.end()
+
+        stats = {}
+        self.run.info_single("METABOLIC REACTION NETWORK STATISTICS", mc='green', nl_after=1)
+
+        self.progress.new("Counting gene clusters and KOs")
+        self.progress.update("...")
+
+        pdb = PanDatabase(pan_db)
+        stats['Total gene clusters in pangenome'] = gene_cluster_count = pdb.meta['num_gene_clusters']
+        pdb.disconnect()
+        stats['Genes clusters assigned protein KOs'] = ko_annotated_gene_cluster_count = len(network.gene_clusters) + len(unnetworked_gene_cluster_ids)
+        stats['Gene clusters in network'] = networked_gene_cluster_count = len(network.gene_clusters)
+        stats['Protein KOs assigned to gene clusters'] = annotating_ko_count = len(network.kos) + len(unnetworked_ko_ids)
+        stats['KOs in network'] = networked_ko_count = len(network.kos)
+        self.progress.end()
+
+        self.run.info_single("Gene clusters and KEGG Ortholog (KO) annotations")
+        self.run.info("Total gene clusters in pangenome", gene_cluster_count)
+        self.run.info("Gene clusters annotated with protein KOs", ko_annotated_gene_cluster_count)
+        self.run.info("Gene clusters in network", networked_gene_cluster_count)
+        self.run.info("Protein KOs annotating gene clusters", annotating_ko_count)
+        self.run.info("KOs in network", networked_ko_count, nl_after=1)
+
+        self.progress.new("Counting reactions and KO sources")
+        self.progress.update("...")
+        # This group of network statistics is found the same way for both a pan and contigs database.
+
+        stats['Reactions in network'] = reaction_count = len(network.reactions)
+        reaction_counts = []
+        for ko in network.kos.values():
+            reaction_counts.append(len(ko.reactions))
+        stats['Mean reactions per KO'] = mean_reactions_per_ko = round(np.mean(reaction_counts), 1)
+        stats['Stdev reactions per KO'] = std_reactions_per_ko = round(np.std(reaction_counts), 1)
+        stats['Max reactions per KO'] = max_reactions_per_ko = max(reaction_counts)
+        self.progress.end()
+
+        self.run.info_single("ModelSEED reactions in network and KO sources")
+        self.run.info("Reactions in network", reaction_count)
+        self.run.info("Mean reactions per KO", mean_reactions_per_ko)
+        self.run.info("Stdev reactions per KO", std_reactions_per_ko)
+        self.run.info("Max reactions per KO", max_reactions_per_ko, nl_after=1)
+
+        self.progress.new("Counting reactions from each alias source")
+        self.progress.update("...")
+        # This group of network statistics is found the same way for both a pan and contigs database.
+
+        kegg_reaction_source_count = 0
+        ec_number_source_count = 0
+        both_source_count = 0
+        for modelseed_reaction_id, kegg_reaction_ids in network.modelseed_kegg_aliases.items():
+            ec_numbers = network.modelseed_ec_number_aliases[modelseed_reaction_id]
+            if kegg_reaction_ids:
+                kegg_reaction_source_count += 1
+            if ec_numbers:
+                ec_number_source_count += 1
+            if kegg_reaction_ids and ec_numbers:
+                both_source_count += 1
+        stats['Reactions aliased by KEGG reaction'] = kegg_reaction_source_count
+        stats['Reactions aliased by EC number'] = ec_number_source_count
+        stats['Rxns aliased by both KEGG rxn & EC number'] = both_source_count
+        stats['Reactions aliased only by KEGG reaction'] = only_kegg_reaction_source_count = kegg_reaction_source_count - both_source_count
+        stats['Reactions aliased only by EC number'] = only_ec_number_source_count = ec_number_source_count - both_source_count
+
+        stats['KEGG reactions contributing to network'] = kegg_reaction_count = len(network.kegg_modelseed_aliases)
+        reaction_counts = []
+        for kegg_reaction_id, modelseed_reaction_ids in network.kegg_modelseed_aliases.items():
+            reaction_counts.append(len(modelseed_reaction_ids))
+        stats['Mean reactions per KEGG reaction'] = mean_reactions_per_kegg_reaction = round(np.mean(reaction_counts), 1)
+        stats['Stdev reactions per KEGG reaction'] = std_reactions_per_kegg_reaction = round(np.std(reaction_counts), 1)
+        stats['Max reactions per KEGG reaction'] = max_reactions_per_kegg_reaction = max(reaction_counts)
+
+        stats['EC numbers contributing to network'] = ec_number_count = len(network.ec_number_modelseed_aliases)
+        reaction_counts = []
+        for ec_number, modelseed_reaction_ids in network.ec_number_modelseed_aliases.items():
+            reaction_counts.append(len(modelseed_reaction_ids))
+        stats['Mean reactions per EC number'] = mean_reactions_per_ec_number = round(np.mean(reaction_counts), 1)
+        stats['Stdev reactions per EC number'] = std_reactions_per_ec_number = round(np.std(reaction_counts), 1)
+        stats['Max reactions per EC number'] = max_reactions_per_ec_number = max(reaction_counts)
+        self.progress.end()
+
+        self.run.info_single("Reaction alias source comparison")
+        self.run.info("Reactions aliased by KEGG reaction", kegg_reaction_source_count)
+        self.run.info("Reactions aliased by EC number", ec_number_source_count)
+        self.run.info("Rxns aliased by both KEGG rxn & EC number", both_source_count)
+        self.run.info("Reactions aliased only by KEGG reaction", only_kegg_reaction_source_count)
+        self.run.info("Reactions aliased only by EC number", only_ec_number_source_count)
+        self.run.info("KEGG reactions contributing to network", kegg_reaction_count)
+        self.run.info("Mean reactions per KEGG reaction", mean_reactions_per_kegg_reaction)
+        self.run.info("Stdev reactions per KEGG reaction", std_reactions_per_kegg_reaction)
+        self.run.info("Max reactions per KEGG reaction", max_reactions_per_kegg_reaction)
+        self.run.info("EC numbers contributing to network", ec_number_count)
+        self.run.info("Mean reactions per EC number", mean_reactions_per_ec_number)
+        self.run.info("Stdev reactions per EC number", std_reactions_per_ec_number)
+        self.run.info("Max reactions per EC number", max_reactions_per_ec_number, nl_after=1)
+
+        self.progress.new("Counting reactions and metabolites by property")
+        self.progress.update("...")
+        # This group of network statistics is found the same way for both pan and contigs databases.
+
+        reversible_count = 0
+        irreversible_count = 0
+        cytoplasmic_compound_ids = []
+        extracellular_compound_ids = []
+        consumed_compound_ids = []
+        produced_compound_ids = []
+        compound_reaction_counts = {}
+        for reaction in network.reactions.values():
+            if reaction.reversibility:
+                reversible_count += 1
+            else:
+                irreversible_count += 1
+            encountered_compound_ids = []
+            for compartment, coefficient, compound in zip(reaction.compartments, reaction.coefficients, reaction.compounds):
+                compound_id = compound.modelseed_id
+                if compartment == 'c':
+                    cytoplasmic_compound_ids.append(compound_id)
+                else:
+                    extracellular_compound_ids.append(compound_id)
+                if reaction.reversibility:
+                    consumed_compound_ids.append(compound_id)
+                    produced_compound_ids.append(compound_id)
+                elif coefficient < 0:
+                    consumed_compound_ids.append(compound_id)
+                else:
+                    produced_compound_ids.append(compound_id)
+                if compound_id not in encountered_compound_ids:
+                    try:
+                        compound_reaction_counts[compound_id] += 1
+                    except KeyError:
+                        compound_reaction_counts[compound_id] = 1
+        stats['Reversible reactions'] = reversible_count
+        stats['Irreversible reactions'] = irreversible_count
+        cytoplasmic_compound_ids = set(cytoplasmic_compound_ids)
+        extracellular_compound_ids = set(extracellular_compound_ids)
+        stats['Metabolites in network'] = metabolite_count = len(network.metabolites)
+        stats['Cytoplasmic metabolites'] = cytoplasmic_count = len(cytoplasmic_compound_ids)
+        stats['Extracellular metabolites'] = extracellular_count = len(extracellular_compound_ids)
+        stats['Exclusively cytoplasmic metabolites'] = exclusively_cytoplasmic_count = len(cytoplasmic_compound_ids.difference(extracellular_compound_ids))
+        stats['Exclusively extracellular metabolites'] = exclusively_extracellular_count = len(extracellular_compound_ids.difference(cytoplasmic_compound_ids))
+        stats['Cytoplasmic/extracellular metabolites'] = cytoplasmic_plus_extracellular_count = len(cytoplasmic_compound_ids.intersection(extracellular_compound_ids))
+        consumed_compound_ids = set(consumed_compound_ids)
+        produced_compound_ids = set(produced_compound_ids)
+        stats['Consumed metabolites'] = consumed_count = len(consumed_compound_ids)
+        stats['Produced metabolites'] = produced_count = len(produced_compound_ids)
+        stats['Both consumed & produced metabolites'] = consumed_plus_produced_count = len(consumed_compound_ids.intersection(produced_compound_ids))
+        stats['Exclusively consumed metabolites'] = exclusively_consumed_count = len(consumed_compound_ids.difference(produced_compound_ids))
+        stats['Exclusively produced metabolites'] = exclusively_produced_count = len(produced_compound_ids.difference(consumed_compound_ids))
+        metabolite_reaction_counts = collections.Counter(compound_reaction_counts.values())
+        stats['Metabolites consumed or produced by 1 rxns'] = one_reaction_count = metabolite_reaction_counts[1]
+        stats['Metabolites consumed or produced by 2 rxns'] = two_reactions_count = metabolite_reaction_counts[2]
+        stats['Metabolites consumed or produced by 3+ rxns'] = three_plus_reactions_count = metabolite_count - one_reaction_count - two_reactions_count
+        self.progress.end()
+
+        self.run.info_single("Reaction reversibility")
+        self.run.info("Reversible reactions", reversible_count)
+        self.run.info("Irreversible reactions", irreversible_count, nl_after=1)
+
+        self.run.info_single("Metabolites and localization")
+        self.run.info("Metabolites in network", metabolite_count)
+        self.run.info("Cytoplasmic metabolites", cytoplasmic_count)
+        self.run.info("Extracellular metabolites", extracellular_count)
+        self.run.info("Exclusively cytoplasmic metabolites", exclusively_cytoplasmic_count)
+        self.run.info("Exclusively extracellular metabolites", exclusively_extracellular_count)
+        self.run.info("Cytoplasmic/extracellular metabolites", cytoplasmic_plus_extracellular_count, nl_after=1)
+
+        self.run.info_single("Metabolite consumption and production")
+        self.run.info("Consumed metabolites", consumed_count)
+        self.run.info("Produced metabolites", produced_count)
+        self.run.info("Both consumed & produced metabolites", consumed_plus_produced_count)
+        self.run.info("Exclusively consumed metabolites", exclusively_consumed_count)
+        self.run.info("Exclusively produced metabolites", exclusively_produced_count)
+        self.run.info("Metabolites consumed or produced by 1 rxn", one_reaction_count)
+        self.run.info("Metabolites consumed or produced by 2 rxns", two_reactions_count)
+        self.run.info("Metabolites consumed or produced by 3+ rxns", three_plus_reactions_count)
+
+        return network
+
+    def _parse_ko_kegg_reaction_ids(
+        self,
+        network: ReactionNetwork,
+        ko: KO,
+        ko_kegg_reaction_ids: List[str],
+        ko_ec_numbers: List[str]
+    ) -> List[str]:
+        """
+        Parse KEGG reactions associated with a KO in the process of building a reaction network.
+
+        Report KEGG REACTION IDs that have not been encountered in association with previously
+        processed KOs. Record the existence of these KEGG reactions in the reaction network object.
+        For previously encountered KEGG reactions, retrieve data on aliased ModelSEED reactions and
+        record that data in the KO object.
+
+        Parameters
+        ==========
+        network : ReactionNetwork
+            The reaction network object being built
+
+        ko : KO
+            The representation of the KO being processed
+
+        ko_kegg_reaction_ids : list
+            KEGG REACTION IDs associated with the KO
+
+        ko_ec_numbers : list
+            EC numbers associated with the KO
+
+        Returns
+        =======
+        list
+            Newly encountered KEGG REACTION IDs not associated with previously processed KOs
+        """
+        # If a KEGG reaction has already been encountered, then aliased ModelSEED reactions have
+        # also been processed and added as ModelSEEDReaction objects to the network. Therefore, KEGG
+        # reactions that have already been encountered are treated differently than KEGG reactions
+        # encountered for the first time.
+        new_kegg_reaction_ids = []
+        for kegg_reaction_id in ko_kegg_reaction_ids:
+            try:
+                # The KEGG reaction has already been encountered. Retrieve ModelSEED reactions
+                # aliased by the KEGG reaction.
+                modelseed_reaction_ids = network.kegg_modelseed_aliases[kegg_reaction_id]
+            except KeyError:
+                new_kegg_reaction_ids.append(kegg_reaction_id)
+                # The following list of ModelSEED reaction IDs associated with the KEGG reaction
+                # is filled in later. If no ModelSEED reactions are associated with the KEGG
+                # reaction, the entry in the dictionary will be removed.
+                network.kegg_modelseed_aliases[kegg_reaction_id] = []
+                continue
+            for modelseed_reaction_id in modelseed_reaction_ids:
+                try:
+                    # Retrieve the existing ModelSEEDReaction object.
+                    reaction = network.reactions[modelseed_reaction_id]
+                except KeyError:
+                    # The ModelSEED reaction associated with the KEGG reaction did not have valid
+                    # data: for example, when the 'stoichiometry' field is empty.
+                    continue
+                # Associate the ModelSEED reaction with the newly encountered KO.
+                ko.reactions[modelseed_reaction_id] = reaction
+                # Record which KEGG REACTION IDs and EC numbers from the KO yield the ModelSEED reaction.
+                ko.kegg_reaction_aliases[modelseed_reaction_id] = list(
+                    set(ko_kegg_reaction_ids).intersection(set(reaction.kegg_aliases))
+                )
+                ko.ec_number_aliases[modelseed_reaction_id] = list(
+                    set(ko_ec_numbers).intersection(set(reaction.ec_number_aliases))
+                )
+        return new_kegg_reaction_ids
+
+    def _parse_ko_ec_numbers(
+        self,
+        network: ReactionNetwork,
+        ko: KO,
+        ko_ec_numbers: List[str],
+        ko_kegg_reaction_ids: List[str]
+    ) -> List[str]:
+        """
+        Parse EC numbers associated with a KO in the process of building a reaction network.
+
+        Report EC numbers that have not been encountered in association with previously processed
+        KOs. Record the existence of these EC numbers in the reaction network object. For previously
+        encountered EC numbers, retrieve data on aliased ModelSEED reactions and record that data in
+        the KO object.
+
+        Parameters
+        ==========
+        network : ReactionNetwork
+            The reaction network object being built
+
+        ko : KO
+            The representation of the KO being processed
+
+        ko_ec_numbers : list
+            EC numbers associated with the KO
+
+        ko_kegg_reaction_ids : list
+            KEGG REACTION IDs associated with the KO
+
+        Returns
+        =======
+        list
+            Newly encountered EC numbers not associated with previously processed KOs
+        """
+        # As before with KEGG reactions, if an EC number has already been encountered, then aliased
+        # ModelSEED reactions have also been processed and added as ModelSEEDReaction objects to the
+        # network. Therefore, EC numbers that have already been encountered are treated differently
+        # than EC numbers encountered for the first time.
+        new_ec_numbers = []
+        for ec_number in ko_ec_numbers:
+            try:
+                # The EC number has already been encountered. Retrieve ModelSEED reactions
+                # aliased by the EC number.
+                modelseed_reaction_ids = network.ec_number_modelseed_aliases[ec_number]
+            except KeyError:
+                new_ec_numbers.append(ec_number)
+                # The following list of ModelSEED reaction IDs associated with the EC number is
+                # filled in later. If no ModelSEED reactions are associated with the EC number,
+                # the entry in the dictionary will be removed.
+                network.ec_number_modelseed_aliases[ec_number] = []
+                continue
+            for modelseed_reaction_id in modelseed_reaction_ids:
+                try:
+                    # Retrieve the existing ModelSEEDReaction object.
+                    reaction = network.reactions[modelseed_reaction_id]
+                except KeyError:
+                    # The ModelSEED reaction associated with the EC number did not have valid
+                    # data: for example, when the 'stoichiometry' field is empty.
+                    continue
+                if modelseed_reaction_id in ko.reactions:
+                    # The ModelSEED reaction was already linked to this KO, e.g., via a KEGG
+                    # reaction of the KO that aliases the same ModelSEED reaction. The KO's
+                    # KEGG reaction and EC number aliases were recorded then, so redundant
+                    # work can be avoided here.
+                    continue
+                ko.reactions[modelseed_reaction_id] = reaction
+                ko.kegg_reaction_aliases[modelseed_reaction_id] = list(
+                    set(ko_kegg_reaction_ids).intersection(set(reaction.kegg_aliases))
+                )
+                ko.ec_number_aliases[modelseed_reaction_id] = list(
+                    set(ko_ec_numbers).intersection(set(reaction.ec_number_aliases))
+                )
+        return new_ec_numbers
 
-        contigs_db : str
-            The path to the contigs database from which the reaction network was generated.
+    def _get_modelseed_reactions_data(
+        self,
+        network: ReactionNetwork,
+        new_kegg_reaction_ids: List[str],
+        new_ec_numbers: List[str],
+        modelseed_kegg_reactions_table: pd.DataFrame,
+        modelseed_ec_reactions_table: pd.DataFrame
+    ) -> Dict:
+        """
+        Get data on ModelSEED reactions aliased by newly encountered KEGG REACTION IDs and EC numbers.
+
+        Parameters
+        ==========
+        network : ReactionNetwork
+            The reaction network object being built
+
+        new_kegg_reaction_ids : list
+            Newly encountered KEGG REACTION IDs not associated with previously processed KOs
+
+        new_ec_numbers : list
+            Newly encountered EC numbers not associated with previously processed KOs
+
+        modelseed_kegg_reactions_table : pd.DataFrame
+            Loaded ModelSEED Biochemistry reactions database structured by KEGG REACTION ID
+
+        modelseed_ec_reactions_table : pd.DataFrame
+            Loaded ModelSEED Biochemistry reactions database structured by EC number
+
+        Returns
+        =======
+        dict
+            Data on ModelSEED reactions from the ModelSEED tables, keyed by ModelSEED reaction ID
+        """
+        modelseed_reactions_data = {}
+        if new_kegg_reaction_ids:
+            # Each row of the table represents a unique KEGG reaction -> ModelSEED reaction mapping.
+            modelseed_kegg_reactions_dict: Dict[str, Dict] = modelseed_kegg_reactions_table[
+                modelseed_kegg_reactions_table['KEGG_REACTION_ID'].isin(new_kegg_reaction_ids)
+            ].to_dict(orient='index')
+            for modelseed_reaction_data in modelseed_kegg_reactions_dict.values():
+                kegg_reaction_id = modelseed_reaction_data['KEGG_REACTION_ID']
+                modelseed_reaction_id = modelseed_reaction_data['id']
+                # Record the association between the KEGG reaction and ModelSEED reaction in the
+                # network, and vice versa.
+                network.kegg_modelseed_aliases[kegg_reaction_id].append(modelseed_reaction_id)
+                try:
+                    network.modelseed_kegg_aliases[modelseed_reaction_id].append(kegg_reaction_id)
+                except KeyError:
+                    # This is the first time the ModelSEED reaction has been encountered.
+                    network.modelseed_kegg_aliases[modelseed_reaction_id] = [kegg_reaction_id]
+                    network.modelseed_ec_number_aliases[modelseed_reaction_id] = []
+                if modelseed_reaction_id in modelseed_reactions_data:
+                    # One of the other newly encountered KEGG reactions also mapped to this
+                    # ModelSEED reaction, so do not record redundant ModelSEED reaction data.
+                    continue
+                modelseed_reactions_data[modelseed_reaction_id] = modelseed_reaction_data
+        if new_ec_numbers:
+            # Each row of the table represents a unique EC number -> ModelSEED reaction mapping.
+            modelseed_ec_reactions_dict: Dict[str, Dict] = modelseed_ec_reactions_table[
+                modelseed_ec_reactions_table['EC_number'].isin(new_ec_numbers)
+            ].to_dict(orient='index')
+            for modelseed_reaction_data in modelseed_ec_reactions_dict.values():
+                ec_number = modelseed_reaction_data['EC_number']
+                modelseed_reaction_id = modelseed_reaction_data['id']
+                # Record the association between the EC number and ModelSEED reaction in the
+                # network, and vice versa.
+                network.ec_number_modelseed_aliases[ec_number].append(modelseed_reaction_id)
+                try:
+                    network.modelseed_ec_number_aliases[modelseed_reaction_id].append(ec_number)
+                except KeyError:
+                    # This is the first time the ModelSEED reaction has been encountered.
+                    network.modelseed_ec_number_aliases[modelseed_reaction_id] = [ec_number]
+                    network.modelseed_kegg_aliases[modelseed_reaction_id] = []
+                if modelseed_reaction_id in modelseed_reactions_data:
+                    # One of the other newly encountered KEGG reactions or EC numbers also
+                    # mapped to this ModelSEED reaction, so do not record redundant ModelSEED reaction data.
+                    continue
+                modelseed_reactions_data[modelseed_reaction_id] = modelseed_reaction_data
+        return modelseed_reactions_data
+
+    def _add_modelseed_reaction(
+        self,
+        network: ReactionNetwork,
+        ko: KO,
+        reaction: ModelSEEDReaction,
+        new_kegg_reaction_ids: List[str],
+        new_ec_numbers: List[str],
+        modelseed_compound_ids: List[str],
+        modelseed_compounds_table: pd.DataFrame
+    ) -> None:
+        """
+        Add an object representing the ModelSEED reaction and objects representing associated
+        ModelSEED compounds to the reaction network.
+
+        Parameters
+        ==========
+        network : ReactionNetwork
+            The reaction network object being built
+
+        ko : KO
+            The representation of the KO being processed
+
+        reaction : ModelSEEDReaction
+            The representation of the reaction with data sourced from ModelSEED Biochemistry
+
+        new_kegg_reaction_ids : list
+            Newly encountered KEGG REACTION IDs not associated with previously processed KOs
+
+        new_ec_numbers : list
+            Newly encountered EC numbers not associated with previously processed KOs
+
+        modelseed_compound_ids : list
+            ModelSEED compound IDs of the reaction's reactants and products, in stoichiometric order
+
+        modelseed_compounds_table : pd.DataFrame
+            Loaded ModelSEED Biochemistry compounds database
+
+        Returns
+        =======
+        None
+        """
+        modelseed_reaction_id = reaction.modelseed_id
+        ko.reactions[modelseed_reaction_id] = reaction
+        # Record which KEGG REACTION IDs and EC numbers from the KO yield the ModelSEED reaction.
+        ko.kegg_reaction_aliases[modelseed_reaction_id] = list(
+            set(new_kegg_reaction_ids).intersection(set(reaction.kegg_aliases))
+        )
+        ko.ec_number_aliases[modelseed_reaction_id] = list(
+            set(new_ec_numbers).intersection(set(reaction.ec_number_aliases))
+        )
+        network.reactions[modelseed_reaction_id] = reaction
+
+        # Collect compound objects in the order of `modelseed_compound_ids`, which is assumed to
+        # match the order of the reaction's coefficients and compartments, so that these
+        # sequences stay aligned when they are zipped together.
+        reaction_compounds = []
+        for modelseed_compound_id in modelseed_compound_ids:
+            if modelseed_compound_id in network.metabolites:
+                # The compound has been encountered in a previously processed reaction, or
+                # earlier in this reaction, so reuse its existing ModelSEEDCompound object.
+                reaction_compounds.append(network.metabolites[modelseed_compound_id])
+                continue
+
+            # Generate a new metabolite object in the network.
+            try:
+                modelseed_compound_series: pd.Series = modelseed_compounds_table.loc[modelseed_compound_id]
+            except KeyError:
+                raise ConfigError(
+                    f"A row for the ModelSEED compound ID, '{modelseed_compound_id}', was expected "
+                    "but not found in the ModelSEED compounds table. This ID was found in the equation "
+                    f"for the ModelSEED reaction, '{modelseed_reaction_id}'."
+                )
+            modelseed_compound_data = modelseed_compound_series.to_dict()
+            modelseed_compound_data['id'] = modelseed_compound_id
+            compound = self._get_modelseed_compound(modelseed_compound_data)
+            reaction_compounds.append(compound)
+            network.metabolites[modelseed_compound_id] = compound
+        reaction.compounds = tuple(reaction_compounds)
+
+    def _get_modelseed_reaction(self, modelseed_reaction_data: Dict) -> Tuple[ModelSEEDReaction, List[str]]:
+        """
+        Generate a ModelSEED reaction object and list of associated ModelSEED compound IDs from the
+        ModelSEED reaction table entry. The reaction object is not populated with metabolite objects
+        from the list of associated compound IDs.
+
+        Parameters
+        ==========
+        modelseed_reaction_data : Dict
+            A dictionary representation of a row for a reaction in the ModelSEED reaction table set
+            up by anvi'o.
+
+        Returns
+        =======
+        ModelSEEDReaction
+            An object representation of the ModelSEED reaction, or None if 'stoichiometry' is missing.
+
+        List[str]
+            ModelSEED compound IDs of reactants and products, or None if 'stoichiometry' is missing.
+        """
+        stoichiometry: str = modelseed_reaction_data['stoichiometry']
+        if pd.isna(stoichiometry):
+            # Ignore any reaction lacking a chemical equation: callers must handle (None, None).
+            return None, None
+
+        reaction = ModelSEEDReaction()
+
+        modelseed_id = modelseed_reaction_data['id']
+        if pd.isna(modelseed_id):
+            raise ConfigError(
+                "The row for the reaction in the ModelSEED table does not but should have an ID. "
+                f"Here is the data in the row: '{modelseed_reaction_data}'"
+            )
+        reaction.modelseed_id = modelseed_id
+
+        modelseed_name = modelseed_reaction_data['name']
+        if pd.isna(modelseed_name):
+            reaction.modelseed_name = None
+        else:
+            reaction.modelseed_name = modelseed_name
+
+        kegg_reaction_ids: str = modelseed_reaction_data['KEGG']
+        if pd.isna(kegg_reaction_ids):
+            reaction.kegg_aliases = tuple()
+        else:
+            reaction.kegg_aliases = tuple(kegg_reaction_ids.split('; '))
+
+        ec_numbers: str = modelseed_reaction_data['ec_numbers']
+        if pd.isna(ec_numbers):
+            reaction.ec_number_aliases = []
+        else:
+            reaction.ec_number_aliases = ec_numbers.split('|')
+
+        reversibility = modelseed_reaction_data['reversibility']
+        if pd.isna(reversibility):
+            raise ConfigError(
+                "The row for the reaction in the ModelSEED table was expected to have a 'reversibility' value. "
+                f"Here is the data in the row: '{modelseed_reaction_data}'"
+            )
+        if reversibility == '=' or reversibility == '?':
+            # Assume that reactions lacking data ('?') are reversible.
+            reaction.reversibility = True
+        else:
+            reaction.reversibility = False
+
+        decimal_reaction_coefficients = []
+        split_stoichiometry = stoichiometry.split(';')
+        modelseed_compound_ids = []
+        compartments = []
+        for entry in split_stoichiometry:
+            split_entry = entry.split(':')
+            decimal_reaction_coefficients.append(split_entry[0])
+            modelseed_compound_ids.append(split_entry[1])
+            compartments.append(ModelSEEDDatabase.compartment_ids[int(split_entry[2])])
+        reaction.compartments = tuple(compartments)
+        reaction_coefficients = self._to_lcm_denominator(decimal_reaction_coefficients)
+        direction = modelseed_reaction_data['direction']
+        if pd.isna(direction):
+            raise ConfigError(
+                "The row for the reaction in the ModelSEED table was expected to have a 'direction' value. "
+                f"Here is the data in the row: '{modelseed_reaction_data}'"
+            )
+        if (direction == '>' and reversibility == '<') or (direction == '<' and reversibility == '>'):
+            # The way the reaction is written is the opposite of the way the reaction proceeds.
+            reaction_coefficients = [-c for c in reaction_coefficients]
+        reaction.coefficients = tuple(reaction_coefficients)
+
+        return reaction, modelseed_compound_ids
+
+    def _to_lcm_denominator(self, floats: List[float]) -> List[int]:
+        """
+        Scale numbers by the least common multiple of their rational denominators to get integers.
+
+        Parameters
+        ==========
+        floats : List[float]
+            Numbers, or numeric strings such as '0.5', each accepted by `fractions.Fraction`
+
+        Returns
+        =======
+        List[int]
+            Integers in the same proportions as the input values; an empty list for empty input
+        """
+        rationals = [fractions.Fraction(f).limit_denominator() for f in floats]
+        lcm_denom = functools.reduce(lambda a, b: a * b // math.gcd(a, b), (r.denominator for r in rationals), 1)
+        return [r.numerator * (lcm_denom // r.denominator) for r in rationals]
+
+    def _get_modelseed_compound(self, modelseed_compound_data: Dict) -> ModelSEEDCompound:
+        """
+        Generate a ModelSEED compound object from its entry in the ModelSEED compounds table.
+
+        Parameters
+        ==========
+        modelseed_compound_data : Dict
+            A dictionary representation of a row for a compound in the ModelSEED compound table set
+            up by anvi'o.
+
+        Returns
+        =======
+        ModelSEEDCompound
+            An object representation of the ModelSEED compound.
+        """
+        compound = ModelSEEDCompound()
+        compound.modelseed_id = modelseed_compound_data['id']
+
+        modelseed_name = modelseed_compound_data['name']
+        if pd.isna(modelseed_name):
+            compound.modelseed_name = None
+        else:
+            compound.modelseed_name = modelseed_name
+
+        kegg_aliases: str = modelseed_compound_data['KEGG']
+        if pd.isna(kegg_aliases):
+            compound.kegg_aliases = tuple()
+        else:
+            compound.kegg_aliases = tuple(kegg_aliases.split('; '))
+
+        formula = modelseed_compound_data['formula']
+        if pd.isna(formula):
+            compound.formula = None
+            # Compounds without formulas have a nominal charge of 10000000 in compounds.tsv: ignore it.
+            compound.charge = None
+        else:
+            compound.formula = formula
+            charge = modelseed_compound_data['charge']
+            if pd.isna(charge):
+                raise ConfigError(
+                    f"The charge of a ModelSEED compound, '{compound.modelseed_id}', was not recorded "
+                    "in 'compounds.tsv' but is expected to be present as an integer. Here is the data "
+                    f"in the row for the compound: '{modelseed_compound_data}'"
+                )
+            compound.charge = charge
+
+        return compound
+
+    def _get_database_reactions_table(self, network: ReactionNetwork) -> pd.DataFrame:
+        """
+        Make a reactions table that can be stored in either a contigs or pan database, as the tables
+        have the same structure. A `ReactionNetwork` can be reconstructed with the same data from
+        the reactions and metabolites tables of the database.
+
+        Parameters
+        ==========
+        network : ReactionNetwork
+            The reaction network generated from gene or gene cluster KO annotations
+
+        Returns
+        =======
+        pd.DataFrame
+            The table of reactions data to be stored in the contigs or pan database
         """
+        assert tables.gene_function_reactions_table_structure == tables.pan_gene_cluster_function_reactions_table_structure
+        assert tables.gene_function_reactions_table_types == tables.pan_gene_cluster_function_reactions_table_types
+
         # Transfer data from reaction objects to dictionaries mapping to table entries.
         reactions_data: Dict[str, Dict] = {}
         for modelseed_reaction_id, reaction in network.reactions.items():
@@ -2760,30 +3430,27 @@ def _store_contigs_database_reactions(self, network: GenomicNetwork, contigs_db:
 
         reactions_table = pd.DataFrame.from_dict(reactions_data, orient='index').reset_index(drop=True).sort_values('modelseed_reaction_id')
         reactions_table = reactions_table[tables.gene_function_reactions_table_structure]
+        return reactions_table
 
-        cdb = ContigsDatabase(contigs_db)
-        cdb.db._exec_many(
-            f'''INSERT INTO {tables.gene_function_reactions_table_name} VALUES ({','.join('?' * len(tables.gene_function_reactions_table_structure))})''',
-            reactions_table.values
-        )
-        cdb.disconnect()
-
-    def _store_contigs_database_metabolites(self, network: GenomicNetwork, contigs_db: str) -> None:
+    def _get_database_metabolites_table(self, network: ReactionNetwork) -> pd.DataFrame:
         """
-        Store metabolite data in the relevant contigs database table.
+        Make a metabolites table that can be stored in either a contigs or pan database, as the tables
+        have the same structure. A `ReactionNetwork` can be reconstructed with the same data from
+        the reactions and metabolites tables of the database.
 
         Parameters
         ==========
-        network : GenomicNetwork
-            The reaction network generated from gene KO annotations in the contigs database.
-
-        contigs_db : str
-            The path to the contigs database from which the reaction network was generated.
+        network : ReactionNetwork
+            The reaction network generated from gene or gene cluster KO annotations
 
         Returns
         =======
-        None
+        pd.DataFrame
+            The table of metabolites data to be stored in the contigs or pan database
         """
+        assert tables.gene_function_metabolites_table_structure == tables.pan_gene_cluster_function_metabolites_table_structure
+        assert tables.gene_function_metabolites_table_types == tables.pan_gene_cluster_function_metabolites_table_types
+
         # Transfer data from metabolite objects to dictionaries mapping to table entries.
         metabolites_data = {}
         for modelseed_compound_id, compound in network.metabolites.items():
@@ -2797,28 +3464,22 @@ def _store_contigs_database_metabolites(self, network: GenomicNetwork, contigs_d
 
         metabolites_table = pd.DataFrame.from_dict(metabolites_data, orient='index').reset_index(drop=True).sort_values('modelseed_compound_id')
         metabolites_table = metabolites_table[tables.gene_function_metabolites_table_structure]
+        return metabolites_table
 
-        cdb = ContigsDatabase(contigs_db)
-        cdb.db._exec_many(
-            f'''INSERT INTO {tables.gene_function_metabolites_table_name} VALUES ({','.join('?' * len(tables.gene_function_metabolites_table_structure))})''',
-            metabolites_table.values
-        )
-        cdb.disconnect()
-
-    def hash_ko_annotations(self, gene_function_calls_dict: Dict) -> str:
+    def hash_contigs_db_ko_annotations(self, gene_function_calls_dict: Dict) -> str:
         """
-        Hash gene KO annotations in a contigs database to concisely represent the data used to
-        construct a reaction network.
+        To concisely represent the data underlying a reaction network, hash all gene KO annotations
+        in the contigs database.
 
         Parameters
         ==========
         gene_function_calls_dict : str
-            Dictionary containing gene KO annotations loaded by a contigs superclass.
+            This dictionary is loaded by a contigs superclass and contains gene KO annotations.
 
         Returns
         =======
         str
-            Hash representation of all gene KO annotations.
+            Hash representation of all gene KO annotations
         """
         ko_annotations = []
         for gcid, gene_dict in gene_function_calls_dict.items():
@@ -2827,7 +3488,6 @@ def hash_ko_annotations(self, gene_function_calls_dict: Dict) -> str:
             ko_name = ko_data[1]
             e_value = ko_data[2]
             ko_annotations.append((str(gcid), ko_id, ko_name, str(e_value)))
-        # Sort KO annotation data in ascending order of gene caller ID and KO accession.
         ko_annotations = sorted(ko_annotations, key=lambda x: (x[0], x[1]))
 
         ko_annotations_string = ''
@@ -2837,30 +3497,58 @@ def hash_ko_annotations(self, gene_function_calls_dict: Dict) -> str:
         hashed_ko_annotations = hashlib.sha1(ko_annotations_string.encode('utf-8')).hexdigest()
         return hashed_ko_annotations
 
-    # def make_pangenomic_network(
-    #     self,
-    #     genomes_storage_db: str,
-    #     pan_db: str,
-    #     store: bool = True,
-    #     overwrite_existing_network: bool = False
-    # ) -> PangenomicNetwork:
-    #     """
-    #     Make a pangenomic metabolic reaction network from KEGG Orthologs stored a genomes storage
-    #     database and gene clusters stored in a pan database.
-
-    #     Parameters
-    #     ==========
-    #     genomes_storage_db : str
-    #         Path to a genomes storage database. The pangenomic network is derived from gene KO
-    #         annotations stored in the database.
-
-    #     pan_db : str
-    #         Path to a pan database. The pangenomic network is determined for gene clusters stored in
-    #         the database.
-
-    #     Returns
-    #     =======
-    #     PangenomicNetwork
-    #         The network derived from the pangenomic databases.
-    #     """
-    #     return
+    def hash_pan_db_ko_annotations(
+        self,
+        genomes_storage_db: str,
+        gene_clusters_functions_summary_dict: Dict,
+        consensus_threshold: float,
+        discard_ties: bool
+    ) -> str:
+        """
+        To concisely represent the data underlying a reaction network, hash all gene KO annotations
+        in the constituent genomes, all consensus KO annotations of the gene clusters, and
+        parameters used to select consensus KOs.
+
+        Parameters
+        ==========
+        genomes_storage_db : str
+            This is the path to a genomes storage database with the underlying gene KO annotations.
+
+        gene_clusters_functions_summary_dict : dict
+            This dictionary is loaded by a pan superclass and contains gene cluster KO annotations.
+
+        consensus_threshold : float, None
+            This parameter was used in setting consensus KO annotations of gene clusters.
+
+        discard_ties : bool, False
+            This parameter was used in setting consensus KO annotations of gene clusters.
+
+        Returns
+        =======
+        str
+            Hash representation of all gene KO annotations, all gene cluster consensus KO
+            annotations, and the parameters used to select consensus KOs
+        """
+        gsdb = dbinfo.GenomeStorageDBInfo(genomes_storage_db).load_db()
+        functions_table = gsdb.get_table_as_dataframe('gene_function_calls', where_clause='source = "KOfam"')
+        gsdb.disconnect()
+        gene_ko_annotations = []
+        for row in functions_table.itertuples(index=False):
+            gene_ko_annotations.append((row.genome_name, str(row.gene_callers_id), row.accession, row.function, str(row.e_value)))
+        gene_ko_annotations = sorted(gene_ko_annotations, key=lambda x: (x[0], x[1], x[2]))
+
+        # Use a separate list for gene clusters so the gene annotations above are not discarded.
+        gene_cluster_ko_annotations = []
+        for gene_cluster_id, gene_cluster_dict in gene_clusters_functions_summary_dict.items():
+            ko_data = gene_cluster_dict['KOfam']
+            ko_id = ko_data['accession']
+            ko_name = ko_data['function']
+            # When the KO ID and name are None, convert them into 'None'.
+            gene_cluster_ko_annotations.append((str(gene_cluster_id), str(ko_id), str(ko_name)))
+        gene_cluster_ko_annotations = sorted(gene_cluster_ko_annotations, key=lambda x: x[0])
+
+        ko_annotations_string = f'{consensus_threshold}_{int(discard_ties)}_'
+        for ko_annotation in gene_ko_annotations + gene_cluster_ko_annotations:
+            ko_annotations_string += ''.join(map(str, ko_annotation))
+
+        return hashlib.sha1(ko_annotations_string.encode('utf-8')).hexdigest()
diff --git a/anvio/cogs.py b/anvio/cogs.py
index c14041a710..1700af254d 100644
--- a/anvio/cogs.py
+++ b/anvio/cogs.py
@@ -702,7 +702,7 @@ def raise_error(line_num, line_content, fields, e):
         p_id_without_cog_id = set([])
 
         line_counter = 0
-        for line in open(input_file_path, 'rU').readlines():
+        for line in open(input_file_path, 'r').readlines():
             line_counter += 1
 
             if line_counter % 500 == 0:
@@ -823,7 +823,7 @@ def format_categories(self, input_file_path, output_file_path):
         progress.update('...')
 
         output = open(output_file_path, 'w')
-        for line in open(input_file_path, 'rU').readlines():
+        for line in open(input_file_path, 'r').readlines():
             if line.startswith('#'):
                 continue
 
@@ -951,7 +951,7 @@ def check_raw_data_hash_and_existence(self, input_file_path, output_file_path):
 
         # Get a dictionnary of checksums, the file is formatted as "checksum filename" per line
         checksums = {}
-        for line in open(input_file_path, 'rU').readlines():
+        for line in open(input_file_path, 'r').readlines():
             stripped = line.strip('\n').split(' ')
             file_name = stripped[-1].strip('*')
             checksums[file_name] = stripped[0]
diff --git a/anvio/data/static/template/inversions.tmpl b/anvio/data/static/template/inversions.tmpl
index e0da32bb93..c43e90167c 100644
--- a/anvio/data/static/template/inversions.tmpl
+++ b/anvio/data/static/template/inversions.tmpl
@@ -117,6 +117,7 @@
                                                 <tr>
                                                     <th>ID</th>
                                                     <th>Source</th>
+                                                    <th>Contig</th>
                                                     <th>Length</th>
                                                     <th>Direction</th>
                                                     <th>Start</th>
@@ -128,6 +129,7 @@
                                                 <tr>
                                                     <td>{{ gene|lookup:"gene_callers_id"|pretty }}</td>
                                                     <td>{{ gene|lookup:"source"|pretty }}</td>
+                                                    <td>{{ gene|lookup:"contig"|pretty }}</td>
                                                     <td>{{ gene|lookup:"length"|pretty }}</td>
                                                     <td>{{ gene|lookup:"direction"|pretty }}</td>
                                                     <td>{{ gene|lookup:"start"|pretty }}</td>
@@ -238,6 +240,14 @@
                                             <td width="25%">Length of the inversion</td>
                                             <td>{{ inversions|lookup:inversion|lookup:"inversion_data"|lookup:"distance"|pretty }}</td>
                                         </tr>
+                                        <tr>
+                                            <td width="25%">Start position</td>
+                                            <td>{{ inversions|lookup:inversion|lookup:"inversion_data"|lookup:"first_end"|pretty }}</td>
+                                        </tr>
+                                        <tr>
+                                            <td width="25%">Stop position</td>
+                                            <td>{{ inversions|lookup:inversion|lookup:"inversion_data"|lookup:"second_start"|pretty }}</td>
+                                        </tr>
                                         <tr>
                                             <td width="25%">Number of samples observed</td>
                                             <td>{{ inversions|lookup:inversion|lookup:"inversion_data"|lookup:"num_samples" }}</td>
@@ -256,6 +266,7 @@
                             <div class="panel-heading">
                                 Inverted Repeats
                             </div>
+
                             <div class="panel-body">
                                 <table class="table table-hover">
                                     <thead id="{{ inversion }}-table">
@@ -355,6 +366,35 @@
                                     </div>
                                 </div>
                             </div>
+                                
+                            <div class="panel panel-default" style="margin-right:10px; margin-left:10px;">
+                                <div class="panel-heading">
+                                    Motifs
+                                </div>
+                                <div class="panel-body image-panel">
+                                    <table class="table">
+                                        <tbody>
+                                                <tr>
+                                                    <td width="25%"><h5>Motif group</h5></td>
+                                                    <td><h5>Motif logo</h5></td>
+                                                </tr>
+                                                {% for motif in inversions|lookup:inversion|lookup:"motifs" %}
+                                                        <tr>
+                                                            <td width="15%" style="vertical-align:middle;">{{ motif }}</td>
+                                                            <td class="extra-long">
+                                                            {% if inversions|lookup:inversion|lookup:"motifs"|lookup:motif|lookup:'logo_path' == None %}
+                                                                MEME was not able to generate the motif's logo in png format, which means that you are missing cool logo pictures in this summary.<br>
+                                                                The logos are still available in .eps format in the output directory.
+                                                            {% else %}
+                                                                <img src="{{ inversions|lookup:inversion|lookup:"motifs"|lookup:motif|lookup:'logo_path' }}" alt="Motif logo" style="height:120px;">
+                                                            {% endif %}
+                                                            </td>
+                                                        </tr>
+                                                {% endfor %}
+                                        </tbody>
+                                    </table>
+                                </div>
+                            </div>
                         </div>
                     </div>
                 </div>
@@ -389,10 +429,19 @@
         white-space:normal;
         max-width: 300px;
     }
+    .extra-long{
+        white-space:normal;
+        max-width: 900px;
+    }
     #popover-panel{
         border: none;
         margin-bottom: 0px;
     }
+    .image-panel{
+        width: fit-content;
+        display: flex;
+        justify-content: left;
+    }
 </style>
 <script type="text/javascript">
     // Binding template to the Popover Content
diff --git a/anvio/dbops.py b/anvio/dbops.py
index de223efc37..ce700b784d 100644
--- a/anvio/dbops.py
+++ b/anvio/dbops.py
@@ -3983,15 +3983,17 @@ def init(self):
             return
 
         self.meta = dbi(self.db_path, expecting=self.db_type).get_self_table()
-
-        for key in ['num_genomes', 'gene_cluster_min_occurrence', 'use_ncbi_blast', 'exclude_partial_gene_calls', \
-                    'num_gene_clusters', 'num_genes_in_gene_clusters', 'gene_alignments_computed', 'items_ordered']:
+        for key in ['num_genomes', 'gene_cluster_min_occurrence', 'use_ncbi_blast', 'exclude_partial_gene_calls',
+                    'num_gene_clusters', 'num_genes_in_gene_clusters', 'gene_alignments_computed', 'items_ordered',
+                    'reaction_network_ko_annotations_hash', 'reaction_network_kegg_database_release',
+                    'reaction_network_modelseed_database_sha']:
             try:
                 self.meta[key] = int(self.meta[key])
             except:
                 pass
 
-        for key in ['min_percent_identity', 'minbit', 'mcl_inflation']:
+        for key in ['min_percent_identity', 'minbit', 'mcl_inflation',
+                    'reaction_network_consensus_threshold', 'reaction_network_discard_ties']:
             try:
                 self.meta[key] = float(self.meta[key])
             except:
@@ -4015,6 +4017,8 @@ def touch(self):
 
         # creating empty default tables for pan specific operations:
         self.db.create_table(t.pan_gene_clusters_table_name, t.pan_gene_clusters_table_structure, t.pan_gene_clusters_table_types)
+        self.db.create_table(t.pan_gene_cluster_function_reactions_table_name, t.pan_gene_cluster_function_reactions_table_structure, t.pan_gene_cluster_function_reactions_table_types)
+        self.db.create_table(t.pan_gene_cluster_function_metabolites_table_name, t.pan_gene_cluster_function_metabolites_table_structure, t.pan_gene_cluster_function_metabolites_table_types)
 
         # creating empty default tables for standard anvi'o pan dbs
         self.db.create_table(t.item_additional_data_table_name, t.item_additional_data_table_structure, t.item_additional_data_table_types)
@@ -4079,8 +4083,7 @@ def init(self):
         try:
             for key in ['split_length', 'kmer_size', 'total_length', 'num_splits', 'num_contigs',
                         'genes_are_called', 'splits_consider_gene_calls', 'scg_taxonomy_was_run',
-                        'trna_taxonomy_was_run', 'external_gene_calls', 'external_gene_amino_acid_seqs',
-                        'skip_predict_frame']:
+                        'trna_taxonomy_was_run', 'external_gene_calls', 'external_gene_amino_acid_seqs', 'skip_predict_frame']:
                 self.meta[key] = int(self.meta[key])
         except KeyError:
             raise ConfigError("Oh no :( There is a contigs database here at '%s', but it seems to be broken :( It is very "
@@ -4332,7 +4335,7 @@ def create(self, args):
 
         if description_file_path:
             filesnpaths.is_file_plain_text(description_file_path)
-            description = open(os.path.abspath(description_file_path), 'rU').read()
+            description = open(os.path.abspath(description_file_path), 'r').read()
         else:
             description = ''
 
@@ -4573,6 +4576,9 @@ def create(self, args):
         self.db.set_meta_value('scg_taxonomy_database_version', None)
         self.db.set_meta_value('trna_taxonomy_was_run', False)
         self.db.set_meta_value('trna_taxonomy_database_version', None)
+        self.db.set_meta_value('reaction_network_ko_annotations_hash', None)
+        self.db.set_meta_value('reaction_network_kegg_database_release', None)
+        self.db.set_meta_value('reaction_network_modelseed_database_sha', None)
         self.db.set_meta_value('creation_date', self.get_date())
         self.disconnect()
 
@@ -4951,7 +4957,7 @@ def get_description_in_db(anvio_db_path, run=run):
 
 def update_description_in_db_from_file(anvio_db_path, description_file_path, run=run):
     filesnpaths.is_file_plain_text(description_file_path)
-    description = open(os.path.abspath(description_file_path), 'rU').read()
+    description = open(os.path.abspath(description_file_path), 'r').read()
 
     update_description_in_db(anvio_db_path, description, run=run)
 
diff --git a/anvio/docs/artifacts/user-modules-data.md b/anvio/docs/artifacts/user-modules-data.md
index 73a8c01a3b..d3e3c8b74c 100644
--- a/anvio/docs/artifacts/user-modules-data.md
+++ b/anvio/docs/artifacts/user-modules-data.md
@@ -15,9 +15,11 @@ Also, think about how you will annotate each enzyme, because for each one you wi
 Enzyme comes from... | annotation program | ANNOTATION_SOURCE
 |:---|:---|:---|
 KEGG KOfam | %(anvi-run-kegg-kofams)s | Kofam
-NCBI COG (2020) | %(anvi-run-ncbi-cogs)s | COG20_FUNCTION
-NCBI COG (2014) | %(anvi-run-ncbi-cogs)s | COG14_FUNCTION
+NCBI COG (2020) | %(anvi-run-ncbi-cogs)s with `--cog-version COG20`| COG20_FUNCTION
+NCBI COG (2014) | %(anvi-run-ncbi-cogs)s with `--cog-version COG14`| COG14_FUNCTION
+archaeal COGs (2014) | %(anvi-run-ncbi-cogs)s with `--cog-version arCOG14`| arCOG14_FUNCTION
 PFAM | %(anvi-run-pfams)s | Pfam
+CAZy dbCAN | %(anvi-run-cazymes)s | CAZyme
 custom HMMs | %(anvi-run-hmms)s with `--hmm-source` and `--add-to-functions-table` parameters | name of directory given to `--hmm-source`
 other annotation strategy | %(anvi-import-functions)s | source defined in input file
 
diff --git a/anvio/docs/images/png/anvi-report-inversions-01.png b/anvio/docs/images/png/anvi-report-inversions-01.png
new file mode 100644
index 0000000000..193f93bbe4
Binary files /dev/null and b/anvio/docs/images/png/anvi-report-inversions-01.png differ
diff --git a/anvio/docs/images/png/anvi-report-inversions-02.gif b/anvio/docs/images/png/anvi-report-inversions-02.gif
new file mode 100644
index 0000000000..e1d2c12516
Binary files /dev/null and b/anvio/docs/images/png/anvi-report-inversions-02.gif differ
diff --git a/anvio/docs/images/png/anvi-report-inversions-03.png b/anvio/docs/images/png/anvi-report-inversions-03.png
new file mode 100644
index 0000000000..1d636f4e2d
Binary files /dev/null and b/anvio/docs/images/png/anvi-report-inversions-03.png differ
diff --git a/anvio/docs/images/png/anvi-report-inversions-04.png b/anvio/docs/images/png/anvi-report-inversions-04.png
new file mode 100644
index 0000000000..dc5c0e0ea7
Binary files /dev/null and b/anvio/docs/images/png/anvi-report-inversions-04.png differ
diff --git a/anvio/docs/images/png/anvi-report-inversions-05.png b/anvio/docs/images/png/anvi-report-inversions-05.png
new file mode 100644
index 0000000000..f7631f267e
Binary files /dev/null and b/anvio/docs/images/png/anvi-report-inversions-05.png differ
diff --git a/anvio/docs/images/png/metabolism_reconstruction.png b/anvio/docs/images/png/metabolism_reconstruction.png
index da0a0556f0..08f53bc25c 100644
Binary files a/anvio/docs/images/png/metabolism_reconstruction.png and b/anvio/docs/images/png/metabolism_reconstruction.png differ
diff --git a/anvio/docs/programs/anvi-estimate-metabolism.md b/anvio/docs/programs/anvi-estimate-metabolism.md
index ac688191da..2c9379976a 100644
--- a/anvio/docs/programs/anvi-estimate-metabolism.md
+++ b/anvio/docs/programs/anvi-estimate-metabolism.md
@@ -698,7 +698,7 @@ Once we have the completeness scores and copy numbers of all possible paths thro
 So if the module does not have any complete paths, then its copy number is 0. If it has one complete path, then its copy number is the copy number of that path. If there are multiple paths with highest completeness score, then its copy number is the maximum of the copy numbers of those paths - for example, let's say we have two paths, both of which are 90%% complete. One of those paths has a copy number of 1 and the other has a copy number of 3. The module copy number would be 3 in this case.
 
 {:.notice}
-We're making assumptions here again, just like we were when computing module completeness. Any of those paths (or none of them) could be the one that is used in the cell, and we don't know which one. But the idea here is that if a sample has the most copies of path X, there is probably a good reason that is has that many copies because microbial cells like to streamline their genomes whenever possible.
+We're making assumptions here again, just like we were when computing module completeness. Any of those paths (or none of them) could be the one that is used in the cell, and we don't know which one. But the idea here is that if a sample has the most copies of path X, there is probably a good reason that it has that many copies because microbial cells like to streamline their genomes whenever possible.
 
 One last note - if a module does not have any paths of highest completeness, we cannot compute the copy number. In this case, the copy number of the module will be reported as 'NA' in the output file(s).
 
diff --git a/anvio/docs/programs/anvi-report-inversions.md b/anvio/docs/programs/anvi-report-inversions.md
index 02275e33d9..c8f0358dab 100644
--- a/anvio/docs/programs/anvi-report-inversions.md
+++ b/anvio/docs/programs/anvi-report-inversions.md
@@ -1,8 +1,8 @@
 This program allows you to find genomic inversions using metagenomic read recruitment results, and their activity patterns across samples.
 
-An inversion is typically carried out by an invertase. This enzyme recognizes a pair of inverted repeats (IR), which are a special case of palindromic sequence where the repeats are facing inward on different DNA strands. The IRs are distant from each other and the invertase will invert the DNA fragment between the IRs.
+Specifically, this program searches for site-specific inversions, which are carried out by site-specific recombinases. These enzymes recognize a pair of inverted repeats (IRs). The IRs are distant from each other and the site-specific recombinase inverts the DNA fragment between the IRs.
 
-In brief, anvi'o leverages paired-read orientation (through the `--fetch-filter` mechanism in %(anvi-profile)s explained below) to locate regions of interest in a set of contigs. It screens for IRs within regions that are enriched in read pairs that are enriched in forward/forward or reverse/reverse orientations, and uses short-reads to confirm which IRs corrrespond to real inversions. Anvi'o can also compute the 'inversion activity', i.e., the relative proportion of each orientation of an inversion in each sample.
+In brief, anvi'o leverages paired-read orientation (through the `--fetch-filter` mechanism in %(anvi-profile)s explained below) to locate regions of interest in a set of contigs. It screens for IRs within regions that are enriched in read pairs that are enriched in forward/forward or reverse/reverse orientations, and uses short-reads to confirm which IRs correspond to real inversions. Anvi'o can also compute the 'inversion activity', i.e., the relative proportion of each orientation of an inversion in each sample.
 
 ### Anvi'o philosophy to find inversions
 
@@ -71,7 +71,7 @@ You can set the minimum distance between two palindromic sequences with `--min-d
 
 When searching for palindromes with mismatches, the algorithm will extend the palindrome length as much as possible, often including mismatches which are outside of the true palindrome sequences. The flag `--min-mismatch-distance-to-first-base` allows you to trim the palindrome when one or more mismatches are n nucleotides away from a palindrome's start or stop. The default value is 1, meaning that a palindrome `MMMMMM(X)M`, where M denotes matching nucleotides and X a mismatch, will be trimmed to the first 6 matches `MMMMMM`.
 
-There are currently two algorithms to find palindromes in anvi'o: numba and BLAST. Numba is very fast when looking for palindromes in short sequences, and BLAST is more efficient for longer stretches. Anvi'o dynamically set the algorithm accoding to each stretch length: numba for stretches under 5,000 bp and BLAST for longer stretches. You can use the flag `--palindrome-search-algorithm` to ask anvi'o to use either of these methods explicitly. Note that results between the two methods may differ.
+There are currently two algorithms to find palindromes in anvi'o: numba and BLAST. Numba is very fast when looking for palindromes in short sequences, and BLAST is more efficient for longer stretches. Anvi'o dynamically sets the algorithm according to each stretch length: numba for stretches under 5,000 bp and BLAST for longer stretches. You can use the flag `--palindrome-search-algorithm` to ask anvi'o to use either of these methods explicitly. Note that results between the two methods may differ.
 
 {{ codestart }}
 anvi-report-inversions -P %(bams-and-profiles-txt)s \
@@ -97,7 +97,7 @@ If you provide the short-reads R1 and R2 in the %(bams-and-profiles-txt)s, anvi'
 
 This is a very time consuming step, and if you have multiple sample, you can use the parameter `--num-threads` to set the maximum of threads for multithreading when possible.
 
-To compute the inversion's ratios, anvi'o designs in silco primers based on the palidrome sequence and the upstream/downstream genomic context to search short-reads in the raw fastq files. The variable `--oligo-primer-base-length` is used to control how much of the palindrome should be used to design the primers. The longer, the more specific, but if it is too long, fewer reads will match to the primer.
+To compute the inversion's ratios, anvi'o designs in silico primers based on the palindrome sequence and the upstream/downstream genomic context to search short-reads in the raw fastq files. The variable `--oligo-primer-base-length` is used to control how much of the palindrome should be used to design the primers. The longer, the more specific, but if it is too long, fewer reads will match to the primer.
 
 This step is very computationally intense, but you can test it with the parameter `--end-primer-search-after-x-hits`. Once the total number of reads reach this parameter, anvi'o will stop searching further and will continue with the next sample. This flag is only good for testing.
 
@@ -122,7 +122,7 @@ anvi-report-inversions -P %(bams-and-profiles-txt)s \
                        -o activity_calculations
 {{ codestop }}
 
-In this mode, %(anvi-report-inversions)s will not recalulate inversions, and only report the activity of inversions found in the input file across samples listed in the %(bams-and-profiles-txt)s file.
+In this mode, %(anvi-report-inversions)s will not recalculate inversions, and only report the activity of inversions found in the input file across samples listed in the %(bams-and-profiles-txt)s file.
 
 ### Reporting genomic context around inversions
 
@@ -134,6 +134,21 @@ To select a specific gene caller, you can use `--gene-caller`. The default is pr
 
 If you want to skip this step, you can use the flag `--skip-recovering-genomic-context`.
 
+### Searching for conserved motifs in inverted-repeats
+
+The inversions are carried out by site-specific recombinases, which recognize a DNA motif on each end of the invertible DNA fragment. This DNA motif is a relatively conserved palindrome separated by a short sequence called a spacer.
+
+A fascinating aspect of site-specific recombinases is that they can invert multiple sites, provided the DNA recognition motif is present. Some genomes can have **one** site-specific recombinase responsible for **many** inversions! Some genomes have a few site-specific recombinases regulating different sets of inversions.
+
+When you use this command, anvi'o will leverage the program [MEME](https://meme-suite.org/meme/tools/meme) to identify palindrome motifs in the inverted-repeats.
+It is done in two steps: 
+- Per inversion. Anvi'o searches for and reports three motifs. You can find the output of MEME in each inversion's directory (e.g. `PER_INV/INV_0001/MEME`).
+- For all inversions. Anvi'o searches for shared and conserved motifs across all inversions. By default it will search for as many motifs as there are inversions. This can be time consuming if you have a lot of inversions, and you can use the flag `--num-of-motifs` to specify the number of motifs to be reported. The output of MEME can be found here: `PER_INV/ALL_INVERSIONS/MEME`.
+
+In the final outputs, we report the 'motif group' for each inversion, which means that you can link together groups of inversions putatively associated with the same site-specific recombinase.
+
+If you want to skip this step, you can use the flag `--skip-search-for-motifs`.
+
 ### Targeted search
 
 If you are interested in a given contig region you can use the following flags to limit the search:
@@ -142,36 +157,86 @@ If you are interested in a given contig region you can use the following flags t
 * `--target-region-start`: the start position of the region of interest,
 * `--target-region-end`: the end position of the region of interest.
 
-### Output
-%(anvi-report-inversions)s searches for inversions in every single sample at a time and thus generates a TAB-delimited table for every sample: `INVERSIONS-IN-SAMPLE_01.txt`, `INVERSIONS-IN-SAMPLE_02`, ...
+### HTML output
+The first output of interest is `index.html`, which is a static HTML page with all the information about each inversion.
+
+At the top of this page, you will find general information such as the number of inversions found and links to some tab-delimited files that summarize all inversions:
+
+![html header](../../images/anvi-report-inversions-01.png)
+
+#### Genomic context
+
+![genomic_context](../../images/anvi-report-inversions-02.gif)
+
+For each inversion, you can see the genomic context. This part is interactive and allows you to inspect gene information such as functions, DNA and amino acid sequences.
+
+#### Activity
+
+![activity](../../images/anvi-report-inversions-03.png)
+
+If you provided short reads to the analysis, you can see barplots representing the inversion's activity. As explained in [the activity section](#computing-inversion-activity), anvi'o computes the activity on each end of an inversion, which explains the two barplots per sample. "Reference" corresponds to the relative proportion of short reads matching the inversion's orientation as found in your reference sequence, and "Inversion" corresponds to the relative proportion of short reads matching the reverse orientation.
+
+The two barplots per sample should be relatively similar. This is not the case when (1) the coverage is low (fewer reads = less accurate relative proportions) or (2) there is more than one pair of inverted repeats (IRs) at this genomic site. [Here](https://doi.org/10.1093/nar/gkaa824) is a nice example of multiple nested IRs. If you ever see this, you should consider re-running the command for that specific region with [targeted search](#targeted-search), and searching for all possible palindromes with `--check-all-palindromes`. Yes, anvi'o can report nested inversions with multiple IRs when you use these flags :rainbow:.
+
+It is possible to see more colors than the two for "Reference" and "Inversion". For instance, if you have a nested inversion with multiple IRs (lucky you), you should see another color (a variation of grey) indicating that more than one sequence can end up on this side of an inversion. Another reason is sequencing error. Anvi'o relies on exact matches to report "Reference" and "Inversion", and a single read mismatch can create a third category (and therefore a third color in the barplot). If you see some **red** color, it means more than 4 different DNA sequences can be found at the edge of an inversion, which means that something is probably wrong and requires some manual inspection (or you should collect your Nobel prize).
 
-These tables contains the following information:
+#### General information
 
-* entry ID,
-* contig name,
-* first palindrome sequence,
-* aligment midline,
-* second palindrome sequence,
-* start and stop position of the first and second palindrome sequence,
-* number of mismatches,
-* number of gaps,
-* length of the palindrome sequence,
-* distance between the first and second palindrome seqeuences, i.e. the size of the inversion,
-* the number of samples in which it was detected and confirmed,
-* the in silico primers used to compute the inversion's activity, for the first and second palindrome,
-* the oligo corresponding to the reference sequence.
+![general_information](../../images/anvi-report-inversions-04.png)
 
-Anvi'o eventually creates a consensus table with all the unique inversions found accross all your samples in a file called `INVERSIONS-CONSENSUS.txt`. This table has the same format as the individual sample outputs, with the 'entry ID' replaced by a unique inversion ID.
+General information about each inversion, such as contig, position, length, and the samples in which it was found.
 
-Another default output table is named `ALL-STRETCHES-CONSIDERED.txt` and it reports every stretch that passed the ['Identifying regions of interest'](#identifying-regions-of-interest) parameters. It reports the maximum coverage of FWD/FWD and REV/REV in that stretch, per sample. It also reports the number of palindromes found and if a true inversion was confirmed.
+#### Inverted repeats and motifs
 
-If the user enables the reporting of the genomic context, two addition TAB-delimited tables are generated: `INVERSIONS-CONSENSUS-SURROUNDING-GENES.txt` and `INVERSIONS-CONSENSUS-SURROUNDING-FUNCTIONS.txt`.
-The first table reports the gene calls surrounding every inversion when possible (inversions_id, gene_caller_id, start and stop position, orientation, gene_caller and contig).
-The second table reports the function associated with every gene call reported in the first file (inversions_id, gene_caller_id, source, accession, function).
+![ir_and_motifs](../../images/anvi-report-inversions-05.png)
 
-Finally, if the user provides R1 and R2 fastq files and enables the reporting of inversion's activity, %(anvi-report-inversions)s will generate a long-format file named `INVERSION-ACTIVITY.txt`. This file reports, for every inversion and sample, the relative proportion and read abundance of unique oligos, which either correspond to the reference contig (no inversion), or to an inversion sequence. The inversion's activity is computed and reported for both sides of each inversion.
+Here you can see the two inverted-repeats, their alignment, length and position. 
+You can also see the "primer" sequence used to search the short reads and report the activity, i.e. the relative proportion of an inversion's orientations per sample.
 
+And finally, you can see the palindromic motif likely recognized by the site-specific recombinase that carries out such an inversion.
+The same motif can occur in multiple inversions, which suggests that a single site-specific recombinase is responsible for a set of inversions.
+Typically there is only one motif per inversion, but we don't control biology, so it is possible that more than one motif is reported.
 
+### Other outputs
 
+%(anvi-report-inversions)s creates an output directory with the following structure (if you have not used any of the `--skip-[..]` flags):
 
+```
+INVERSIONS-OUTPUT/
+├── ALL-STRETCHES-CONSIDERED.txt
+├── INVERSION-ACTIVITY.txt
+├── INVERSIONS-CONSENSUS.txt
+├── PER_INV
+│   ├── ALL_INVERSIONS
+│   │   ├── MEME
+│   │   │   ├── logo1.eps
+│   │   │   ├── [...] 
+│   │   │   └── meme.xml
+│   │   ├── inverted_repeats.fasta
+│   │   └── run-MEME.log
+│   ├── INV_0001
+│   │   ├── MEME
+│   │   │   ├── logo1.eps
+│   │   │   ├── [...]
+│   │   │   └── meme.xml
+│   │   ├── SURROUNDING-FUNCTIONS.txt
+│   │   ├── SURROUNDING-GENES.txt
+│   │   ├── inverted_repeats.fasta
+│   │   └── run-MEME.log
+│   └── INV_0002
+│       ├── MEME
+│       │   ├── logo1.eps
+│       │   ├── [...]
+│       │   └── meme.xml
+│       ├── SURROUNDING-FUNCTIONS.txt
+│       ├── SURROUNDING-GENES.txt
+│       ├── inverted_repeats.fasta
+│       └── run-MEME.log
+├── PER_SAMPLE
+│   ├── INVERSIONS-IN-S01.txt
+│   ├── INVERSIONS-IN-S02.txt
+│   └── INVERSIONS-IN-S03.txt
+└── index.html
+```
 
+For more information about each of these txt files, go check %(inversions-txt)s.
diff --git a/anvio/docs/programs/anvi-setup-ncbi-cogs.md b/anvio/docs/programs/anvi-setup-ncbi-cogs.md
index 650754b2fb..7c8ed317b2 100644
--- a/anvio/docs/programs/anvi-setup-ncbi-cogs.md
+++ b/anvio/docs/programs/anvi-setup-ncbi-cogs.md
@@ -18,4 +18,69 @@ anvi-setup-ncbi-cogs --reset
 anvi-setup-ncbi-cogs --cog-version COG14
 {{ codestop }}
 
-Not sure which versions of %(cogs-data)s are available? You can type something random after the `--cog-version` parameter to see the options.
\ No newline at end of file
+Not sure which versions of %(cogs-data)s are available? You can type something random after the `--cog-version` parameter to see the options.
+
+### Always getting checksum errors? Instructions for manual downloads of the COG data (for COG 2020)
+
+Sometimes the NCBI servers drop incoming connections, leading to incomplete file downloads and errors like the following:
+
+```
+Config Error: Something went wrong with your download :/ The checksum we calculated for       
+              `cog-20.cog.csv` anvi'o just finished downloading does not match to the checksum
+              provided by the NCBI. This is most likely due to an interrupted download, as the
+              NCBI servers often prematurely end data transfers. Please try running the same  
+              command again with the `--reset` flag. 
+```
+
+If you have tried re-running `anvi-setup-ncbi-cogs` multiple times but are always getting checksum errors and are about to lose your mind, here is a set of commands that you can follow to manually download the data for the **2020 release of COGs** without having to go through the setup program every time. 
+
+First, you will need to move to the directory where anvi'o expects to find the COG files. This location will depend on where conda and anvi'o are installed on your computer, but if you have the anvi'o environment loaded in your terminal, you can easily get there by running the following:
+```
+cd $CONDA_PREFIX/lib/python3.10/site-packages/anvio/data/misc/COG/COG20/RAW_DATA_FROM_NCBI/
+```
+
+The files that anvi'o needs to see in that folder are the following:
+```
+checksum.md5.txt cog-20.def.tab   fun-20.tab
+cog-20.cog.csv   cog-20.fa.gz
+```
+
+Since you have already tried running `anvi-setup-ncbi-cogs` so many times, probably there are some of those files already in there. But the checksums of those files need to match those that are listed in the `checksum.md5.txt` file. For instance, if you look for `cog-20.cog.csv` inside the checksum file:
+
+```
+grep cog-20.cog.csv checksum.md5.txt
+```
+
+You will see the following line: ```1bed944a61e0ec404669361fb69ae52d  cog-20.cog.csv```
+which indicates that the file's checksum should match exactly to `1bed944a61e0ec404669361fb69ae52d`. If you run `md5sum cog-20.cog.csv`, you should see that exact string. If you don't see the same thing, it means the file has been incompletely downloaded, so it needs to be downloaded again. You can do it like this:
+
+```
+rm -rf cog-20.cog.csv
+
+curl -O https://ftp.ncbi.nih.gov/pub/COG/COG2020/data/cog-20.cog.csv
+
+md5sum cog-20.cog.csv
+```
+
+If you don't want to compare the strings manually, you can use the `diff` program to check that they are the same, like this:
+```
+grep cog-20.cog.csv checksum.md5.txt > expected_checksum
+md5sum cog-20.cog.csv > observed_checksum
+diff expected_checksum observed_checksum
+```
+If the two checksums match, you won't see any output from the `diff` command.
+
+Once you get a copy of the file with an exactly matching MD5 checksum, you can move on. 
+
+You should run `md5sum` on every file listed above (except for `checksum.md5.txt`), and check if it matches the corresponding string inside `checksum.md5.txt`. For any file with a non-matching MD5 checksum, you should download it using `curl` as we did above:
+```
+rm -rf [FILENAME THAT DOES NOT MATCH]
+curl -O https://ftp.ncbi.nih.gov/pub/COG/COG2020/data/[FILENAME THAT DOES NOT MATCH]
+```
+(make sure you change the file name at the end of the path to match the file that you need)
+
+After you have all the files with matching checksums, you can leave the data folder, and then re-run `anvi-setup-ncbi-cogs`, which should now work perfectly using the manually downloaded files:
+```
+cd
+anvi-setup-ncbi-cogs
+```
diff --git a/anvio/drivers/emapper.py b/anvio/drivers/emapper.py
index 7ea2d8fa53..dd94e9baa8 100644
--- a/anvio/drivers/emapper.py
+++ b/anvio/drivers/emapper.py
@@ -357,7 +357,7 @@ def populate_annotations_dict(self, annotations_file_path):
 
         num_entries_processed = 0
         self.progress.new('Parsing the annotations file')
-        for line in open(annotations_file_path, 'rU').readlines():
+        for line in open(annotations_file_path, 'r').readlines():
             if line.startswith('#') or line == '\n':
                 continue
 
diff --git a/anvio/fastalib.py b/anvio/fastalib.py
index 2da45c16f0..0980098ae7 100644
--- a/anvio/fastalib.py
+++ b/anvio/fastalib.py
@@ -97,7 +97,7 @@ def __init__(self, fasta_file_path, lazy_init=True, unique=False, allow_mixed_ca
         if self.compressed:
             self.file_pointer = gzip.open(self.fasta_file_path, mode="rt")
         else:
-            self.file_pointer = io.open(self.fasta_file_path, 'rU', newline='')
+            self.file_pointer = io.open(self.fasta_file_path, 'r', newline='')
 
         if not self.file_pointer.read(1) == '>':
             self.file_pointer.close()
diff --git a/anvio/filesnpaths.py b/anvio/filesnpaths.py
index 93327207de..a9d7939cbc 100644
--- a/anvio/filesnpaths.py
+++ b/anvio/filesnpaths.py
@@ -73,7 +73,7 @@ def is_proper_external_gene_calls_file(file_path):
     headers_proper = ['gene_callers_id', 'contig', 'start', 'stop', 'direction', 'partial', 'call_type', 'source', 'version', 'aa_sequence']
     call_types_allowed = set(list(constants.gene_call_types.values()))
 
-    with open(file_path, 'rU') as input_file:
+    with open(file_path, 'r') as input_file:
         headers = input_file.readline().strip().split('\t')
 
         if len(headers) == 10:
@@ -196,7 +196,7 @@ def is_file_empty(file_path):
 
 def is_file_tab_delimited(file_path, separator='\t', expected_number_of_fields=None, dont_raise=False):
     is_file_exists(file_path)
-    f = open(file_path, 'rU')
+    f = open(file_path, 'r')
 
     try:
         while True:
@@ -246,7 +246,7 @@ def is_file_json_formatted(file_path):
     is_file_exists(file_path)
 
     try:
-        json.load(open(file_path, 'rU'))
+        json.load(open(file_path, 'r'))
     except ValueError as e:
         raise FilesNPathsError("File '%s' does not seem to be a properly formatted JSON "
                            "file ('%s', cries the library)." % (file_path, e))
@@ -272,7 +272,7 @@ def is_file_plain_text(file_path, dont_raise=False):
     is_file_exists(file_path)
 
     try:
-        open(os.path.abspath(file_path), 'rU').read(512)
+        open(os.path.abspath(file_path), 'r').read(512)
     except IsADirectoryError:
         if dont_raise:
             return False
diff --git a/anvio/interactive.py b/anvio/interactive.py
index f397c0e56d..1564353064 100644
--- a/anvio/interactive.py
+++ b/anvio/interactive.py
@@ -546,7 +546,7 @@ def process_external_item_order(self):
 
         filesnpaths.is_file_exists(self.item_order_path)
 
-        item_order = [l.strip() for l in open(self.item_order_path, 'rU').readlines()]
+        item_order = [l.strip() for l in open(self.item_order_path, 'r').readlines()]
         self.run.info('Items order', 'An items order with %d items is found at %s.' % (len(item_order), self.item_order_path), mc='cyan')
 
         self.progress.new('External items order')
diff --git a/anvio/inversions.py b/anvio/inversions.py
index 3ac4b2d08d..072d20615a 100644
--- a/anvio/inversions.py
+++ b/anvio/inversions.py
@@ -6,6 +6,7 @@
 import copy
 import argparse
 import numpy as np
+import xml.etree.ElementTree as ET
 from collections import OrderedDict, Counter
 
 # multiprocess is a fork of multiprocessing that uses the dill serializer instead of pickle
@@ -75,6 +76,9 @@ def __init__(self, args, skip_sanity_check=False, run=terminal.Run(), progress=t
         # consensus inversions for downstream fun
         self.genomic_context_surrounding_consensus_inversions = {}
 
+        # in which we will store the motif info
+        self.motifs = {}
+
         # in which we will store all the static HTML output related stuff
         self.summary = {}
 
@@ -127,12 +131,15 @@ def __init__(self, args, skip_sanity_check=False, run=terminal.Run(), progress=t
         # stop inversion activity computation early for testing?
         self.end_primer_search_after_x_hits = A('end_primer_search_after_x_hits')
 
+        # this variable is used to filter out oligo supported by less than x reads
+        self.min_frequency = A('min_frequency_to_report') or 1
+
         # skip learning about the genomic context that surrounds inversions?
         self.skip_recovering_genomic_context = A('skip_recovering_genomic_context')
         self.gene_caller_to_consider_in_context = A('gene_caller') or 'prodigal'
         self.num_genes_to_consider_in_context = A('num_genes_to_consider_in_context') or 3
 
-        # paramters for motif search
+        # parameters for motif search
         self.skip_search_for_motifs = A('skip_search_for_motifs')
         self.num_of_motifs = A('num_of_motifs')
 
@@ -148,7 +155,7 @@ def __init__(self, args, skip_sanity_check=False, run=terminal.Run(), progress=t
         self.target_region_end = A('target_region_end')
 
         # these are the keys we are interested in finding in input files offered to reconstruct
-        # inverson profiles via the --pre-computed-inversions flag. NOTE that these keys are not ALL
+        # inversion profiles via the --pre-computed-inversions flag. NOTE that these keys are not ALL
         # keys that are used to build inversion profiles in the code, but the minimum set that
         # co-occur both sample-specific and consensus inversion reports. this way, the user can
         # attempt to characterize the activity of inversions found in a single sample if they wish:
@@ -936,6 +943,13 @@ def process_inversion_data_for_HTML_summary(self):
                                 self.summary['inversions'][inversion_id]['activity'][sample][oligo_primer][i]['start'] = i_start
                                 self.summary['inversions'][inversion_id]['activity'][sample][oligo_primer][i]['width'] = i_width
 
+        # add motif info
+        if self.skip_search_for_motifs:
+            pass
+        else:
+            for inversion_id in self.summary['inversions']:
+                self.summary['inversions'][inversion_id]['motifs'] =  copy.deepcopy(self.motifs[inversion_id]['motifs'])
+
 
     def recover_genomic_context_surrounding_inversions(self):
         """Learn about what surrounds the consensus inversion sites"""
@@ -1191,6 +1205,10 @@ def search_for_motifs(self):
 
         # are we checking for motifs?
         if self.skip_search_for_motifs:
+            # add motif info to consensus table
+            for entry in self.consensus_inversions:
+                inversion_id = entry['inversion_id']
+                entry['motif_group'] = 'NA'
             return
 
         # how many motifs should we look for?
@@ -1252,11 +1270,91 @@ def search_for_motifs(self):
         # search for as many motifs as inversions. Can be time consuming.
         self.use_motif_finder(fasta_path, meme_output, meme_log, num_motifs = self.num_of_motifs)
 
+        # parse the output xml
+        self.parse_motif_output(meme_output, meme_log)
+
         self.run.info('Reporting motifs in inverted repeats', output, nl_after=1)
 
 
+    def parse_motif_output(self, meme_output_path, meme_log):
+        """ After searching for conserved motifs in the inverted repeats, we want to report 
+        the motif's group for each inversions. Then we can see in the report (txt summary and 
+        html output) which inversions are linked together by site-specific invertase
+        """
+
+        # parse the xml output
+        tree = ET.parse(os.path.join(meme_output_path, "meme.xml"))
+        root = tree.getroot()
+
+        # for each inversion, we created 4 sequences. And MEME gave them a different id. 
+        # it looks like this
+        # INV_0001_first_IR: sequence_0
+        # INV_0001_first_IR_rc: sequence_1
+        # INV_0001_second_IR: sequence_2
+        # INV_0001_second_IR_rc: sequence_3
+        # ...
+        # we need to associate MEME id with each inversion id
+        for seq in root.findall('training_set/sequence'):
+            inversion_id = seq.get('name').split("_")[0] + "_" + seq.get('name').split("_")[1]
+            if inversion_id not in self.motifs:
+                self.motifs[inversion_id] = {'seq_list': [seq.get('id')]}
+            else:
+                self.motifs[inversion_id]['seq_list'].append(seq.get('id'))
+
+        # collect the motif regex and path to output figure
+        motif_dict = {}
+        is_path_to_logo = False
+        for motif in root.findall('motifs/motif'):
+            motif_id = motif.get('id')
+
+            # get the regex
+            regex = motif.find('regular_expression')
+            motif_dict[motif_id] = {'regex': regex.text.replace('\n', '', 2),
+                                    'logo_path': None}
+
+            # add the path to the logo image
+            logo_name_png = ''.join(['logo', motif.get('id').split('motif_')[1], '.png'])
+            path_to_logo = os.path.join('PER_INV', 'ALL_INVERSIONS', 'MEME', logo_name_png)
+            if os.path.isfile(os.path.join(self.output_directory, path_to_logo)):
+                motif_dict[motif_id]['logo_path'] = path_to_logo
+                is_path_to_logo = True
+
+        # no png logo? look at MEME log file
+        # may need to add ghostscript to list of mamba package
+        if not is_path_to_logo:
+            self.run.warning(None, header="SEARCHING DNA MOTIFS WITH MEME", lc="yellow")
+            self.run.info_single(f"MEME was not able to generate the motif's logo in png format, which means that you are missing "
+                                 f"some cool logo pictures in the final html summary. The logos are still available in .eps format here: "
+                                 f"{meme_output_path}. If you want to fix this issue, you should look at the log output of MEME: {meme_log}",
+                                 level=0, nl_after=1)
+
+        # anvi'o provides 4 sequences per inversions site. we want to keep only 
+        # motifs that occur on all 4 sequences.
+        for sites in root.findall('scanned_sites_summary/scanned_sites'):
+            for inversion_id, inversion_dict in self.motifs.items():
+                if 'motifs' not in self.motifs[inversion_id]:
+                    self.motifs[inversion_id]['motifs'] = {}
+                if sites.get('sequence_id') in inversion_dict['seq_list']:
+                    motif_per_seq = {}
+                    for site in sites:
+                        motif_id = site.get('motif_id')
+                        motif_per_seq[motif_id] = {'motif_id': motif_id, **motif_dict[motif_id]}
+
+                    if not self.motifs[inversion_id]['motifs']:
+                        self.motifs[inversion_id]['motifs'] = motif_per_seq
+                    else:
+                        intersection_dict = {key: motif_per_seq[key] for key in self.motifs[inversion_id]['motifs'].keys() & motif_per_seq.keys()}
+                        self.motifs[inversion_id]['motifs'] = intersection_dict
+
+        # add motif info to consensus table
+        for entry in self.consensus_inversions:
+            inversion_id = entry['inversion_id']
+            motif_list = list(self.motifs[inversion_id]['motifs'])
+            entry['motif_group'] = ','.join(motif_list)
+
+
     @staticmethod
-    def compute_inversion_activity_for_sample(input_queue, output_queue, samples_dict, primers_dict, oligo_length=6, end_primer_search_after_x_hits=None, run=run_quiet, progress=progress_quiet):
+    def compute_inversion_activity_for_sample(input_queue, output_queue, samples_dict, primers_dict, min_frequency, oligo_length=6, end_primer_search_after_x_hits=None, run=run_quiet, progress=progress_quiet):
         """Go back to the raw metagenomic reads to compute activity of inversions for a single sample.
 
         Returns
@@ -1289,6 +1387,7 @@ def compute_inversion_activity_for_sample(input_queue, output_queue, samples_dic
             args = argparse.Namespace(samples_dict=samples_dict_for_sample,
                                       primers_dict=primers_dict,
                                       min_remainder_length=oligo_length,
+                                      min_frequency=min_frequency,
                                       only_keep_remainder=True)
 
             # if the user is testing:
@@ -1307,8 +1406,8 @@ def compute_inversion_activity_for_sample(input_queue, output_queue, samples_dic
                 reads_found = False
 
                 for oligo, frequency in oligos_frequency_dict.items():
-                    sample_counts.append((sample_name, primer_name, oligo, oligo == primers_dict[primer_name]['oligo_reference'], frequency, frequency / num_oligos))
-                    if frequency:
+                    if frequency > min_frequency:
+                        sample_counts.append((sample_name, primer_name, oligo, oligo == primers_dict[primer_name]['oligo_reference'], frequency, frequency / num_oligos))
                         reads_found = True
 
                 # if the reference oligo has no frequency but reads were found for other oligo
@@ -1424,8 +1523,10 @@ def compute_inversion_activity(self):
                                                    output_queue,
                                                    self.profile_db_bam_file_pairs,
                                                    primers_dict,
+                                                   self.min_frequency,
                                                    self.oligo_length,
                                                    self.end_primer_search_after_x_hits),
+
                                              kwargs=({'progress': self.progress if self.num_threads == 1 else progress_quiet}))
             workers.append(worker)
             worker.start()
@@ -1569,6 +1670,15 @@ def process(self):
         else:
             self.run.info("[Genomic context] Recover and report genomic context?",  "False", mc="red", nl_after=1)
 
+        if not self.skip_search_for_motifs:
+            if self.num_of_motifs:
+                self.run.info("[Search for motifs] Search for DNA motifs?", "True", mc="green")
+                self.run.info("[Search for motifs] Number of motifs to search", self.num_of_motifs, nl_after=1)
+            else:
+                self.run.info("[Search for motifs] Search for DNA motifs?", "True", mc="green", nl_after=1)
+        else:
+            self.run.info("[Search for motifs] Search for DNA motifs?", "False", mc="red", nl_after=1)
+
         # are we to compute inversion activity by going through raw reads?
         inversion_activity_will_be_computed = self.raw_r1_r2_reads_are_present and not self.skip_compute_inversion_activity
         self.run.info("[Inversion activity] Compute inversion activity?",  "True" if inversion_activity_will_be_computed else "False", mc=("green" if inversion_activity_will_be_computed else "red"))
@@ -1583,8 +1693,10 @@ def process(self):
             self.run.info("[Inversion activity] Number of threads", self.num_threads, mc=("green" if self.num_threads > 1 else "red"))
             if self.end_primer_search_after_x_hits:
                 self.run.info("[Inversion activity] Oligo primer base length", self.oligo_primer_base_length)
+                self.run.info("[Inversion activity] Minimum frequency reported", self.min_frequency)
                 self.run.info("[Inversion activity Debug] Num hits to end primer search",  self.end_primer_search_after_x_hits, mc="red", nl_after=1)
             else:
+                self.run.info("[Inversion activity] Minimum frequency reported", self.min_frequency)
                 self.run.info("[Inversion activity] Oligo primer base length", self.oligo_primer_base_length, nl_after=1)
 
         if self.target_contig:
@@ -1633,7 +1745,7 @@ def process(self):
 
         # here we will process and summarize all inversion data to populate `self.summary`
         # so it is ready to be used to render a static HTML output
-        self.process_inversion_data_for_HTML_summary()
+        # self.process_inversion_data_for_HTML_summary()
 
         # Do all reporting
         self.report()
@@ -1748,21 +1860,6 @@ def report(self):
             else:
                 self.run.info(f'Inversions in {entry_name}', 'No true inversions in this one :/', mc='red')
 
-        headers = ['inversion_id', 'contig_name', 'first_seq', 'midline', 'second_seq', 'first_start',
-                   'first_end', 'second_start', 'second_end', 'num_mismatches', 'num_gaps', 'length',
-                   'distance', 'num_samples', 'sample_names', 'first_oligo_primer',  'first_oligo_reference',
-                   'second_oligo_primer', 'second_oligo_reference']
-
-        ################################################################################################
-        # Consensus inversions
-        ################################################################################################
-        output_path = os.path.join(self.output_directory, 'INVERSIONS-CONSENSUS.txt')
-        with open(output_path, 'w') as output:
-            output.write('\t'.join(headers) + '\n')
-            for v in self.consensus_inversions:
-                output.write('\t'.join([f"{v[k]}" for k in headers]) + '\n')
-        self.run.info('Reporting file for consensus inversions', output_path, mc='green', nl_before=1)
-
         ################################################################################################
         # All stretches considered
         ################################################################################################
@@ -1781,9 +1878,25 @@ def report(self):
         ################################################################################################
         self.search_for_motifs()
 
+        ################################################################################################
+        # Consensus inversions
+        ################################################################################################
+        headers = ['inversion_id', 'contig_name', 'first_seq', 'midline', 'second_seq', 'first_start',
+                   'first_end', 'second_start', 'second_end', 'num_mismatches', 'num_gaps', 'length',
+                   'distance', 'num_samples', 'sample_names', 'motif_group', 'first_oligo_primer',
+                   'first_oligo_reference', 'second_oligo_primer', 'second_oligo_reference']
+
+        output_path = os.path.join(self.output_directory, 'INVERSIONS-CONSENSUS.txt')
+        with open(output_path, 'w') as output:
+            output.write('\t'.join(headers) + '\n')
+            for v in self.consensus_inversions:
+                output.write('\t'.join([f"{v[k]}" for k in headers]) + '\n')
+        self.run.info('Reporting file for consensus inversions', output_path, mc='green', nl_before=1)
+
         ################################################################################################
         # Generate HTML summary
         ################################################################################################
+        self.process_inversion_data_for_HTML_summary()
         SummaryHTMLOutput(self.summary, r=self.run, p=self.progress).generate()
 
 
diff --git a/anvio/kegg.py b/anvio/kegg.py
index 7398020b7a..4f25761453 100644
--- a/anvio/kegg.py
+++ b/anvio/kegg.py
@@ -924,7 +924,7 @@ def process_pathway_file(self):
         filesnpaths.is_file_exists(self.kegg_pathway_file)
         filesnpaths.is_file_plain_text(self.kegg_pathway_file)
 
-        f = open(self.kegg_pathway_file, 'rU')
+        f = open(self.kegg_pathway_file, 'r')
         self.progress.new("Parsing KEGG Pathway file")
 
         current_category = None
@@ -998,7 +998,7 @@ def get_accessions_from_htext_file(self, htext_file):
         filesnpaths.is_file_exists(htext_file)
         filesnpaths.is_file_plain_text(htext_file)
 
-        f = open(htext_file, 'rU')
+        f = open(htext_file, 'r')
         self.progress.new(f"Parsing KEGG htext file: {htext_file}")
 
         target_level = None
@@ -1077,7 +1077,7 @@ def download_generic_flat_file(self, accession, download_dir="./"):
         utils.download_file(self.kegg_rest_api_get + '/' + accession,
             file_path, progress=self.progress, run=self.run)
         # verify entire file has been downloaded
-        f = open(file_path, 'rU')
+        f = open(file_path, 'r')
         f.seek(0, os.SEEK_END)
         f.seek(f.tell() - 4, os.SEEK_SET)
         last_line = f.readline().strip('\n')
@@ -1146,7 +1146,7 @@ def download_pathways(self):
             utils.download_file(self.kegg_rest_api_get + '/' + konum,
                 file_path, progress=self.progress, run=self.run)
             # verify entire file has been downloaded
-            f = open(file_path, 'rU')
+            f = open(file_path, 'r')
             f.seek(0, os.SEEK_END)
             f.seek(f.tell() - 4, os.SEEK_SET)
             last_line = f.readline().strip('\n')
@@ -1528,7 +1528,7 @@ def process_module_file(self):
         filesnpaths.is_file_exists(self.kegg_module_file)
         filesnpaths.is_file_plain_text(self.kegg_module_file)
 
-        f = open(self.kegg_module_file, 'rU')
+        f = open(self.kegg_module_file, 'r')
         self.progress.new("Parsing KEGG Module file")
 
         current_module_type = None
@@ -1641,7 +1641,7 @@ def confirm_downloaded_modules(self):
                                   f"on your computer. Very sorry to tell you this, but you need to re-download the KEGG "
                                   f"data. We recommend the --reset flag.")
             # verify entire file has been downloaded
-            f = open(file_path, 'rU')
+            f = open(file_path, 'r')
             f.seek(0, os.SEEK_END)
             f.seek(f.tell() - 4, os.SEEK_SET)
             last_line = f.readline().strip('\n')
@@ -2401,7 +2401,7 @@ class is nothing but one that iterates through all contigs DBs
         A = lambda x: args.__dict__[x] if x in args.__dict__ else None
         self.metagenome_mode = True if A('metagenome_mode') else False
         self.module_completion_threshold = A('module_completion_threshold') or 0.75
-        self.output_file_prefix = A('output_file_prefix') or "kegg-metabolism"
+        self.output_file_prefix = A('output_file_prefix') or "metabolism"
         self.write_dict_to_json = True if A('get_raw_data_as_json') else False
         self.json_output_file_path = A('get_raw_data_as_json')
         self.store_json_without_estimation = True if A('store_json_without_estimation') else False
@@ -5327,11 +5327,20 @@ def generate_output_dict_for_modules(self, kegg_superdict, headers_to_include=No
                         if "annotated_enzymes_in_path" in headers_to_include:
                             annotated = []
                             for accession in p:
-                                if (accession in self.all_modules_in_db and mod_dict[accession]["pathwise_is_complete"]) or \
-                                   (accession in c_dict['kofam_hits'].keys()):
-                                    annotated.append(accession)
+                                # handle enzyme components
+                                if '+' in accession or '-' in accession:
+                                    components = re.split(r'\+|\-', accession)
+                                    for c in components:
+                                        if c in c_dict['kofam_hits'].keys():
+                                            annotated.append(c)
+                                        else:
+                                            annotated.append(f"[MISSING {c}]")
                                 else:
-                                    annotated.append(f"[MISSING {accession}]")
+                                    if (accession in self.all_modules_in_db and mod_dict[accession]["pathwise_is_complete"]) or \
+                                    (accession in c_dict['kofam_hits'].keys()):
+                                        annotated.append(accession)
+                                    else:
+                                        annotated.append(f"[MISSING {accession}]")
                             d[self.modules_unique_id]["annotated_enzymes_in_path"] = ",".join(annotated)
 
                         # add path-level redundancy if requested
@@ -6668,7 +6677,7 @@ def create(self):
         for mnum in self.module_dict.keys():
             self.progress.update("Parsing Module %s" % mnum)
             mod_file_path = os.path.join(self.module_data_directory, mnum)
-            f = open(mod_file_path, 'rU')
+            f = open(mod_file_path, 'r')
 
             prev_data_name_field = None
             module_has_annotation_source = False
diff --git a/anvio/mcgclassifier.py b/anvio/mcgclassifier.py
index 2d9f0b0bb3..bd38770778 100644
--- a/anvio/mcgclassifier.py
+++ b/anvio/mcgclassifier.py
@@ -92,7 +92,7 @@ def __init__(self, args, run=run, progress=progress):
         if self.exclude_samples:
             # check that there is a file like this
             filesnpaths.is_file_exists(self.exclude_samples)
-            self.samples_to_exclude = set([l.split('\t')[0].strip() for l in open(self.exclude_samples, 'rU').readlines()])
+            self.samples_to_exclude = set([l.split('\t')[0].strip() for l in open(self.exclude_samples, 'r').readlines()])
 
             if not self.samples_to_exclude:
                 raise ConfigError("You asked to exclude samples, but provided an empty list.")
@@ -102,7 +102,7 @@ def __init__(self, args, run=run, progress=progress):
         if self.include_samples:
             # check that there is a file like this
             filesnpaths.is_file_exists(self.include_samples)
-            self.samples_to_include = set([l.split('\t')[0].strip() for l in open(self.include_samples, 'rU').readlines()])
+            self.samples_to_include = set([l.split('\t')[0].strip() for l in open(self.include_samples, 'r').readlines()])
 
             if not self.samples_to_include:
                 raise ConfigError("You provided an empty list of samples to include.")
diff --git a/anvio/merger.py b/anvio/merger.py
index 0e2aa44480..440f07a592 100644
--- a/anvio/merger.py
+++ b/anvio/merger.py
@@ -334,7 +334,7 @@ def sanity_check(self):
         # do we have a description file?
         if self.description_file_path:
             filesnpaths.is_file_plain_text(self.description_file_path)
-            self.description = open(os.path.abspath(self.description_file_path), 'rU').read()
+            self.description = open(os.path.abspath(self.description_file_path), 'r').read()
 
 
     def set_sample_id(self):
diff --git a/anvio/migrations/contigs/v21_to_v22.py b/anvio/migrations/contigs/v21_to_v22.py
new file mode 100644
index 0000000000..e5c4f29816
--- /dev/null
+++ b/anvio/migrations/contigs/v21_to_v22.py
@@ -0,0 +1,69 @@
+#!/usr/bin/env python
+# -*- coding: utf-8
+
+import sys
+import argparse
+
+import anvio.dbinfo as dbinfo
+import anvio.terminal as terminal
+
+from anvio.errors import ConfigError
+
+current_version, next_version = [x[1:] for x in __name__.split('_to_')]  # a module named 'v21_to_v22' yields '21' and '22'
+
+run = terminal.Run()  # module-level reporter; migrate() uses it for the final message
+progress = terminal.Progress()  # module-level progress display used by migrate()
+
+def migrate(db_path):
+    """Upgrade a contigs database from `current_version` to `next_version`, adding any missing reaction network metavariables."""
+    if db_path is None:
+        raise ConfigError("No database path is given.")
+
+    contigs_db_info = dbinfo.ContigsDBInfo(db_path)
+    if str(contigs_db_info.version) != current_version:
+        raise ConfigError(
+            f"The version of the provided contigs database is {contigs_db_info.version}, "
+            f"not the required version, {current_version}, so this script cannot upgrade the database.")
+
+    progress.new("Migrating")
+    progress.update("Adding any missing database metavariables")
+
+    existing_meta = contigs_db_info.get_self_table()
+    contigs_db = contigs_db_info.load_db()
+    network_keys = ('reaction_network_ko_annotations_hash',
+                    'reaction_network_kegg_database_release',
+                    'reaction_network_modelseed_database_sha')
+    # placeholders are only added for the metavariables the self table does not already have
+    for absent_key in [k for k in network_keys if k not in existing_meta]:
+        contigs_db.set_meta_value(absent_key, None)
+
+    progress.update("Updating version")
+    contigs_db.remove_meta_key_value_pair('version')
+    contigs_db.set_version(next_version)
+
+    progress.update("Committing changes")
+    contigs_db.disconnect()
+
+    progress.end()
+
+    congratulations = (
+        "Congratulations! Your contigs database is now version 22. This update fixes a bug that prevented "
+        "construction and storage of a metabolic reaction network in version 21 databases that were created "
+        "from scratch and not migrated from version 20. You can blame the author of this script for the "
+        "oversight responsible for the bug and this annoying migration. If the version 21 database was "
+        "created from scratch, then placeholders for three 'metavariables' should now have been added to the "
+        "database; if the version 21 database migrated from version 20, then nothing at all should have "
+        "changed in the database except the version number."
+    )
+    run.info_single(congratulations, nl_after=1, nl_before=1, mc='green')
+
+if __name__ == '__main__':  # NOTE(review): here __name__ is '__main__', so the `__name__.split('_to_')` unpacking near the top of this file gets a single item -- confirm direct execution is reachable
+    parser = argparse.ArgumentParser(description=f"A simple script to upgrade an anvi'o contigs database from version {current_version} to version {next_version}")
+    parser.add_argument("contigs_db", metavar="CONTIGS_DB", help=f"An anvi'o contigs database of version {current_version}")
+    args, unknown = parser.parse_known_args()  # arguments the parser does not recognize land in `unknown` and are not used
+
+    try:
+        migrate(args.contigs_db)
+    except ConfigError as e:
+        print(e)  # report the configuration error, then exit with a non-zero status
+        sys.exit(-1)
diff --git a/anvio/migrations/genomestorage/v4_to_v5.py b/anvio/migrations/genomestorage/v4_to_v5.py
index 85e37d67c3..9edf137702 100755
--- a/anvio/migrations/genomestorage/v4_to_v5.py
+++ b/anvio/migrations/genomestorage/v4_to_v5.py
@@ -92,11 +92,11 @@ def migrate(db_path):
             attr = I(genome_name, column_name)
 
             if attr.dtype == 'int64':
-                values += (int(attr.value), )
+                values += (int(attr[()]), )
             elif attr.dtype == 'float64':
-                values += (float(attr.value), )
+                values += (float(attr[()]), )
             else:
-                values += ((attr.value), )
+                values += ((attr[()]), )
 
         genome_info_entries.append(values)
     genomes_db.insert_many(genome_info_table_name, entries=genome_info_entries)
@@ -106,7 +106,7 @@ def migrate(db_path):
     gene_entries = []
     for genome_name in genome_names:
         for gene_callers_id in fp['/data/genomes/%s' % genome_name]:
-            G = lambda key: fp['/data/genomes/%s/%s/%s' % (genome_name, gene_callers_id, key)].value
+            G = lambda key: fp['/data/genomes/%s/%s/%s' % (genome_name, gene_callers_id, key)][()]
             gene_entries.append((genome_name, gene_callers_id, G('aa_sequence'), G('dna_sequence'), int(G('partial')), int(G('length')), ))
     genomes_db.insert_many(gene_info_table_name, entries=gene_entries)
     del gene_entries
@@ -119,7 +119,7 @@ def migrate(db_path):
             functions_path = '/data/genomes/%s/%s/functions' % (genome_name, gene_callers_id)
             if functions_path in fp:
                 for source in fp[functions_path]:
-                    annotation_list = str(fp['/data/genomes/%s/%s/functions/%s' % (genome_name, gene_callers_id, source)].value).split('|||')
+                    annotation_list = str(fp['/data/genomes/%s/%s/functions/%s' % (genome_name, gene_callers_id, source)][()]).split('|||')
 
                     functions_entries.append((genome_name, entry_id_counter, gene_callers_id, source, annotation_list[0], annotation_list[1], 0, ))
                     entry_id_counter += 1
diff --git a/anvio/migrations/pan/v16_to_v17.py b/anvio/migrations/pan/v16_to_v17.py
new file mode 100644
index 0000000000..e8547be21d
--- /dev/null
+++ b/anvio/migrations/pan/v16_to_v17.py
@@ -0,0 +1,93 @@
+#!/usr/bin/env python
+# -*- coding: utf-8
+
+import sys
+import argparse
+
+import anvio.dbinfo as dbinfo
+import anvio.terminal as terminal
+
+from anvio.errors import ConfigError
+
+run = terminal.Run()  # module-level reporter; migrate() uses it for the final message
+progress = terminal.Progress()  # module-level progress display used by migrate()
+
+current_version, next_version = [x[1:] for x in __name__.split('_to_')]  # a module named 'v16_to_v17' yields '16' and '17'
+
+pan_gene_cluster_function_reactions_table_name        = 'gene_cluster_function_reactions'  # name/structure/types of the reactions table that migrate() creates
+pan_gene_cluster_function_reactions_table_structure   = ['modelseed_reaction_id', 'modelseed_reaction_name', 'ko_kegg_reaction_source', 'ko_ec_number_source', 'other_kegg_reaction_ids', 'other_ec_numbers', 'metabolite_modelseed_ids', 'stoichiometry', 'compartments', 'reversibility']
+pan_gene_cluster_function_reactions_table_types       = [         'text'        ,            'text'        ,          'text'          ,         'text'       ,         'text'           ,       'text'      ,           'text'          ,      'text'    ,     'text'    ,      'bool'    ]
+
+pan_gene_cluster_function_metabolites_table_name      = 'gene_cluster_function_metabolites'  # name/structure/types of the metabolites table that migrate() creates
+pan_gene_cluster_function_metabolites_table_structure = ['modelseed_compound_id', 'modelseed_compound_name', 'kegg_aliases', 'formula', 'charge']
+pan_gene_cluster_function_metabolites_table_types     = [         'text'        ,           'text'         ,     'text'    ,   'text' , 'numeric']
+
+def migrate(db_path):
+    """Upgrade an anvi'o pan database from `current_version` to `next_version`.
+
+    Recreates the two (empty) reaction network tables, resets the related metavariables to None,
+    and updates the version. Raises ConfigError if `db_path` is None or the version is unexpected.
+    """
+    if db_path is None:
+        raise ConfigError("No database path is given.")
+
+    pan_db_info = dbinfo.PanDBInfo(db_path)
+    if str(pan_db_info.version) != current_version:
+        raise ConfigError(
+            f"The version of the provided pan database is {pan_db_info.version}, not the required version, "
+            f"{current_version}, so this script cannot upgrade the database.")
+
+    pan_db = pan_db_info.load_db()
+
+    if str(pan_db.get_version()) != current_version:
+        raise ConfigError("Version of this pan database is not %s (hence, this script cannot really do anything)." % current_version)
+
+    progress.new("Migrating")
+    progress.update("Creating two new tables for reactions and metabolites")
+
+    table_names = (pan_gene_cluster_function_reactions_table_name, pan_gene_cluster_function_metabolites_table_name)
+    meta_keys = ('reaction_network_ko_annotations_hash', 'reaction_network_kegg_database_release',
+                 'reaction_network_modelseed_database_sha', 'reaction_network_consensus_threshold',
+                 'reaction_network_discard_ties')
+
+    # To be on the safe side, remove any reaction network tables and metadata that might exist. Every
+    # removal is attempted on its own, so a single failure does not skip the rest of the clean-up.
+    for remove, targets in ((pan_db.drop_table, table_names), (pan_db.remove_meta_key_value_pair, meta_keys)):
+        for target in targets:
+            try:
+                remove(target)
+            except Exception:
+                pass
+
+    for key in meta_keys:
+        pan_db.set_meta_value(key, None)
+    pan_db.create_table(pan_gene_cluster_function_reactions_table_name, pan_gene_cluster_function_reactions_table_structure, pan_gene_cluster_function_reactions_table_types)
+    pan_db.create_table(pan_gene_cluster_function_metabolites_table_name, pan_gene_cluster_function_metabolites_table_structure, pan_gene_cluster_function_metabolites_table_types)
+
+    progress.update("Updating version")
+    pan_db.remove_meta_key_value_pair('version')
+    pan_db.set_version(next_version)
+
+    progress.update("Committing changes")
+    pan_db.disconnect()
+
+    progress.end()
+
+    message = (
+        "Congratulations! Your pan database is now version 17, which means it now contains two new empty tables. "
+        "These tables are not as boring as they first appear, because you can now run `anvi-reaction-network` to store "
+        "a network of the metabolic reactions that may be encoded by gene clusters. A metabolic model representing the "
+        "network can be exported from the database using `anvi-get-metabolic-model-file`."
+    )
+    run.info_single(message, nl_after=1, nl_before=1, mc='green')
+
+if __name__ == '__main__':  # NOTE(review): here __name__ is '__main__', so the `__name__.split('_to_')` unpacking near the top of this file gets a single item -- confirm direct execution is reachable
+    parser = argparse.ArgumentParser(description='A simple script to upgrade the pan database from version %s to version %s' % (current_version, next_version))
+    parser.add_argument('pan_db', metavar = 'PAN_DB', help = "An anvi'o pan database of version %s" % current_version)
+    args, unknown = parser.parse_known_args()  # arguments the parser does not recognize land in `unknown` and are not used
+
+    try:
+        migrate(args.pan_db)
+    except ConfigError as e:
+        print(e)  # report the configuration error, then exit with a non-zero status
+        sys.exit(-1)
diff --git a/anvio/panops.py b/anvio/panops.py
index 5cf700d29a..824c2d5ac8 100644
--- a/anvio/panops.py
+++ b/anvio/panops.py
@@ -234,7 +234,7 @@ def check_params(self):
 
         if self.description_file_path:
             filesnpaths.is_file_plain_text(self.description_file_path)
-            self.description = open(os.path.abspath(self.description_file_path), 'rU').read()
+            self.description = open(os.path.abspath(self.description_file_path), 'r').read()
 
         self.pan_db_path = self.get_output_file_path(self.project_name + '-PAN.db')
 
diff --git a/anvio/parsers/kaiju.py b/anvio/parsers/kaiju.py
index 4d8f60e60b..057320a42a 100644
--- a/anvio/parsers/kaiju.py
+++ b/anvio/parsers/kaiju.py
@@ -62,7 +62,7 @@ def fix_input_file(self, input_file_path):
 
         corrected_temp_file_path = filesnpaths.get_temp_file_path()
         corrected_temp_file = open(corrected_temp_file_path, 'w')
-        input_file = open(input_file_path, 'rU')
+        input_file = open(input_file_path, 'r')
 
         num_correct_lines = 0
         for line in input_file.readlines():
diff --git a/anvio/profiler.py b/anvio/profiler.py
index 2a25ec3592..d2facf2a25 100644
--- a/anvio/profiler.py
+++ b/anvio/profiler.py
@@ -450,7 +450,7 @@ def init_dirs_and_dbs(self):
 
         if self.description_file_path:
             filesnpaths.is_file_plain_text(self.description_file_path)
-            self.description = open(os.path.abspath(self.description_file_path), 'rU').read()
+            self.description = open(os.path.abspath(self.description_file_path), 'r').read()
 
         if self.output_directory:
             self.output_directory = filesnpaths.check_output_directory(self.output_directory, ok_if_exists=self.overwrite_output_destinations)
diff --git a/anvio/programs.py b/anvio/programs.py
index b404d470a9..230f4c248d 100644
--- a/anvio/programs.py
+++ b/anvio/programs.py
@@ -55,7 +55,7 @@ def get_until_blank(output):
 
 
 def get_meta_information_from_file(file_path, meta_tag):
-    all_lines = [l.strip() for l in open(file_path, 'rU').readlines()]
+    all_lines = [l.strip() for l in open(file_path, 'r').readlines()]
 
     meta_tag_content = ''
 
diff --git a/anvio/samplesops.py b/anvio/samplesops.py
index f603df9779..814b0d96f4 100644
--- a/anvio/samplesops.py
+++ b/anvio/samplesops.py
@@ -50,7 +50,7 @@ def process_samples_information_file(self, samples_information_path):
         self.sample_names_in_samples_information_file = filesnpaths.is_proper_samples_information_file(samples_information_path)
 
         self.samples_information_dict, self.aliases_to_attributes_dict = self.convert_samples_information_dict(utils.get_TAB_delimited_file_as_dictionary(samples_information_path))
-        self.samples_information_default_layer_order = open(samples_information_path, 'rU').readline().strip().split('\t')[1:]
+        self.samples_information_default_layer_order = open(samples_information_path, 'r').readline().strip().split('\t')[1:]
 
         self.run.info('Samples information', 'Loaded for %d samples' % len(self.samples_information_dict), quiet=self.quiet)
 
@@ -122,7 +122,7 @@ def process_single_order_data(self, single_order_path, single_order_name):
 
         filesnpaths.is_file_plain_text(single_order_path)
 
-        single_order_file_content = [l.strip('\n') for l in open(single_order_path, 'rU').readlines()]
+        single_order_file_content = [l.strip('\n') for l in open(single_order_path, 'r').readlines()]
 
         if len(single_order_file_content) != 1:
             raise SamplesError("The single order file should contain a single line of information. It can't have nothing,\
diff --git a/anvio/structureops.py b/anvio/structureops.py
index aa47125fe2..d9a41fcaca 100755
--- a/anvio/structureops.py
+++ b/anvio/structureops.py
@@ -1968,7 +1968,7 @@ def get_path(self, gene_callers_id):
 
     def is_header_ok(self):
         headers_proper = ['gene_callers_id', 'path']
-        with open(self.path, 'rU') as input_file:
+        with open(self.path, 'r') as input_file:
             headers = input_file.readline().strip().split('\t')
             missing_headers = [h for h in headers_proper if h not in headers]
 
diff --git a/anvio/tables/__init__.py b/anvio/tables/__init__.py
index d344b0fd3b..ca6caf9b9a 100644
--- a/anvio/tables/__init__.py
+++ b/anvio/tables/__init__.py
@@ -14,10 +14,10 @@
 __email__ = "a.murat.eren@gmail.com"
 
 
-contigs_db_version = "21"
+contigs_db_version = "22"
 profile_db_version = "38"
 genes_db_version = "6"
-pan_db_version = "16"
+pan_db_version = "17"
 auxiliary_data_version = "2"
 structure_db_version = "2"
 genomes_storage_vesion = "7"
@@ -47,6 +47,14 @@
 pan_gene_clusters_table_structure      = ['gene_caller_id', 'gene_cluster_id', 'genome_name', 'alignment_summary']
 pan_gene_clusters_table_types          = [    'numeric'   ,      'str'       ,     'str'    ,        'str'       ]
 
+pan_gene_cluster_function_reactions_table_name        = 'gene_cluster_function_reactions'
+pan_gene_cluster_function_reactions_table_structure   = ['modelseed_reaction_id', 'modelseed_reaction_name', 'ko_kegg_reaction_source', 'ko_ec_number_source', 'other_kegg_reaction_ids', 'other_ec_numbers', 'metabolite_modelseed_ids', 'stoichiometry', 'compartments', 'reversibility']
+pan_gene_cluster_function_reactions_table_types       = [         'text'        ,            'text'        ,          'text'          ,         'text'       ,         'text'           ,       'text'      ,           'text'          ,      'text'    ,     'text'    ,      'bool'    ]
+
+pan_gene_cluster_function_metabolites_table_name      = 'gene_cluster_function_metabolites'
+pan_gene_cluster_function_metabolites_table_structure = ['modelseed_compound_id', 'modelseed_compound_name', 'kegg_aliases', 'formula', 'charge']
+pan_gene_cluster_function_metabolites_table_types     = [         'text'        ,           'text'         ,     'text'    ,   'text' , 'numeric']
+
 
 ####################################################################################################
 #
@@ -88,7 +96,7 @@
 
 gene_function_reactions_table_name        = 'gene_function_reactions'
 gene_function_reactions_table_structure   = ['modelseed_reaction_id', 'modelseed_reaction_name', 'ko_kegg_reaction_source', 'ko_ec_number_source', 'other_kegg_reaction_ids', 'other_ec_numbers', 'metabolite_modelseed_ids', 'stoichiometry', 'compartments', 'reversibility']
-gene_function_reactions_table_types       = [         'text'        ,            'text'        ,           'text'         ,         'text'       ,           'text'         ,       'text'      ,          'text'          ,      'text'    ,      'str'    ,      'bool'    ]
+gene_function_reactions_table_types       = [         'text'        ,            'text'        ,           'text'         ,         'text'       ,           'text'         ,       'text'      ,          'text'           ,      'text'    ,     'text'    ,      'bool'    ]
 
 gene_function_metabolites_table_name      = 'gene_function_metabolites'
 gene_function_metabolites_table_structure = ['modelseed_compound_id', 'modelseed_compound_name', 'kegg_aliases', 'formula', 'charge']
@@ -386,6 +394,8 @@
                                   'max_normalized_ratio_splits': False,
                                   'relative_abundance_splits': False,
                                   pan_gene_clusters_table_name: True,
+                                  pan_gene_cluster_function_reactions_table_name: False,
+                                  pan_gene_cluster_function_metabolites_table_name: False,
                                   genes_in_splits_table_name: True,
                                   gene_function_calls_table_name: True,
                                   gene_function_reactions_table_name: False,
diff --git a/anvio/tests/sandbox/data/genomes/archaea/S_islandicus_LS215.db b/anvio/tests/sandbox/data/genomes/archaea/S_islandicus_LS215.db
index 2997385630..11c6b2eee6 100644
Binary files a/anvio/tests/sandbox/data/genomes/archaea/S_islandicus_LS215.db and b/anvio/tests/sandbox/data/genomes/archaea/S_islandicus_LS215.db differ
diff --git a/anvio/tests/sandbox/data/genomes/bacteria/B_thetaiotamicron_VPI-5482.db b/anvio/tests/sandbox/data/genomes/bacteria/B_thetaiotamicron_VPI-5482.db
index 2cd632cfa3..730598c577 100644
Binary files a/anvio/tests/sandbox/data/genomes/bacteria/B_thetaiotamicron_VPI-5482.db and b/anvio/tests/sandbox/data/genomes/bacteria/B_thetaiotamicron_VPI-5482.db differ
diff --git a/anvio/tests/sandbox/data/genomes/bacteria/P_marinus_CCMP1375.db b/anvio/tests/sandbox/data/genomes/bacteria/P_marinus_CCMP1375.db
index 34fe388325..3725811952 100644
Binary files a/anvio/tests/sandbox/data/genomes/bacteria/P_marinus_CCMP1375.db and b/anvio/tests/sandbox/data/genomes/bacteria/P_marinus_CCMP1375.db differ
diff --git a/anvio/tests/sandbox/data/metagenomes/human_gut/IGD_SUBSET/CONTIGS.db b/anvio/tests/sandbox/data/metagenomes/human_gut/IGD_SUBSET/CONTIGS.db
index b64f94e24f..bc30523090 100644
Binary files a/anvio/tests/sandbox/data/metagenomes/human_gut/IGD_SUBSET/CONTIGS.db and b/anvio/tests/sandbox/data/metagenomes/human_gut/IGD_SUBSET/CONTIGS.db differ
diff --git a/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6240.db b/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6240.db
index 79fb7f4b5e..756c0cf40b 100644
Binary files a/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6240.db and b/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6240.db differ
diff --git a/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6255.db b/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6255.db
index 8e96191a12..bb8381021c 100644
Binary files a/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6255.db and b/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6255.db differ
diff --git a/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6512.db b/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6512.db
index 134561fade..a5f2a48e19 100644
Binary files a/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6512.db and b/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6512.db differ
diff --git a/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6557.db b/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6557.db
index e05447afd7..e1474104eb 100644
Binary files a/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6557.db and b/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6557.db differ
diff --git a/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6563.db b/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6563.db
index d74d0d2bb0..6243bba446 100644
Binary files a/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6563.db and b/anvio/tests/sandbox/mock_data_for_pangenomics/E_faecalis_6563.db differ
diff --git a/anvio/utils.py b/anvio/utils.py
index 4e599aaa3e..ab4c817b1a 100644
--- a/anvio/utils.py
+++ b/anvio/utils.py
@@ -850,7 +850,7 @@ def transpose_tab_delimited_file(input_file_path, output_file_path, remove_after
     filesnpaths.is_file_tab_delimited(input_file_path)
     filesnpaths.is_output_file_writable(output_file_path)
 
-    file_content = [line.strip('\n').split('\t') for line in open(input_file_path, 'rU').readlines()]
+    file_content = [line.strip('\n').split('\t') for line in open(input_file_path, 'r').readlines()]
 
     output_file = open(output_file_path, 'w')
     for entry in zip(*file_content):
@@ -1048,7 +1048,7 @@ def get_column_data_from_TAB_delim_file(input_file_path, column_indices=[], expe
     for index in column_indices:
         d[index] = []
 
-    with open(input_file_path, "rU") as input_file:
+    with open(input_file_path, "r") as input_file:
         for line in input_file.readlines():
             fields = line.strip('\n').split(separator)
 
@@ -1066,9 +1066,9 @@ def get_columns_of_TAB_delim_file(file_path, include_first_column=False):
     filesnpaths.is_file_exists(file_path)
 
     if include_first_column:
-        return open(file_path, 'rU').readline().strip('\n').split('\t')
+        return open(file_path, 'r').readline().strip('\n').split('\t')
     else:
-        return open(file_path, 'rU').readline().strip('\n').split('\t')[1:]
+        return open(file_path, 'r').readline().strip('\n').split('\t')[1:]
 
 
 def get_names_order_from_newick_tree(newick_tree, newick_format=1, reverse=False, names_with_only_digits_ok=False):
@@ -1081,10 +1081,24 @@ def get_names_order_from_newick_tree(newick_tree, newick_format=1, reverse=False
     return list(reversed(names)) if reverse else names
 
 
-def get_vectors_from_TAB_delim_matrix(file_path, cols_to_return=None, rows_to_return=[], transpose=False, pad_with_zeros=False):
+def get_vectors_from_TAB_delim_matrix(file_path, cols_to_return=None, rows_to_return=[], transpose=False, pad_with_zeros=False, run=run):
     filesnpaths.is_file_exists(file_path)
     filesnpaths.is_file_tab_delimited(file_path)
 
+    run.warning("Anvi'o is recovering your data from your TAB-delimited file, and it is"
+                "instructed to pad your input vectors with 0 values probably because you "
+                "used the flag `--pad-input-with-zeros` somewhere. Just so you know.")
+
+    if cols_to_return and pad_with_zeros:
+        raise ConfigError("Dear developer, you can't use `cols_to_return` and `pad_with_zeros` at the same "
+                          "time with this function. The `pad_with_zeros` header variable in this function "
+                          "is a mystery at this point. But the only way to be able to use it requires one "
+                          "to not use `cols_to_return`. More mystery .. but essentially this is a necessity "
+                          "because we have to update fields_of_interest value if pad_with_zeros is true, so "
+                          "anvi'o clustering step DOES NOT IGNORE THE LAST SAMPLE IN THE MATRIX BECUASE PAD "
+                          "WITH ZEROS SHIFT EVERYTHING, and we can't do it blindly if the programmer requests "
+                          "only specific columnts to be returned with `cols_to_return` :/")
+
     if transpose:
         transposed_file_path = filesnpaths.get_temp_file_path()
         transpose_tab_delimited_file(file_path, transposed_file_path)
@@ -1095,7 +1109,7 @@ def get_vectors_from_TAB_delim_matrix(file_path, cols_to_return=None, rows_to_re
     id_to_sample_dict = {}
     sample_to_id_dict = {}
 
-    input_matrix = open(file_path, 'rU')
+    input_matrix = open(file_path, 'r')
     columns = input_matrix.readline().strip('\n').split('\t')[1:]
 
     fields_of_interest = []
@@ -1114,19 +1128,23 @@ def get_vectors_from_TAB_delim_matrix(file_path, cols_to_return=None, rows_to_re
     id_counter = 0
     for line in input_matrix.readlines():
         row_name = line.strip().split('\t')[0]
+
         if rows_to_return and row_name not in rows_to_return:
-                continue
+            continue
+
         id_to_sample_dict[id_counter] = row_name
         fields = line.strip('\n').split('\t')[1:]
 
-        # long story.
+        # because stupid stuff. see warning above.
         if pad_with_zeros:
             fields = [0] + fields + [0]
+            fields_of_interest = list(range(0, len(fields)))
 
         try:
             if fields_of_interest:
                 vector = [float(fields[i]) if fields[i] != '' else None for i in fields_of_interest]
             else:
+                # the code will literally never enter here:
                 vector = [float(f) if f != '' else None for f in fields]
         except ValueError:
             raise ConfigError("Matrix should contain only numerical values.")
@@ -1489,7 +1507,7 @@ def get_gene_caller_ids_from_args(gene_caller_ids, delimiter=','):
     gene_caller_ids_set = set([])
     if gene_caller_ids:
         if os.path.exists(gene_caller_ids):
-            gene_caller_ids_set = set([g.strip() for g in open(gene_caller_ids, 'rU').readlines()])
+            gene_caller_ids_set = set([g.strip() for g in open(gene_caller_ids, 'r').readlines()])
         else:
             gene_caller_ids_set = set([g.strip() for g in gene_caller_ids.split(delimiter)])
 
@@ -1764,7 +1782,7 @@ def concatenate_files(dest_file, file_list, remove_concatenated_files=False):
 
     dest_file_obj = open(dest_file, 'w')
     for chunk_path in file_list:
-        for line in open(chunk_path, 'rU'):
+        for line in open(chunk_path, 'r'):
             dest_file_obj.write(line)
 
     dest_file_obj.close()
@@ -3547,7 +3565,7 @@ def get_TAB_delimited_file_as_dictionary(file_path, expected_fields=None, dict_t
     failed_lines = []
     column_mapping_for_line_failed = None
 
-    f = open(file_path, 'rU')
+    f = open(file_path, 'r')
 
     # learn the number of fields and reset the file:
     num_fields = len(f.readline().strip('\n').split(separator))
diff --git a/anvio/variabilityops.py b/anvio/variabilityops.py
index c116469a15..deb19b14e3 100644
--- a/anvio/variabilityops.py
+++ b/anvio/variabilityops.py
@@ -764,7 +764,7 @@ def sanity_check(self):
             filesnpaths.is_file_tab_delimited(self.genes_of_interest_path, expected_number_of_fields=1)
 
             try:
-                self.gene_caller_ids = [int(g.strip()) for g in open(self.genes_of_interest_path, 'rU').readlines()]
+                self.gene_caller_ids = [int(g.strip()) for g in open(self.genes_of_interest_path, 'r').readlines()]
             except:
                 raise ConfigError("The gene caller ids anvi'o found in that file does not seem like gene caller "
                                   "ids anvi'o would use. There is something wrong here :(")
diff --git a/anvio/workflows/__init__.py b/anvio/workflows/__init__.py
index ffae6b78dd..828dab9af0 100644
--- a/anvio/workflows/__init__.py
+++ b/anvio/workflows/__init__.py
@@ -333,7 +333,7 @@ def dry_run(self, workflow_graph_output_file_path_prefix='workflow'):
         # we are (it still may be better to do it elsewhere more appropriate .. so
         # we can look more decent or whatever):
         if self.save_workflow_graph:
-            lines = open(log_file_path, 'rU').readlines()
+            lines = open(log_file_path, 'r').readlines()
 
             try:
                 line_of_interest = [line_no for line_no in range(0, len(lines)) if lines[line_no].startswith('digraph')][0]
diff --git a/bin/anvi-export-structures b/bin/anvi-export-structures
index 147f82c346..0f059b74ed 100755
--- a/bin/anvi-export-structures
+++ b/bin/anvi-export-structures
@@ -38,7 +38,7 @@ def main(args):
         raise ConfigError("Pick one of --gene-caller-ids and --genes-of-interest")
     elif genes_of_interest_path:
         filesnpaths.is_file_exists(args.genes_of_interest)
-        genes_of_interest = set(int(g.strip()) for g in open(args.genes_of_interest, 'rU').readlines())
+        genes_of_interest = set(int(g.strip()) for g in open(args.genes_of_interest, 'r').readlines())
     elif gene_caller_ids:
         genes_of_interest = set(int(g) for g in gene_caller_ids.split(','))
     else:
diff --git a/bin/anvi-get-sequences-for-hmm-hits b/bin/anvi-get-sequences-for-hmm-hits
index b18183737d..f2fec99652 100755
--- a/bin/anvi-get-sequences-for-hmm-hits
+++ b/bin/anvi-get-sequences-for-hmm-hits
@@ -166,7 +166,7 @@ def main(args):
 
     # figure out gene names.. if the user provided a file, use that, otherwhise parse gene names out of the comma-separated text
     if args.gene_names and filesnpaths.is_file_exists(args.gene_names, dont_raise=True):
-        gene_names = [g.strip() for g in open(args.gene_names, 'rU').readlines()] if args.gene_names else []
+        gene_names = [g.strip() for g in open(args.gene_names, 'r').readlines()] if args.gene_names else []
     else:
         gene_names = [g.strip() for g in args.gene_names.split(',')] if args.gene_names else []
 
diff --git a/bin/anvi-help b/bin/anvi-help
index 40ab83fd56..4236526780 100755
--- a/bin/anvi-help
+++ b/bin/anvi-help
@@ -6,7 +6,7 @@ from anvio.argparse import ArgumentParser
 import textwrap
 import pandas as pd
 
-from colored import fore, back, style
+from colored import Fore, Back, Style
 from operator import itemgetter
 from itertools import groupby
 
@@ -32,11 +32,11 @@ __description__ = "Search for anvi\'o programs by keyword, inputs/outputs, etc"
 run = terminal.Run()
 progress = terminal.Progress()
 
-TABLE_BG = back.GREY_11
-TABLE_FG = fore.GREY_100
+TABLE_BG = Back.GREY_11
+TABLE_FG = Fore.GREY_100
 TABLE_STYLE = TABLE_BG + TABLE_FG
-HIGHLIGHT_BG = back.GREY_11
-HIGHLIGHT_FG = fore.GREEN
+HIGHLIGHT_BG = Back.GREY_11
+HIGHLIGHT_FG = Fore.GREEN
 HIGHLIGHT_STYLE = HIGHLIGHT_BG + HIGHLIGHT_FG
 COL_WIDTH = 20 # Does not apply to the description column, which is extended if possible to fill terminal width
 
@@ -100,7 +100,7 @@ class ProgramSearch:
 
 
     def process(self):
-        if sys.stdout.encoding != "UTF-8":
+        if sys.stdout.encoding.lower() != "utf-8":
             run.warning("Sorry :/ The encoding of your terminal is not UTF-8, and as a result you will "
                         "not see anything but gibberish from displaying the nice table anvi'o will "
                         "put together for you. Aborting mission.")
@@ -231,7 +231,7 @@ class ProgramSearch:
                 self.highlight_matches()
                 tabulated = tabulate(self.table_as_string, headers='keys', showindex=False, tablefmt="fancy_grid")
 
-        print('\n' + TABLE_STYLE + tabulated + style.RESET)
+        print('\n' + TABLE_STYLE + tabulated + Style.RESET)
 
         run.info('Number of programs matching', self.table.shape[0], nl_before=1)
 
diff --git a/bin/anvi-matrix-to-newick b/bin/anvi-matrix-to-newick
index 2bea91d658..b03532fadf 100755
--- a/bin/anvi-matrix-to-newick
+++ b/bin/anvi-matrix-to-newick
@@ -35,7 +35,7 @@ def main(args):
 
     # a quick check of the data to see if there are any missing
     # values
-    _, _, _, vectors = utils.get_vectors_from_TAB_delim_matrix(args.input_matrix)
+    _, _, _, vectors = utils.get_vectors_from_TAB_delim_matrix(args.input_matrix, run=run)
     num_missing_data = len([item for sublist in vectors for item in sublist if item == None])
     if num_missing_data:
         run.warning(f"Oy. Your file contains {PL('missing data item', num_missing_data)}. Anvi'o will do its "
@@ -46,7 +46,7 @@ def main(args):
     progress.new('Analyzing input file')
     clustering.create_newick_file_from_matrix_file(args.input_matrix, args.output_file, linkage=args.linkage,
                                     distance=args.distance, transpose=args.transpose, progress=progress,
-                                    items_order_file_path=args.items_order_file, pad_with_zeros=True)
+                                    items_order_file_path=args.items_order_file, pad_with_zeros=args.pad_input_with_zeros)
     progress.end()
     run.info('Output newick', args.output_file)
     if args.items_order_file:
@@ -72,7 +72,12 @@ if __name__ == '__main__':
     groupC.add_argument(*anvio.A('transpose'), **anvio.K('transpose'))
     groupC.add_argument(*anvio.A('distance'), **anvio.K('distance'))
     groupC.add_argument(*anvio.A('linkage'), **anvio.K('linkage'))
-
+    groupC.add_argument('--pad-input-with-zeros', default=False, action="store_true",
+                        help="Do you want your vectors in the input file to be 'padded' by some zero values "
+                             "so even hideous matrix files that contain entries with all empty values can be "
+                             "processed with this program? Well, this flag will try to make things work for "
+                             "you. But you must know that this is one of those cases where 'if you have to "
+                             "use this then you have not one but two problems'.")
     try:
         args = parser.get_args(parser)
         main(args)
diff --git a/bin/anvi-reaction-network b/bin/anvi-reaction-network
index 9f89aa5215..099c63b753 100755
--- a/bin/anvi-reaction-network
+++ b/bin/anvi-reaction-network
@@ -24,29 +24,84 @@ __description__ = "Generate a metabolic reaction network in an anvi'o contigs da
 def main() -> None:
     args = get_args()
     constructor = Constructor(ko_dir=args.ko_dir, modelseed_dir=args.modelseed_dir)
-    constructor.make_network(contigs_db=args.contigs_db, overwrite_existing_network=args.overwrite_existing_network)
+    if args.contigs_db:
+        constructor.make_network(
+            contigs_db=args.contigs_db,
+            overwrite_existing_network=args.overwrite_existing_network
+        )
+    elif args.pan_db or args.genomes_storage:
+        constructor.make_network(
+            pan_db=args.pan_db,
+            genomes_storage_db=args.genomes_storage,
+            overwrite_existing_network=args.overwrite_existing_network,
+            consensus_threshold=args.consensus_threshold,
+            discard_ties=args.discard_ties
+        )
+    else:
+        raise ConfigError(
+            "Either a contigs database (`--contigs-db`) OR a pan database (`--pan-db`) and genomes "
+            "storage database (`--genomes-storage`) must be provided to make a (meta)genomic or "
+            "pangenomic reaction network, respectively."
+        )
 
 def get_args() -> Namespace:
     parser = ArgumentParser(description=__description__)
-    parser.add_argument(*A('contigs-db'), **K('contigs-db'))
-    parser.add_argument(
+
+    groupA = parser.add_argument_group(
+        "SINGLE GENOME OR METAGENOME INPUT",
+        "Generate a reaction network from a contigs database, and store the network in the database."
+    )
+    groupA.add_argument(*A('contigs-db'), **K('contigs-db', {'required': False}))
+
+    groupB = parser.add_argument_group(
+        "PANGENOME INPUT",
+        "Generate a reaction network from a pan database and genomes storage database, "
+        "and store the network in the pan database."
+    )
+    groupB.add_argument(*A('pan-db'), **K('pan-db', {'required': False}))
+    groupB.add_argument(*A('genomes-storage'), **K('genomes-storage', {'required': False}))
+    groupB.add_argument(
+        '--consensus-threshold', default=None, type=float,
+        help=(
+            "If this argument is provided, then a protein annotation must be assigned to this "
+            "minimum proportion of genes in a cluster to be imputed to the cluster as a whole. "
+            "By default, without this argument, the annotation assigned to the most genes becomes "
+            "the annotation of the cluster (also see --discard-ties). The consensus threshold must "
+            "be a number from 0 to 1."
+        )
+    )
+    groupB.add_argument(
+        '--discard-ties', default=False, action='store_true',
+        help=(
+            "By default, a gene cluster is assigned a protein annotation by finding the protein "
+            "ortholog that occurs in the greatest number of genes in the cluster (see "
+            "--consensus-threshold) and arbitrarily choosing one ortholog in case of a tie. With "
+            "this flag, a tie instead results in an ortholog annotation not being assigned to the cluster."
+        )
+    )
+
+    groupC = parser.add_argument_group("DATABASE", "KEGG and ModelSEED reference database information")
+    groupC.add_argument(
         '--ko-dir', type=str, metavar='PATH',
         help=(
             "Path to KEGG KO database directory. If this option is not used, the program expects a "
             "database set up in the default location used by 'anvi-setup-kegg-data'."
         )
     )
-    parser.add_argument(
+    groupC.add_argument(
         '--modelseed-dir', type=str, metavar='PATH',
         help=(
             "Path to ModelSEED Biochemistry database directory. If this option is not used, the program "
             "expects a database set up in the default location used by 'anvi-setup-modelseed-database'."
         )
     )
-    parser.add_argument(
+
+    groupD = parser.add_argument_group("OTHER OPTIONS")
+    groupD.add_argument(
         '--overwrite-existing-network', default=False, action='store_true',
         help="Overwrite an existing reaction network in the database with the newly computed network."
     )
+
     args = parser.get_args(parser)
     return args
 
diff --git a/bin/anvi-report-inversions b/bin/anvi-report-inversions
index 372e234c5c..809824a77a 100755
--- a/bin/anvi-report-inversions
+++ b/bin/anvi-report-inversions
@@ -44,7 +44,7 @@ if __name__ == '__main__':
                     "parameters there.")
     groupB.add_argument(*anvio.A('pre-computed-inversions'), **anvio.K('pre-computed-inversions'))
 
-    groupC = parser.add_argument_group('KEY ALGORITHMIC COMPONENT 01: IDENTIFYING REGIONS OF INTERSET', "How should anvi'o identify regions of interest "
+    groupC = parser.add_argument_group('KEY ALGORITHMIC COMPONENT 01: IDENTIFYING REGIONS OF INTEREST', "How should anvi'o identify regions of interest "
                     "based on REV/REV and FWD/FWD paired-end reads? Defaults will be good for most cases.")
     groupC.add_argument('--min-coverage-to-define-stretches', default=10, type=int, help="Value to break up contigs into 'stretches' of "
                     "high-coverage regions of FWD/FWD and REV/REV reads. The lower the value, the more noise. This acts as a low-pass "
@@ -93,17 +93,17 @@ if __name__ == '__main__':
                     "in almost all instances (since anvi'o at this stage is only focusing on very specific "
                     "regions of genomes). But this parameter is here in case you insist on only using inverted "
                     "paired-end reads and assert your authority. You do you and turn on the flag, you rebellious "
-                    "scientist who will likely miss a lot of additoinal inversions like a boss.")
+                    "scientist who will likely miss a lot of additional inversions like a boss.")
 
     groupF = parser.add_argument_group('KEY ALGORITHMIC COMPONENT 04: COMPUTING INVERSION ACTIVITY', "What is the "
                     "proportion of invertible repeat orientation across samples? A two million dollars question "
                     "that anvi'o WILL answer for you IF you have `r1` and `r2` columns in your `bams-and-profiles-txt` "
                     "file that points to raw FASTQ reads you have used to generate your BAM files for each sample. "
-                    "Truly cray stuff.")
+                    "Truly crazy stuff.")
     groupF.add_argument(*anvio.A('num-threads'), **anvio.K('num-threads'))
     groupF.add_argument('--oligo-primer-base-length', default=12, type=int, help="Calculating inversion ratios "
-                    "require anvi'o to 'design' an in silico primer based on palindromes associated with inersions "
-                    "and the upstream/downstream genomic context to search for short reads in raw sequenicng data"
+                    "require anvi'o to 'design' an in silico primer based on palindromes associated with inversions "
+                    "and the upstream/downstream genomic context to search for short reads in raw sequencing data "
                     "to find the ratio of inversion activity per sample. This variable is to control how much of "
                     "the palindrome for a given inversion should be used to build a primer to search for short "
                     "reads. The longer it is, the more specific the primers will be to survey short reads. But if "
@@ -119,8 +119,12 @@ if __name__ == '__main__':
                     "datasets, primer search can take a very long time. By setting a small integer here, you can ask "
                     "anvi'o to stop searching primers after a few hits. Once the total number of primer hits reach to "
                     "number for a given sample, anvi'o will stop searching further and continue with the next sample. "
-                    "This flag is only good for testing, since it will prematurely end the search without testting "
+                    "This flag is only good for testing, since it will prematurely end the search without testing "
                     "all primers")
+    groupF.add_argument('--min-frequency-to-report', default=1, type=int, help="By default, anvi'o will only report "
+                    "primers supported by more than one read from the `r1` and `r2` entry in your `bams-and-profiles-txt`. "
+                    "The reason for this filtering is sequencing errors, which can create very low frequency "
+                    "entries in the activity report. Use this flag to change that minimum threshold.")
 
     groupG = parser.add_argument_group('KEY ALGORITHMIC COMPONENT 05: REPORTING GENOMIC CONTEXT AROUND INVERSIONS',
                     "Once the consensus inversions are computed, anvi'o can go back to contigs on which they are "
diff --git a/bin/anvi-setup-user-modules b/bin/anvi-setup-user-modules
index 87025a3a3c..14604a774f 100755
--- a/bin/anvi-setup-user-modules
+++ b/bin/anvi-setup-user-modules
@@ -26,7 +26,7 @@ def main(args):
     args.download_from_kegg = None
 
     setup = kegg.KeggSetup(args)
-    setup.setup_data()
+    setup.setup_user_data()
 
 if __name__ == '__main__':
     from anvio.argparse import ArgumentParser