# Source code for cobra.medium.minimal_medium

"""Provide functions and helpers to obtain minimal growth media."""

import logging
from typing import TYPE_CHECKING, Iterable, Union

import pandas as pd
from optlang.interface import OPTIMAL
from optlang.symbolics import Zero

from .boundary_types import find_boundary_types


if TYPE_CHECKING:
    from cobra import Model, Reaction


# Module-level logger used by every function in this file.
logger = logging.getLogger(__name__)
def add_linear_obj(model: "Model") -> None:
    r"""Add a linear version of a minimal medium to the model solver.

    Changes the optimization objective to finding the growth medium requiring
    the smallest total import flux:

    .. math::

        \text{minimize} \sum_{r_i \in \text{import reactions}} |r_i|

    Parameters
    ----------
    model : cobra.Model
        The cobra model to modify. Its objective is changed in place: the
        linear coefficients are set and the direction becomes ``"min"``.

    """
    coefs = {}
    for rxn in find_boundary_types(model, "exchange"):
        # Exchanges with exactly one reactant are treated as written in the
        # export direction, so their reverse variable carries the import.
        is_export = len(rxn.reactants) == 1
        import_var = rxn.reverse_variable if is_export else rxn.forward_variable
        coefs[import_var] = 1
    model.objective.set_linear_coefficients(coefs)
    model.objective.direction = "min"
def add_mip_obj(model: "Model") -> None:
    """Add a mixed-integer version of a minimal medium to the model.

    Changes the optimization objective to finding the medium with the least
    components::

        minimize size(R) where R part of import_reactions

    For every exchange reaction a binary indicator variable ``ind_<rxn.id>``
    and a constraint ``ind_constraint_<rxn.id>`` are added to the model; the
    objective then minimizes the sum of the indicators.

    Parameters
    ----------
    model : cobra.Model
        The model to modify.

    """
    if len(model.variables) > 1e4:
        logger.warning(
            "The MIP version of minimal media is extremely slow for "
            "models that large :("
        )

    exchange_rxns = find_boundary_types(model, "exchange")
    # Big-M constant: the largest absolute bound over all exchanges.
    # ``default=0`` keeps a model without exchange reactions from raising
    # ``ValueError`` on an empty sequence; nothing is added in that case.
    # NOTE(review): an infinite bound would make big_m infinite - confirm that
    # callers always use finite exchange bounds.
    big_m = max((abs(b) for r in exchange_rxns for b in r.bounds), default=0)

    prob = model.problem
    coefs = {}
    to_add = []
    for rxn in exchange_rxns:
        is_export = len(rxn.reactants) == 1
        indicator = prob.Variable("ind_" + rxn.id, lb=0, ub=1, type="binary")
        # Same import-direction rule as the linear objective: reverse variable
        # for reactions with a single reactant, forward variable otherwise.
        import_var = rxn.reverse_variable if is_export else rxn.forward_variable
        # import_var <= indicator * big_m, i.e. the import can only carry flux
        # when its indicator is switched on.
        indicator_const = prob.Constraint(
            import_var - indicator * big_m,
            ub=0,
            name="ind_constraint_" + rxn.id,
        )
        to_add.extend([indicator, indicator_const])
        coefs[indicator] = 1

    model.add_cons_vars(to_add)
    model.solver.update()
    model.objective.set_linear_coefficients(coefs)
    model.objective.direction = "min"
def _as_medium(
    exchanges: Iterable["Reaction"], tolerance: float = 1e-6, exports: bool = False
) -> pd.Series:
    """Convert a solution to medium.

    Parameters
    ----------
    exchanges : iterable of cobra.Reaction
        The exchange reactions to consider.
    tolerance : float > 0, optional
        The absolute tolerance for fluxes. Fluxes with an absolute value
        smaller than this number will be ignored (default 1e-6).
    exports : bool, optional
        Whether to return export fluxes as well (default False).

    Returns
    -------
    pandas.Series
        The "medium", meaning all active import fluxes in the solution,
        indexed by reaction ID and stored as floats. Imports are positive;
        exports (only present if `exports` is True) are negative.

    """
    logger.debug("Formatting medium.")
    # Collect into a dict first: growing a Series one label at a time copies
    # the data on every assignment.
    fluxes = {}
    for rxn in exchanges:
        flux = rxn.flux
        if abs(flux) < tolerance:
            continue
        # Reactions with a single reactant are treated as written in the
        # export direction, so the sign is flipped to orient towards import.
        is_export = len(rxn.reactants) == 1
        fluxes[rxn.id] = -flux if is_export else flux

    # An explicit dtype keeps an empty medium numeric instead of object-typed.
    medium = pd.Series(fluxes, dtype=float)
    if not exports:
        medium = medium[medium > 0]

    return medium
def minimal_medium(
    model: "Model",
    min_objective_value: float = 0.1,
    exports: bool = False,
    minimize_components: Union[bool, int] = False,
    open_exchanges: Union[bool, float] = False,
) -> Union[pd.Series, pd.DataFrame, None]:
    """Find the minimal growth medium for the `model`.

    Finds the minimal growth medium for the `model` which still allows the
    objective to reach at least `min_objective_value`. Here, a minimal medium
    can either be the medium requiring the smallest total import flux or the
    medium requiring the least components (ergo ingredients), which will be
    much slower due to being a mixed integer problem (MIP).

    All modifications are made inside a ``with model`` context, so the model
    is only changed for the duration of the call.

    Parameters
    ----------
    model : cobra.Model
        The model to analyze.
    min_objective_value : float > 0, optional
        The minimum growth rate (objective) that has to be achieved
        (default 0.1).
    exports : bool, optional
        Whether to include export fluxes in the returned medium. Defaults to
        False which will only return import fluxes (default False).
    minimize_components : bool or int > 0, optional
        Whether to minimize the number of components instead of the total
        import flux. Might be more intuitive if set to True, but may also be
        slow to calculate for large models. If set to a number `n` will
        return up to `n` alternative solutions all with the same number of
        components (default False).
    open_exchanges : bool or number, optional
        Whether to ignore currently set bounds and make all exchange
        reactions in the `model` possible. If True, exchanges are opened with
        (-1000, 1000) as bounds. If set to a `number`, all exchange reactions
        will be opened with (-`number`, `number`) as bounds (default False).

    Returns
    -------
    pandas.Series, pandas.DataFrame or None
        A pandas.Series giving the import flux for each required import
        reaction and (optionally) the associated export fluxes. All exchange
        fluxes are oriented into the import reaction e.g. positive fluxes
        denote imports and negative fluxes exports. If `minimize_components`
        is a number larger than 1, may return a pandas.DataFrame where each
        column is a minimal medium. Returns None, if the minimization is
        infeasible (for instance if `min_objective_value` is larger than the
        maximum growth rate).

    Notes
    -----
    Due to numerical issues, the `minimize_components` option will usually
    only minimize the number of "large" import fluxes. Specifically, the
    detection limit is given by ``integrality_tolerance * max_bound`` where
    ``max_bound`` is the largest bound on an import reaction. Thus, if you are
    interested in small import fluxes as well you may have to adjust the
    solver tolerance at first with `model.tolerance = 1e-7` for instance.
    However, this will be *very* slow for large models especially with GLPK.

    """
    exchange_rxns = find_boundary_types(model, "exchange")
    # ``True`` means "open with the default bound"; any other truthy value is
    # taken as the bound itself.
    open_bound = 1000 if isinstance(open_exchanges, bool) else open_exchanges

    with model as mod:
        if open_exchanges:
            logger.debug(f"Opening exchanges for {len(exchange_rxns)} imports.")
            for rxn in exchange_rxns:
                rxn.bounds = (-open_bound, open_bound)

        logger.debug("Applying objective value constraints.")
        # Freeze the original objective as a lower-bounded constraint before
        # replacing it with the medium-minimizing objective.
        obj_const = mod.problem.Constraint(
            mod.objective.expression,
            lb=min_objective_value,
            name="medium_obj_constraint",
        )
        mod.add_cons_vars([obj_const])
        mod.solver.update()
        mod.objective = Zero

        logger.debug("Adding new media objective.")
        tol = mod.solver.configuration.tolerances.feasibility

        if minimize_components:
            add_mip_obj(mod)
            # ``True`` asks for a single solution; an int asks for up to that
            # many alternative media.
            if isinstance(minimize_components, bool):
                max_media = 1
            else:
                max_media = minimize_components

            seen = set()
            best = mod.slim_optimize()
            if mod.solver.status != OPTIMAL:
                logger.warning("Minimization of medium was infeasible.")
                return None

            # Starts as the trivial ``0 <= 0``; it is tightened below to rule
            # out media made up only of already reported components.
            exclusion = mod.problem.Constraint(Zero, ub=0)
            mod.add_cons_vars([exclusion])
            mod.solver.update()

            media = []
            for i in range(max_media):
                logger.info(f"Finding alternative medium #{(i + 1)}.")
                if seen:
                    indicators = [mod.variables["ind_" + s] for s in seen]
                    exclusion.set_linear_coefficients(dict.fromkeys(indicators, 1))
                    # At most ``best - 1`` previously seen components may be
                    # reused, forcing at least one new component.
                    exclusion.ub = best - 1
                num_components = mod.slim_optimize()
                if mod.solver.status != OPTIMAL or num_components > best:
                    if i == 0:
                        logger.warning(
                            "Could not get an optimal solution. "
                            "This is usually due to numerical instability. "
                            "Possible remedies are relaoding the model "
                            "from scratch, switching to a different solver, "
                            "or decreasing the solver tolerance. Please, "
                            "carefully read the note on numerical instability "
                            "in the function documentation."
                        )
                        return None
                    # No further alternative of the same size exists.
                    break
                medium = _as_medium(exchange_rxns, tol, exports=exports)
                media.append(medium)
                seen.update(medium[medium > 0].index)

            if len(media) > 1:
                # One column per alternative medium; components missing from
                # a medium get a flux of 0.
                medium = pd.concat(media, axis=1, sort=True).fillna(0.0)
                medium.sort_index(axis=1, inplace=True)
            else:
                medium = media[0]
        else:
            add_linear_obj(mod)
            mod.slim_optimize()
            if mod.solver.status != OPTIMAL:
                logger.warning("Minimization of medium was infeasible.")
                return None
            medium = _as_medium(exchange_rxns, tol, exports=exports)

    return medium