# Source code for bw2calc.monte_carlo

# -*- coding: utf-8 -*-
from __future__ import print_function, unicode_literals, division
from eight import *
from future.utils import implements_iterator

from .lca import LCA
from .utils import clean_databases, get_seed
from bw2data import projects
from contextlib import contextmanager
from scipy.sparse.linalg import cgs
from stats_arrays.random import MCRandomNumberGenerator
import multiprocessing
import platform
import sys
import warnings

try:
    from pypardiso import spsolve
except ImportError:
    from scipy.sparse.linalg import spsolve


if sys.version_info < (3, 0):
    # ``multiprocessing.Pool`` is not available as a context manager in
    # Python 2.7, so wrap it in one that terminates the pool on exit.
    @contextmanager
    def pool_adapter(pool):
        """Yield ``pool`` and terminate it when the ``with`` block exits."""
        try:
            yield pool
        finally:
            pool.terminate()

else:
    def pool_adapter(x):
        """Return the pool ``x`` unchanged so it is used directly in ``with``."""
        return x


@implements_iterator
class IterativeMonteCarlo(LCA):
    """Base class to use iterative techniques instead of `LU factorization <http://en.wikipedia.org/wiki/LU_decomposition>`_ in Monte Carlo.

    Instances are iterators and are also callable; both forms delegate to
    ``__next__``, which subclasses must implement.

    Args:
        * ``demand``: Demand passed through to ``LCA.__init__``.
        * ``method``: Optional LCIA method; ``self.lcia`` is true when given.
        * ``iter_solver``: Iterative solver called in ``solve_linear_system``
          (default ``scipy.sparse.linalg.cgs``). A falsy value forces the
          direct solver on every call.
        * ``seed``: Seed for the random number generators. A falsy value is
          replaced with the result of ``get_seed()``.

    Remaining positional and keyword arguments are forwarded to
    ``LCA.__init__``.

    """
    def __init__(self, demand, method=None, iter_solver=cgs,
                 seed=None, *args, **kwargs):
        # The seed is resolved before calling the parent so the same value
        # can be handed to it.
        self.seed = seed or get_seed()
        super(IterativeMonteCarlo, self).__init__(demand, method=method,
                                                  seed=self.seed, *args, **kwargs)
        self.iter_solver = iter_solver
        # Starting vector for the iterative solver; filled by the first
        # direct solve in ``solve_linear_system``.
        self.guess = None
        self.lcia = method is not None
        self.logger.info("Seeded RNGs", extra={'seed': self.seed})

    def __iter__(self):
        return self

    def __call__(self):
        return next(self)

    def __next__(self):
        """Produce the next Monte Carlo result; must be overridden.

        Raises:
            NotImplementedError: Always, in this base class.

        """
        # ``NotImplemented`` is a comparison sentinel, not an exception;
        # raising it produces a ``TypeError`` on Python 3.
        raise NotImplementedError

    def solve_linear_system(self):
        """Solve the technosphere system for the current demand array.

        When ``iter_solver`` is falsy or no guess has been stored yet, the
        direct ``spsolve`` is used and its result is stored in ``self.guess``.
        Otherwise ``iter_solver`` is called with ``self.guess`` as ``x0``; if
        it reports a non-zero status, the direct solver is used instead.

        Returns the solution vector.

        """
        if not self.iter_solver or self.guess is None:
            self.guess = spsolve(
                self.technosphere_matrix,
                self.demand_array)
            return self.guess

        # NOTE(review): ``atol='legacy'`` appears to be accepted only by
        # older SciPy releases - confirm against the SciPy version in use.
        solution, status = self.iter_solver(
            self.technosphere_matrix,
            self.demand_array,
            x0=self.guess,
            atol='legacy',
            maxiter=1000)
        if status != 0:
            # The iterative solver did not report success; fall back to
            # the direct solver.
            return spsolve(
                self.technosphere_matrix,
                self.demand_array
            )
        return solution





class DirectSolvingMixin(IterativeMonteCarlo):
    """Variant that bypasses the iterative solver of ``IterativeMonteCarlo``."""

    def solve_linear_system(self):
        """Return the result of ``LCA.solve_linear_system`` for this instance."""
        return LCA.solve_linear_system(self)




@implements_iterator
class MonteCarloLCA(IterativeMonteCarlo):
    """Monte Carlo uncertainty analysis with separate `random number generators <http://en.wikipedia.org/wiki/Random_number_generation>`_ (RNGs) for each set of parameters."""

    def load_data(self):
        """Load the parameter arrays and create one RNG per parameter set.

        Technosphere and biosphere RNGs are always created. The
        characterization RNG is created only when ``self.lcia`` is true, and
        the weighting RNG only when ``self.weighting`` is truthy. Every RNG is
        constructed with ``self.seed``. If presamples are present, their
        sequential indices are reset.

        """
        self.load_lci_data()
        self.tech_rng = MCRandomNumberGenerator(self.tech_params, seed=self.seed)
        self.bio_rng = MCRandomNumberGenerator(self.bio_params, seed=self.seed)
        if self.lcia:
            self.load_lcia_data()
            self.cf_rng = MCRandomNumberGenerator(self.cf_params, seed=self.seed)
        if self.weighting:
            self.load_weighting_data()
            self.weighting_rng = MCRandomNumberGenerator(self.weighting_params, seed=self.seed)
        if self.presamples:
            self.presamples.reset_sequential_indices()

    def __next__(self):
        """Run one Monte Carlo iteration.

        Returns ``self.score`` when an LCIA method was given, otherwise
        ``self.supply_array``.

        """
        # Data and RNGs are loaded lazily on the first iteration.
        if not hasattr(self, "tech_rng"):
            self.load_data()

        # Draw a fresh sample for each matrix.
        self.rebuild_technosphere_matrix(self.tech_rng.next())
        self.rebuild_biosphere_matrix(self.bio_rng.next())
        if self.lcia:
            self.rebuild_characterization_matrix(self.cf_rng.next())
        if self.weighting:
            self.weighting_value = self.weighting_rng.next()

        # Presamples are applied after the matrices have been rebuilt.
        if self.presamples:
            self.presamples.update_matrices()

        if not hasattr(self, "demand_array"):
            self.build_demand_array()

        self.lci_calculation()
        if not self.lcia:
            return self.supply_array

        self.lcia_calculation()
        if self.weighting:
            self.weighting_calculation()
        return self.score




class DirectSolvingMonteCarloLCA(MonteCarloLCA, DirectSolvingMixin):
    """``MonteCarloLCA`` whose ``solve_linear_system`` comes from ``DirectSolvingMixin``.

    ``MonteCarloLCA`` does not define ``solve_linear_system`` itself, so the
    mixin's version is found before the one on ``IterativeMonteCarlo``.

    """



@implements_iterator
class ComparativeMonteCarlo(IterativeMonteCarlo):
    """First draft approach at comparative LCA.

    Args:
        * ``demands``: Sequence of demand dictionaries to compare. Each
          iteration scores every demand against the same sampled matrices.

    Remaining positional and keyword arguments are forwarded to
    ``IterativeMonteCarlo.__init__``.

    """
    def __init__(self, demands, *args, **kwargs):
        self.demands = demands
        # Get all possibilities for database retrieval: merge every demand
        # into one dictionary and hand that to the parent class.
        demand_all = demands[0].copy()
        for other in demands[1:]:
            demand_all.update(other)
        super(ComparativeMonteCarlo, self).__init__(demand_all, *args, **kwargs)

    def load_data(self):
        """Load LCI and LCIA data and create the three RNGs.

        Raises:
            ValueError: If no LCIA method is set on the instance.

        """
        # A default is supplied so that a missing attribute produces the
        # intended ``ValueError`` rather than an ``AttributeError``.
        if not getattr(self, "method", None):
            raise ValueError("Must specify an LCIA method")

        self.load_lci_data()
        self.load_lcia_data()
        self.tech_rng = MCRandomNumberGenerator(self.tech_params, seed=self.seed)
        self.bio_rng = MCRandomNumberGenerator(self.bio_params, seed=self.seed)
        self.cf_rng = MCRandomNumberGenerator(self.cf_params, seed=self.seed)

    def __next__(self):
        """Run one iteration and return a list with one score per demand.

        The scores are in the same order as ``self.demands``.

        """
        # Data and RNGs are loaded lazily on the first iteration.
        if not hasattr(self, "tech_rng"):
            self.load_data()
        self.rebuild_technosphere_matrix(self.tech_rng.next())
        self.rebuild_biosphere_matrix(self.bio_rng.next())
        self.rebuild_characterization_matrix(self.cf_rng.next())

        if self.presamples:
            self.presamples.update_matrices()

        # Matrices are sampled once above; only the demand changes here.
        results = []
        for demand in self.demands:
            self.build_demand_array(demand)
            self.lci_calculation()
            self.lcia_calculation()
            results.append(self.score)
        return results




def single_worker(args):
    """Run a batch of Monte Carlo iterations with ``MonteCarloLCA``.

    ``args`` are in order:
        * ``project``: Name of project
        * ``demand``: Demand dictionary
        * ``method``: LCIA method
        * ``iterations``: Number of iterations to run

    Returns a list with one result per iteration.

    """
    project, demand, method, iterations = args
    # The project is opened read-only.
    projects.set_current(project, writable=False)
    mc = MonteCarloLCA(demand=demand, method=method)
    return [next(mc) for _ in range(iterations)]




def direct_solving_worker(args):
    """Run a batch of Monte Carlo iterations with ``DirectSolvingMonteCarloLCA``.

    ``args`` are in order:
        * ``project``: Name of project
        * ``demand``: Demand dictionary
        * ``method``: LCIA method
        * ``iterations``: Number of iterations to run

    Returns a list with one result per iteration.

    """
    project, demand, method, iterations = args
    # The project is opened read-only.
    projects.set_current(project, writable=False)
    mc = DirectSolvingMonteCarloLCA(demand=demand, method=method)
    return [next(mc) for _ in range(iterations)]




class ParallelMonteCarlo(object):
    """Split a Monte Carlo calculation into parallel jobs.

    Args:
        * ``demand``: Demand dictionary passed to each worker
        * ``method``: LCIA method passed to each worker
        * ``iterations``: Number of Monte Carlo iterations desired
        * ``chunk_size``: Optional number of iterations per job
        * ``cpus``: Optional number of worker processes; defaults to
          ``multiprocessing.cpu_count()``
        * ``log_config``: Accepted but not used by this class

    Every job runs ``chunk_size`` iterations, so ``calculate`` returns
    ``num_jobs * chunk_size`` results, which can be more than ``iterations``.

    """
    def __init__(self, demand, method, iterations=1000, chunk_size=None,
                 cpus=None, log_config=None):
        if platform.system() in ("Windows", "Darwin"):
            message = (
                "The ParallelMonteCarlo class is deprecated; as of Python 3.8 it doesn't "
                "work reliably on Windows or MacOS, and doesn't offer speed advantages "
                "when using the Pardiso solver"
            )
            # ``stacklevel=2`` attributes the warning to the code that
            # instantiated the class instead of to this module.
            warnings.warn(message, DeprecationWarning, stacklevel=2)

        clean_databases()
        self.demand = demand
        self.method = method
        self.cpus = cpus or multiprocessing.cpu_count()

        if chunk_size:
            # Fixed chunk size: use enough jobs to cover all iterations,
            # adding one job for any remainder.
            self.chunk_size = chunk_size
            full_jobs, leftover = divmod(iterations, chunk_size)
            self.num_jobs = full_jobs + 1 if leftover else full_jobs
        else:
            # One job per worker process.
            self.num_jobs = self.cpus
            self.chunk_size = (iterations // self.num_jobs) + 1

    def calculate(self, worker=single_worker):
        """Run all jobs in a process pool and return a flat list of results.

        ``worker`` is called once per job with a
        ``(project, demand, method, chunk_size)`` tuple and must return a list.

        """
        job_args = [
            (projects.current, self.demand, self.method, self.chunk_size)
            for _ in range(self.num_jobs)
        ]
        with pool_adapter(multiprocessing.Pool(processes=self.cpus)) as pool:
            results = pool.map(worker, job_args)
        # Flatten the per-job lists into one list.
        return [x for lst in results for x in lst]





def multi_worker(args):
    """Calculate a single Monte Carlo iteration for many demands.

    ``args`` are in order:
        * ``project``: Name of project
        * ``demands``: List of demand dictionaries
        * ``method``: LCIA method

    Returns a list of results: ``[(demand dictionary, result)]``

    """
    project, demands, method = args
    # The project is opened read-only.
    projects.set_current(project, writable=False)
    mc = MonteCarloLCA(demands[0], method)
    # Run one Monte Carlo iteration; each demand is then scored by
    # ``redo_lcia`` without drawing a new sample here.
    next(mc)
    results = []
    for demand in demands:
        mc.redo_lcia(demand)
        results.append((demand, mc.score))
    return results




class MultiMonteCarlo(object):
    """
    This is a class for the efficient calculation of *many* demand vectors
    from each Monte Carlo iteration.

    Args:
        * ``demands`` is a list of demand dictionaries
        * ``method`` is a LCIA method
        * ``iterations`` is the number of Monte Carlo iterations desired
        * ``cpus`` is the (optional) number of CPUs to use

    The input list can have complex demands, so ``[{('foo', 'bar'): 1, ('foo', 'baz'): 1}, {('foo', 'another'): 1}]`` is OK.

    Call ``.calculate()`` to generate results.

    """
    def __init__(self, demands, method, iterations, cpus=None):
        clean_databases()
        # Convert from activity proxies if necessary: every key is reduced
        # to a plain ``(k[0], k[1])`` tuple.
        self.demands = [{(k[0], k[1]): v for k, v in obj.items()}
                        for obj in demands]
        self.method = method
        self.iterations = iterations
        self.cpus = cpus or multiprocessing.cpu_count()

    def merge_results(self, objs):
        """Merge the results from each ``multi_worker`` worker.

        Each element of ``objs`` is one worker's list of
        ``(demand dictionary, score)`` pairs. Scores belonging to equal
        demand dictionaries are collected into one list, so
        ``[[(d, 0)], [(d, 1)]]`` becomes ``[(d, [0, 1])]``.

        """
        merged = {}
        for worker_result in objs:
            for demand, score in worker_result:
                # Dictionaries are not hashable, so a frozenset of their
                # items is used as the grouping key.
                merged.setdefault(frozenset(demand.items()), []).append(score)
        return [(dict(key), scores) for key, scores in merged.items()]

    def calculate(self, worker=multi_worker):
        """Calculate Monte Carlo results for many demand vectors.

        Returns a list of results with the format::

            [(demand dictionary, [lca scores])]

        There is no guarantee that the results are returned in the same order as the ``demand`` input variable.

        """
        # One job per Monte Carlo iteration; each job scores every demand.
        job_args = [
            (projects.current, self.demands, self.method)
            for _ in range(self.iterations)
        ]
        with pool_adapter(multiprocessing.Pool(processes=self.cpus)) as pool:
            results = pool.map(worker, job_args)
        return self.merge_results(results)