brightway-lca · TimoDiepers · Jul 11, 2024 · Jun 26, 2024 · Jun 28, 2024 · Jul 8, 2024
diff --git a/bw_timex/SetList.py b/bw_timex/SetList.py
@@ -0,0 +1,69 @@
+import warnings
+
+class SetList:
+    """Helper class for mapping the same (or mapped) activity across different (temporal) databases.
+
+    It holds a list of sets, each containing tuples of (act_id, database). Sets are registered with
+    `add`, and indexing the instance with an item returns the stored set that contains this item.
+
+    Example: after `my_setlist.add({(1, "db_2020"), (2, "db_2030")})`, the lookup
+    `my_setlist[(1, "db_2020")]` returns `{(1, "db_2020"), (2, "db_2030")}`.
+    """
+
+    def __init__(self) -> None:
+        self.list = []  # stored sets, in insertion order
+
+    def add(self, new_set: set) -> None:
+        """
+        Adds a set to the SetList instance, unless it is already stored or overlaps a stored set.
+
+        Parameters
+        ----------
+        new_set : set
+            The set to add. An exact duplicate is ignored silently; a set sharing at least one
+            item with an already stored set is skipped with a warning.
+        """
+        if new_set in self.list:
+            return
+
+        overlapping_sets = [itemset for itemset in self.list if any(item in itemset for item in new_set)]
+        if not overlapping_sets:
+            self.list.append(new_set)
+            return
+
+        # list every clashing item and every affected set only once in the warning
+        overlapping_items = [item for item in new_set if any(item in s for s in overlapping_sets)]
+        warnings.warn(
+            'tried to add {} to the SetList\n, but {} already exist in the SetList in:\n {}. \n Skipping {}'.format(
+                new_set, overlapping_items, overlapping_sets, new_set),
+            stacklevel=2,
+        )
+
+    def __getitem__(self, key: object) -> "set | None":
+        """
+        Returns the first set in the SetList instance that contains the key.
+
+        Parameters
+        ----------
+        key : object
+            The item to look for in the sets of the SetList.
+
+        Returns
+        -------
+        The first set containing the key (a warning is issued if several sets contain it), or None
+        together with a warning if no set contains the key.
+        """
+        sets = [matching_set for matching_set in self.list if key in matching_set]
+        if not sets:
+            warnings.warn('Key {} not found in SetList'.format(key), stacklevel=2)
+            return None
+        if len(sets) > 1:
+            warnings.warn('Key found in multiple sets!!!! {} Please check! Returning only the first set'.format(sets), stacklevel=2)
+        return sets[0]
+
+    def __iter__(self):
+        """Iterates over the stored sets; without this, iteration would fall back to `__getitem__` and never end."""
+        return iter(self.list)
+
+    def __len__(self) -> int:
+        return len(self.list)
diff --git a/bw_timex/__init__.py b/bw_timex/__init__.py
@@ -1,8 +1,10 @@
 from .dynamic_biosphere_builder import DynamicBiosphereBuilder
 from .dynamic_characterization import DynamicCharacterization
+from .dynamic_biosphere_builder_from_timeline import DynamicBiosphereBuilder
 from .edge_extractor import EdgeExtractor
 from .matrix_modifier import MatrixModifier
 from .timeline_builder import TimelineBuilder
 from .timex_lca import TimexLCA
+from .SetList import SetList
 
 __version__ = "0.1.4"
diff --git a/bw_timex/dynamic_biosphere_builder.py b/bw_timex/dynamic_biosphere_builder.py
@@ -62,7 +62,7 @@ def __init__(
         }
 
         self.lca_obj = lca_obj
-        self.technosphere_matrix = lca_obj.technosphere_matrix
+        self.technosphere_matrix = lca_obj.technosphere_matrix.tocsc()  # convert to csc as this is only used for column slicing 
         self.activity_dict = lca_obj.dicts.activity
         self.activity_time_mapping_dict = activity_time_mapping_dict
         self.biosphere_time_mapping_dict = biosphere_time_mapping_dict
@@ -133,7 +133,7 @@ def build_dynamic_biosphere_matrix(self):
 
                     # first create a row index for the tuple((db, bioflow), date))
                     time_mapped_matrix_id = self.biosphere_time_mapping_dict.add(
-                        (exc.input, date)
+                        (exc.input.id, date)
                     )
 
                     # populate lists with which sparse matrix is constructed
@@ -142,11 +142,10 @@ def build_dynamic_biosphere_matrix(self):
                         col=process_col_index,
                         amount=amount,
                     )
-
         for id in self.node_id_collection_dict["temporal_markets"]:
             process_col_index = self.activity_dict[id]  # get the matrix column index
             technosphere_column = (
-                self.technosphere_matrix[:, process_col_index].toarray().flatten()
+                self.technosphere_matrix[:, process_col_index].toarray().ravel()
             )  # 1-d np.array
             demand = dict()
             for idx, amount in enumerate(technosphere_column):
@@ -171,7 +170,7 @@ def build_dynamic_biosphere_matrix(self):
             )  # aggregated biosphere flows of background supply chain emissions. Rows are bioflows.
 
             for idx, amount in enumerate(aggregated_inventory.flatten().tolist()[0]):
-                bioflow = bd.get_activity(self.lca_obj.dicts.biosphere.reversed[idx])
+                bioflow = self.lca_obj.dicts.biosphere.reversed[idx]
                 ((_, _), time) = self.activity_time_mapping_dict.reversed()[id]
 
                 time_in_datetime = convert_date_string_to_datetime(

diff --git a/bw_timex/dynamic_biosphere_builder_from_timeline.py b/bw_timex/dynamic_biosphere_builder_from_timeline.py
@@ -0,0 +1,217 @@
+from scipy import sparse as sp
+import pandas as pd
+import numpy as np
+import bw2data as bd
+from bw_temporalis import TemporalDistribution
+from .remapping import TimeMappingDict
+from bw2calc import LCA
+from datetime import datetime
+from .utils import convert_date_string_to_datetime
+from .SetList import SetList
+
+
+class DynamicBiosphereBuilder:
+    """
+    This class is used to build a dynamic biosphere matrix, which in contrast to the normal biosphere matrix has rows for each biosphere flow at their time of emission.
+    Thus, the dimensions are (bio_flows at a specific timestep) x (processes).
+    """
+
+    def __init__(
+        self,
+        lca_obj: LCA,
+        activity_time_mapping_dict: dict,
+        biosphere_time_mapping_dict: dict,
+        demand_timing_dict: dict,
+        node_id_collection_dict: dict,
+        temporal_grouping: str,
+        database_date_dict: dict,
+        database_date_dict_static_only: dict,
+        timeline: pd.DataFrame,
+        interdatabase_activity_mapping: SetList,
+    ) -> None:
+        """
+        Initializes the DynamicBiosphereBuilder object.
+
+        Parameters
+        ----------
+        lca_obj : LCA object
+            instance of the bw2calc LCA class, e.g. TimexLCA.lca
+        activity_time_mapping_dict : dict
+            A dictionary mapping activities to their respective timing in the format (('database', 'code'), datetime_as_integer): time_mapping_id. Its `reversed()` method is used, so presumably a TimeMappingDict is expected.
+        biosphere_time_mapping_dict : dict
+            A dictionary mapping biosphere flows to their respective timing, at this point still empty. It is filled via its `add()` method with (biosphere flow, date of emission) tuples.
+        demand_timing_dict : dict
+            A dictionary mapping of the demand to demand time
+        node_id_collection_dict : dict
+            A dictionary containing lists of node ids for different node subsets. The subsets "temporalized_processes" and "temporal_markets" are used here.
+        temporal_grouping : str
+            A string indicating the temporal grouping of the processes, one of 'year', 'month', 'day', 'hour'
+        database_date_dict : dict
+            A dictionary mapping database names to their respective date
+        database_date_dict_static_only : dict
+            A dictionary mapping database names to their respective date, but only containing static databases, which are the background databases.
+        timeline : pd.DataFrame
+            The timeline; its columns `time_mapped_producer`, `producer` and `interpolation_weights` are read, and its index is used as matrix column index.
+        interdatabase_activity_mapping : SetList
+            A SetList whose sets hold (activity id, database name) tuples; it is used to find the counterpart of a producer in another database.
+
+        Returns
+        -------
+        None
+
+        """
+
+        self._time_res_dict = {
+            "year": "datetime64[Y]",
+            "month": "datetime64[M]",
+            "day": "datetime64[D]",
+            "hour": "datetime64[h]",
+        }
+
+        self.lca_obj = lca_obj
+        self.activity_time_mapping_dict = activity_time_mapping_dict
+        self.biosphere_time_mapping_dict = biosphere_time_mapping_dict
+        self.demand_timing_dict = demand_timing_dict
+        self.node_id_collection_dict = node_id_collection_dict
+        self.time_res = self._time_res_dict[temporal_grouping]
+        self.temporal_grouping = temporal_grouping
+        self.database_date_dict = database_date_dict
+        self.database_date_dict_static_only = database_date_dict_static_only
+        self.timeline = timeline
+        self.interdatabase_activity_mapping = interdatabase_activity_mapping
+        # row indices, column indices and values from which the sparse matrix is built
+        self.rows = []
+        self.cols = []
+        self.values = []
+
+    def build_dynamic_biosphere_matrix(self):
+        """
+        This function creates a separate biosphere matrix, with the dimensions (bio_flows at a specific timestep) x (processes).
+        Every temporally resolved biosphere flow has its own row in the matrix, making it highly sparse.
+        The timing of the emitting process and potential additional temporal information of the biosphere flow (e.g. delay of emission compared to timing of process) are considered.
+        Previously collected matrix entries are discarded, so the method can safely be called more than once.
+
+        Parameters
+        ----------
+        None
+
+        Returns
+        -------
+        dynamic_biomatrix : scipy.sparse.csr_matrix
+            A sparse matrix with the dimensions (bio_flows at a specific timestep) x (processes), where every row represents a biosphere flow at a specific time.
+        """
+        # start from empty lists, otherwise calling this method again would add every entry a second time
+        self.rows, self.cols, self.values = [], [], []
+        reversed_activity_time_mapping = self.activity_time_mapping_dict.reversed()
+
+        for row in self.timeline.itertuples():
+            producer_id = row.time_mapped_producer
+            process_col_index = row.Index  # NOTE(review): assumes the timeline index runs from 0 to len(timeline) - 1
+            # time is here an integer, with various length depending on temporal grouping, e.g. [Y] -> 2024, [M] -> 202401
+            (original_db, original_code), time = reversed_activity_time_mapping[producer_id]
+
+            if producer_id in self.node_id_collection_dict["temporalized_processes"]:
+                td_producer = self._get_producer_dates(time)
+                act = bd.get_node(database=original_db, code=original_code)
+
+                for exc in act.biosphere():
+                    temporal_distribution = exc.get("temporal_distribution")
+                    if temporal_distribution:
+                        # we can add a datetime of length 1 to a timedelta of length N without problems
+                        dates = td_producer + temporal_distribution.date
+                        values = exc["amount"] * temporal_distribution.amount
+                    else:  # exchange has no TD, so it is emitted at the time of the producer
+                        dates = td_producer
+                        values = [exc["amount"]]
+
+                    bioflow_id = exc.input.id
+                    # Add entries to dynamic bio matrix
+                    for date, amount in zip(dates, values):
+                        # first create a row index for the tuple (bioflow id, date)
+                        time_mapped_matrix_id = self.biosphere_time_mapping_dict.add(
+                            (bioflow_id, date)
+                        )
+
+                        # populate lists with which sparse matrix is constructed
+                        self.add_matrix_entry_for_biosphere_flows(
+                            row=time_mapped_matrix_id,
+                            col=process_col_index,
+                            amount=amount,
+                        )
+
+            elif producer_id in self.node_id_collection_dict["temporal_markets"]:
+                mapped_activities = self.interdatabase_activity_mapping[(row.producer, original_db)]
+                demand = {}
+                for db, amount in row.interpolation_weights.items():
+                    # exactly one counterpart per database is expected, otherwise the unpacking raises a ValueError
+                    [timed_act_id] = [
+                        act_id for (act_id, db_name) in mapped_activities if db_name == db
+                    ]
+                    demand[timed_act_id] = amount
+
+                self.lca_obj.redo_lci(demand)
+
+                # aggregated biosphere flows of background supply chain emissions. Rows are bioflows.
+                aggregated_inventory = self.lca_obj.inventory.sum(axis=1)
+
+                # the date and the index lookup are the same for all bioflows, so get them once
+                date = self._get_producer_dates(time)[0]
+                biosphere_reversed = self.lca_obj.dicts.biosphere.reversed
+                for idx, amount in enumerate(aggregated_inventory.A1):
+                    time_mapped_matrix_id = self.biosphere_time_mapping_dict.add(
+                        (biosphere_reversed[idx], date)
+                    )
+
+                    self.add_matrix_entry_for_biosphere_flows(
+                        row=time_mapped_matrix_id, col=process_col_index, amount=amount
+                    )
+
+        # now build the dynamic biosphere matrix; default=-1 gives a matrix without rows if no entry was added
+        shape = (max(self.rows, default=-1) + 1, len(self.timeline))
+        dynamic_biomatrix = sp.coo_matrix((self.values, (self.rows, self.cols)), shape)
+        self.dynamic_biomatrix = dynamic_biomatrix.tocsr()
+
+        return self.dynamic_biomatrix
+
+    def _get_producer_dates(self, time):
+        """
+        Converts the integer time of a time-mapped process into a datetime array of length 1.
+
+        Parameters
+        ----------
+        time : int
+            The time of the process as stored in the activity_time_mapping_dict, e.g. 2024 for temporal grouping 'year'
+
+        Returns
+        -------
+        The date array of a TemporalDistribution that only holds the time of the process
+        """
+        time_in_datetime = convert_date_string_to_datetime(
+            self.temporal_grouping, str(time)
+        )  # now time is a datetime
+        return TemporalDistribution(
+            date=np.array([time_in_datetime], dtype=self.time_res),
+            amount=np.array([1]),
+        ).date  # TODO: Simplify
+
+    def add_matrix_entry_for_biosphere_flows(self, row, col, amount):
+        """
+        Adds an entry to the lists of row, col and values, which are then used to construct the dynamic biosphere matrix.
+
+        Parameters
+        ----------
+        row : int
+            A row index of a new element to the dynamic biosphere matrix
+        col: int
+            A column index of a new element to the dynamic biosphere matrix
+        amount: float
+            The amount of the new element to the dynamic biosphere matrix
+
+        Returns
+        -------
+        None, but the lists of row, col and values are updated
+
+        """
+        self.rows.append(row)
+        self.cols.append(col)
+        self.values.append(amount)