mdciofalo
diff --git a/‎.gitignore
+1 b/‎.gitignore
+1
diff --git a/‎data/climate_data_calculations.py
+5-7 b/‎data/climate_data_calculations.py
+5-7
diff --git a/‎data/export_data.py
-53 b/‎data/export_data.py
-53
diff --git a/‎data/facts/municipalities_counties.py
+1-2 b/‎data/facts/municipalities_counties.py
+1-2
diff --git a/‎data/issues/emissions/approximated_data_calculations.py
+55 b/‎data/issues/emissions/approximated_data_calculations.py
+55
@@ -39,6 +39,7 @@ yarn-error.log*
 *.tsbuildinfo
 
 /.vscode/
+/.idea/
 
 # python
 __pycache__/
 
@@ -3,7 +3,9 @@
 import json
 
 from solutions.cars.electric_car_change_rate import get_electric_car_change_rate
-from solutions.cars.electric_vehicle_per_charge_points import get_electric_vehicle_per_charge_points
+from solutions.cars.electric_vehicle_per_charge_points import (
+    get_electric_vehicle_per_charge_points,
+)
 from solutions.bicycles.bicycle_data_calculations import bicycle_calculations
 from facts.plans.plans_data_prep import get_climate_plans
 from facts.municipalities_counties import get_municipalities
@@ -55,12 +57,8 @@
         'totalApproximatedHistoricalEmission': df.iloc[i]['totalApproximatedHistorical'],
         'trend': df.iloc[i]['trend'],
         'trendEmission': df.iloc[i]['trendEmission'],
-        'historicalEmissionChangePercent': df.iloc[i][
-            'historicalEmissionChangePercent'
-        ],
-        'neededEmissionChangePercent': df.iloc[i][
-            'neededEmissionChangePercent'
-        ],
+        'historicalEmissionChangePercent': df.iloc[i]['historicalEmissionChangePercent'],
+        'neededEmissionChangePercent': df.iloc[i]['neededEmissionChangePercent'],
         'hitNetZero': df.iloc[i]['hitNetZero'],
         'budgetRunsOut': df.iloc[i]['budgetRunsOut'],
         'electricCarChangePercent': df.iloc[i]['electricCarChangePercent'],
 
@@ -1,6 +1,5 @@
 import pandas as pd
 
-
 def get_municipalities():
     # Load the data
     df = pd.read_excel('facts/kommunlankod_2023.xls')
@@ -25,4 +24,4 @@ def get_municipalities():
             result = pd.concat([result, pd.DataFrame({'Kommun': [municipality], 'Kod': [code], 'Län': [county]})], ignore_index=True)
 
     # Return the resulting dataframe
-    return result
+    return result
@@ -0,0 +1,55 @@
+import numpy as np
+
+
def calculate_approximated_historical(df, last_year_with_smhi_data, current_year):
    """
    Approximate emission values for the years after the last year with SMHI data.

    The values are extrapolated along the previously calculated linear trend
    (``value = fit[0] * year + fit[1]``) and clamped at zero. The area under
    the resulting curve is then integrated with the trapezoidal rule.

    Args:
        df (pandas.DataFrame): Input data. Must contain a 'Kommun' column and,
            when there is at least one year to approximate, a column named by
            ``last_year_with_smhi_data`` plus a 'trendCoefficients' column
            whose entries are indexable as ``[slope, intercept]``.
        last_year_with_smhi_data (int): The last year with SMHI data.
        current_year (int): The current year (included in the approximation).

    Returns:
        pandas.DataFrame: A copy of ``df`` sorted by 'Kommun' with two added
        columns: 'approximatedHistorical' (dict mapping year -> value, empty
        when no approximation is needed) and 'totalApproximatedHistorical'
        (trapezoidal integral of that dict over the years).
    """

    # np.trapz is deprecated since NumPy 2.0 in favour of np.trapezoid;
    # fall back to the old name on NumPy versions that predate the rename.
    integrate = getattr(np, 'trapezoid', None) or np.trapz

    # Years passed since the last year with SMHI data (including current year)
    approximated_years = range(last_year_with_smhi_data + 1, current_year + 1)

    # sort_values returns a new frame, so the caller's DataFrame is untouched
    df = df.sort_values('Kommun', ascending=True)

    if approximated_years:
        approximated = []
        rows = zip(df[last_year_with_smhi_data], df['trendCoefficients'])
        for last_recorded, fit in rows:
            # Start from the latest recorded datapoint so the integral below
            # covers the span from that year up to the current year
            yearly = {last_year_with_smhi_data: last_recorded}
            for year in approximated_years:
                # Clamp at zero so the trend line never yields negative values
                yearly[year] = max(0, fit[0] * year + fit[1])
            approximated.append(yearly)
    else:
        # Nothing to approximate: one empty dict per municipality. The trend
        # columns are deliberately not read in this case.
        approximated = [{} for _ in range(len(df))]

    df['approximatedHistorical'] = approximated

    # Integrate each municipality's approximated values over the years
    df['totalApproximatedHistorical'] = [
        integrate(list(yearly.values()), list(yearly.keys()))
        for yearly in approximated
    ]

    return df