Adding optimisation features and steps

JBris · JBris · commit cf960468e4ea · 2026-02-07T22:39:48.000+13:00
diff --git a/behave.ini b/behave.ini
@@ -0,0 +1,6 @@
+[behave]
+paths = features
+tags = not @skip
+logging_level = INFO
+stop = False
+show_skipped = True
diff --git a/data/ground_truth.json b/data/ground_truth.json
@@ -0,0 +1,11 @@
+{
+    "TSUM1": 255,
+    "TSUM2": 1400,
+    "TBASEM": 3.0,
+    "TSUMEM": 170.0,
+    "TEFFMX": 18.0,
+    "SPAN": 37,
+    "TDWI": 75,
+    "RGRLAI": 0.016,
+    "Q10": 2.0
+}
diff --git a/data/synthetic_test_data.csv b/data/synthetic_test_data.csv
diff --git a/docs/source/index.rst b/docs/source/index.rst
@@ -22,6 +22,7 @@ For our community code of conduct, please also view `CODE_OF_CONDUCT.md. <https:
    :maxdepth: 1
    :caption: Contents:
 
+   tutorials/quickstart.rst
    api_reference/index.rst
    changelogs/changelog.rst
    community/index.rst
diff --git a/docs/source/tutorials/quickstart.rst b/docs/source/tutorials/quickstart.rst
@@ -0,0 +1,31 @@
+Quickstart
+==========
+
+First, run the following code to install all dependencies:
+
+.. code-block:: bash
+
+    poetry install --no-interaction
+
+Second, execute the following to run the behaviour tests:
+
+.. code-block:: bash
+
+    behave --verbose --summary
+
+Python Environment
+==================
+
+behave
+------
+
+`The behave package was used to implement all BDD tests. <https://behave.readthedocs.io/en/stable/index.html>`_
+These tests have been written using Gherkin syntax. `For more information on Gherkin, click here. <https://cucumber.io/docs/gherkin/reference/>`_
+
+* Feature files containing human-readable Gherkin can be found here: :file:`features`
+* The implementation of the scenario steps can be found here: :file:`features/steps`
+
+Data
+====
+
+* The potato data were originally retrieved from the `pcse_notebooks data directory <https://github.com/ajwdewit/pcse_notebooks/tree/master/data>`_.
diff --git a/features/environment.py b/features/environment.py
@@ -1,6 +1,9 @@
+import optuna
 from behave.model import Feature, Scenario
 from behave.runner import Context
 
+optuna.logging.set_verbosity(optuna.logging.WARNING)
+
 
 def before_feature(context: Context, feature: Feature) -> None:
 	pass
diff --git a/features/optimisation.feature b/features/optimisation.feature
@@ -1,17 +1,21 @@
 Feature: Calibration of WOFOST potato using black-box optimisation
-    Because crop model parameters are uncertain
+    Because potato crop model parameters are uncertain
     We want to calibrate WOFOST by exploring the parameter space with black-box optimisation
+    And minimising the discrepancy for end-of-season LAI and TWSO
     So potato crop development and growth is both accurate and well-constrained
 
     Background:
         Given we are using WOFOST site data with a WAV of "50.0"
         And we are using default soil parameter values
         And we are using crop data stored in the "data" directory
         And our state variables are "LAI and TWSO"
+        And we are using "mean squared error" as our error metric
+        And we are using observed data from the "data/synthetic_test_data.csv" file
+        And we are using ground truth data from the "data/ground_truth.json" file
         And the following parameter specification is used for calibration:
             | name   | description                                                   | range       | distribution | type       |
             | TSUM1  | Temperature sum from emergence to anthesis                    | 150, 280    | uniform      | continuous |
-            | TSUM2  | Temperature sum from anthesis to maturity                     | 1400, 2100  | uniform      | continuous |
+            | TSUM2  | Temperature sum from anthesis to maturity                     | 1550, 2100  | uniform      | continuous |
             | TBASEM | Base temperature for emergence                                | 2, 4        | uniform      | continuous |
             | TSUMEM | Temperature sum required for crop emergence                   | 170, 255    | uniform      | continuous |
             | TEFFMX | Maximum effective temperature for emergence                   | 18, 32      | uniform      | continuous |
@@ -20,11 +24,19 @@ Feature: Calibration of WOFOST potato using black-box optimisation
             | RGRLAI | Relative growth rate of leaf area index                       | 0.008, 0.02 | uniform      | continuous |
             | Q10    | Temperature response factor for respiration (Q10 coefficient) | 2, 3        | uniform      | continuous |
         And the following specification is used for the calibration procedure:
-            | name              | description                                   | value                 |
-            | experiment_name   | The name of the current experiment            | WOFOST optimisation   |
-            | n_jobs            | The number of simulations to run in parallel  | -1                    |
+            | name            | description                                  | value                |
+            | experiment_name | The name of the current experiment           | WOFOST optimisation  |
+            | n_jobs          | The number of simulations to run in parallel | -1                   |
+            | random_seed     | The random seed for replicability            | 100                  |
 
-    Scenario: run a simple test
-        Given we have behave installed
-        When we implement a test
-        Then behave will test it for us!
+    @netherlands @optimisation
+    Scenario: Black-box optimisation of WOFOST potato for end-of-season LAI and TWSO in Limburg, Netherlands
+        Given we are using NASA weather data with a latitude of "51" and a longitude of "5"
+        And we are using agronomy management data in the "data/potato_netherlands_2021.agro" file
+        When we execute an optimisation procedure using the "TPES" method and the "Optuna" library with "5" iterations
+
+    @india @optimisation
+    Scenario: Black-box optimisation of WOFOST potato for end-of-season LAI and TWSO in Gujarat, India
+        Given we are using NASA weather data with a latitude of "23" and a longitude of "73"
+        And we are using agronomy management data in the "data/potato_india_2021.agro" file
+        When we execute an optimisation procedure using the "TPES" method and the "Optuna" library with "5" iterations
diff --git a/features/sensitivity.feature b/features/sensitivity.feature
@@ -1,7 +1,7 @@
 Feature: Sobol sensitivity analysis for WOFOST potato
-    Because parameter uncertainty drives crop development and growth
+    Because parameter uncertainty drives potato crop development and growth
     We want to quantify global sensitivities using Sobol indices
-    So we can identify influential parameters for potato LAI and TWSO
+    So we can identify influential parameters for end-of-season LAI and TWSO
 
     Background:
         Given we are using WOFOST site data with a WAV of "50.0"
@@ -23,17 +23,30 @@ Feature: Sobol sensitivity analysis for WOFOST potato
             | name              | description                                   | value                             |
             | experiment_name   | The name of the current experiment            | WOFOST sensitivity analysis       |
             | n_jobs            | The number of simulations to run in parallel  | 10                                |
+            | random_seed       | The random seed for replicability             | 100                               |
 
     @netherlands @sensitivity
-    Scenario: Sobol sensitivity analysis for LAI and TWSO in Limburg, Netherlands
+    Scenario: Sobol sensitivity analysis for end-of-season LAI and TWSO in Limburg, Netherlands
         Given we are using NASA weather data with a latitude of "51" and a longitude of "5"
         And we are using agronomy management data in the "data/potato_netherlands_2021.agro" file
-        When we execute a sensitivity analysis using the "Sobol" method and the "SALib" library with "4" samples
-        Then behave will test it for us!
+        When we execute a sensitivity analysis using the "Sobol" method and the "SALib" library with "256" samples
+        Then the "1st" highest "first order" sensitivity index for "LAI" should be "SPAN"
+        And the "1st" highest "total order" sensitivity index for "LAI" should be "SPAN"
+        And the "2nd" highest "total order" sensitivity index for "LAI" should be "TSUM1"
+        And the "1st" highest "first order" sensitivity index for "TWSO" should be "SPAN"
+        And the "2nd" highest "first order" sensitivity index for "TWSO" should be "Q10"
+        And the "1st" highest "total order" sensitivity index for "TWSO" should be "SPAN"
+        And the "2nd" highest "total order" sensitivity index for "TWSO" should be "TSUM2"
 
     @india @sensitivity
-    Scenario: Sobol sensitivity analysis for LAI and TWSO in Gujarat, India
+    Scenario: Sobol sensitivity analysis for end-of-season LAI and TWSO in Gujarat, India
         Given we are using NASA weather data with a latitude of "23" and a longitude of "73"
         And we are using agronomy management data in the "data/potato_india_2021.agro" file
-        When we execute a sensitivity analysis using the "Sobol" method and the "SALib" library with "4" samples
-        Then behave will test it for us!
+        When we execute a sensitivity analysis using the "Sobol" method and the "SALib" library with "256" samples
+        Then the "1st" highest "first order" sensitivity index for "LAI" should be "SPAN"
+        And the "1st" highest "total order" sensitivity index for "LAI" should be "SPAN"
+        And the "2nd" highest "total order" sensitivity index for "LAI" should be "TSUM1"
+        And the "1st" highest "first order" sensitivity index for "TWSO" should be "TSUM1"
+        And the "2nd" highest "first order" sensitivity index for "TWSO" should be "TSUM2"
+        And the "1st" highest "total order" sensitivity index for "TWSO" should be "TSUM1"
+        And the "2nd" highest "total order" sensitivity index for "TWSO" should be "TSUM2"
diff --git a/features/steps/step_calibration.py b/features/steps/step_calibration.py
@@ -1,10 +1,15 @@
-from behave import given, register_type, when
+import json
+
+import pandas as pd
+from behave import given, register_type, then, when
 from behave.runner import Context
 from pcse.base import ParameterProvider
 
 from wofostat import (
 	end_of_season_sensitivity_func,
 	get_parameter_spec,
+	objective_func,
+	run_optimisation,
 	run_sensitivity_analysis,
 	snake_case_string,
 )
@@ -23,6 +28,22 @@ def specify_calibration(context: Context) -> None:
 	context.calibration_spec = {row["name"]: row["value"] for row in context.table}
 
 
+@given('we are using "{distance_metric}" as our error metric')
+def set_distance_metric(context: Context, distance_metric: str) -> None:
+	context.distance_metric = distance_metric  # handed to run_optimisation later
+
+
+@given('we are using observed data from the "{fpath}" file')
+def get_observed_data(context: Context, fpath: str) -> None:
+	context.observed_data = pd.read_csv(fpath)  # stored as a pandas DataFrame
+
+
+@given('we are using ground truth data from the "{fpath}" file')
+def get_ground_truth(context: Context, fpath: str) -> None:
+	with open(fpath) as f:
+		context.ground_truth = json.load(f)
+
+
 def _get_params(context: Context) -> ParameterProvider:
 	params = WOFOST.get_params(
 		cropd=context.cropd, sited=context.sited, soild=context.soild
@@ -52,3 +73,56 @@ def execute_sensitivity(
 		engine=engine,
 		**context.calibration_spec,
 	)
+
+
+@then(
+	'the "{position}" highest "{order}" sensitivity index for "{state_var}" '
+	'should be "{param_name}"'
+)
+def check_sensitivity_index(
+	context: Context, position: str, order: str, state_var: str, param_name: str
+) -> None:
+	index = "".join(c for c in position if c.isdigit())
+	index = int(index) - 1
+
+	if order == "total order":
+		order = "ST"
+	else:
+		order = "S1"
+
+	sensitivity_param = context.sp_df[state_var][order].iloc[index].name
+	if sensitivity_param != param_name:
+		raise RuntimeWarning(f"Parameter is {sensitivity_param}")
+
+	assert sensitivity_param == param_name
+
+
+@when(
+	'we execute an optimisation procedure using the "{method:SnakeCaseString}" method '
+	'and the "{engine:SnakeCaseString}" library with "{n_iterations:d}" iterations'
+)
+def execute_optimisation(
+	context: Context, method: str, engine: str, n_iterations: int
+) -> None:
+	params = _get_params(context)
+
+	(
+		context.calibrator,
+		context.param_importances,
+		context.trials_df,
+		context.parameter_estimates,
+	) = run_optimisation(
+		parameter_spec=context.parameter_spec,
+		n_iterations=n_iterations,
+		wdp=context.wdp,
+		agro=context.agro,
+		state_vars=context.state_vars,
+		calibration_func=objective_func,
+		params=params,
+		method=method,
+		engine=engine,
+		ground_truth=context.ground_truth,
+		observed_data=context.observed_data,
+		distance_metric=context.distance_metric,
+		**context.calibration_spec,
+	)
diff --git a/notebooks/6_full_sensitivity_wofost.ipynb b/notebooks/6_full_sensitivity_wofost.ipynb
@@ -221,7 +221,7 @@
    "source": [
     "state_vars = [\"LAI\", \"TWSO\"]\n",
     "\n",
-    "run_sensitivity_analysis(\n",
+    "calibrator, sp = run_sensitivity_analysis(\n",
     "    experiment_name = \"netherlands_sensitivity_analysis\",\n",
     "    parameter_spec=parameter_spec,\n",
     "    n_samples = 8,\n",
diff --git a/notebooks/7_full_optimisation_wofost.ipynb b/notebooks/7_full_optimisation_wofost.ipynb
@@ -8,7 +8,7 @@
    "outputs": [],
    "source": [
     "import os.path as osp\n",
-    "\n",
+    "import json\n",
     "import numpy as np\n",
     "from pcse.input import (\n",
     "\tDummySoilDataProvider,\n",
@@ -20,7 +20,7 @@
     "from wofostat.wofost import WOFOST, DEFAULT_PARAMETER_VALUES\n",
     "from wofostat import objective_func, run_optimisation, get_parameter_spec, table_to_dict\n",
     "from pcse.base import ParameterProvider\n",
-    "\n",
+    "from pathlib import Path\n",
     "from pcse.base import ParameterProvider"
    ]
   },
@@ -120,14 +120,30 @@
     "    { \"name\": \"Q10\", \"value\":  2.0  },\n",
     "]\n",
     "ground_truth = table_to_dict(ground_truth)\n",
+    "with open(Path(\"..\", \"data\") / \"ground_truth.json\", \"w\") as f:\n",
+    "    json.dump(ground_truth, f, indent=4)\n",
+    "    \n",
     "params = WOFOST.get_params(cropd=cropd, sited=sited, soild=soild)\n",
     "wofost = WOFOST(params, netherlands_wdp, netherlands_agro)\n",
     "\n",
     "params = WOFOST.override(ground_truth, params)\n",
     "observed_data = wofost.run()\n",
+    "observed_data.to_csv(\n",
+    "    Path(\"..\", \"data\") / \"synthetic_test_data.csv\", index=False\n",
+    ")\n",
     "observed_data"
    ]
   },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "87dad4bc-503b-4232-8642-33b7095d0ee5",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "ground_truth"
+   ]
+  },
   {
    "cell_type": "code",
    "execution_count": null,
diff --git a/wofostat/calibration.py b/wofostat/calibration.py
@@ -110,6 +110,7 @@ def run_sensitivity_analysis(
 	n_jobs: int = 1,
 	method: str = "sobol",
 	engine: str = "salib",
+	random_seed: int | None = None,
 ) -> tuple[SensitivityAnalysisMethod, dict[str, dict[str, pd.DataFrame]]]:
 	"""Run a sensitivity analysis.
 
@@ -125,6 +126,7 @@ def run_sensitivity_analysis(
 	    n_jobs (int, optional): Number of simulations to run in parallel. Defaults to 1.
 		method (str, optional): The calibration method.
 		engine (str, optional): The underlying calibration library.
+		random_seed (int, optional): The random seed for replicability.
 
 	Returns:
 	    tuple[SensitivityAnalysisMethod, dict[str, dict[str, pd.DataFrame]]]]: The
@@ -140,6 +142,7 @@ def run_sensitivity_analysis(
 		verbose=True,
 		batched=False,
 		method_kwargs=dict(calc_second_order=False, scramble=True),
+		random_seed=random_seed,
 		analyze_kwargs=dict(
 			calc_second_order=False,
 			num_resamples=200,
@@ -160,8 +163,8 @@ def run_sensitivity_analysis(
 	sp = {}
 	for i, state_var in enumerate(state_vars):
 		sp[state_var] = {
-			"ST": sp_df[i][0],
-			"S1": sp_df[i][1],
+			"ST": sp_df[i][0].sort_values("ST", ascending=False),
+			"S1": sp_df[i][1].sort_values("S1", ascending=False),
 		}
 
 	return calibrator, sp
@@ -226,6 +229,9 @@ def run_optimisation(
 	observed_data: np.ndarray | None,
 	distance_metric: str = "mean squared error",
 	n_jobs: int = 1,
+	method: str = "tpes",
+	engine: str = "optuna",
+	random_seed: int | None = None,
 ) -> tuple[OptimisationMethod, dict[str, dict[Any, Any]], pd.DataFrame, pd.DataFrame]:
 	"""Run an optimisation procedure.
 
@@ -243,6 +249,9 @@ def run_optimisation(
 	    distance_metric (str, optional): The distance metric function
 	    for the discrepancy. Defaults to "mean squared error".
 	    n_jobs (int, optional): Number of simulations to run in parallel. Defaults to 1.
+	    method (str, optional): The calibration method.
+	    engine (str, optional): The underlying calibration library.
+	    random_seed (int, optional): The random seed for replicability.
 
 	Returns:
 	    tuple[OptimisationMethod, dict[str, dict[Any, Any]],
@@ -255,11 +264,12 @@ def run_optimisation(
 		experiment_name=experiment_name,
 		parameter_spec=parameter_spec,
 		observed_data=observed_data,
-		method="tpes",
+		method=method,
 		output_labels=state_vars,
 		directions=directions,
 		n_jobs=n_jobs,
 		n_iterations=n_iterations,
+		random_seed=random_seed,
 		calibration_func_kwargs=dict(
 			wdp=wdp,
 			agro=agro,
@@ -270,7 +280,7 @@ def run_optimisation(
 	)
 
 	calibrator = OptimisationMethod(
-		calibration_func=calibration_func, specification=specification, engine="optuna"
+		calibration_func=calibration_func, specification=specification, engine=engine
 	)
 
 	calibrator.specify().execute()