This commit is contained in:
2026-05-09 16:55:06 +03:30
parent 1679825ae2
commit cead7dafe2
51 changed files with 7514 additions and 1221 deletions
+476
View File
@@ -0,0 +1,476 @@
from __future__ import annotations
import math
import os
from dataclasses import dataclass
from datetime import date
from decimal import Decimal
from typing import Any
from .models import AnalysisGridCell
# Default federated Copernicus Data Space Ecosystem openEO endpoint.
DEFAULT_OPENEO_BACKEND_URL = "https://openeofed.dataspace.copernicus.eu"
# Provider label stored in result metadata (see compute_remote_sensing_metrics).
DEFAULT_OPENEO_PROVIDER = "openeo"
# Backend collection ids, one per metric family.
SENTINEL2_COLLECTION = "SENTINEL2_L2A"
SENTINEL3_LST_COLLECTION = "SENTINEL3_SLSTR_L2_LST"
SENTINEL1_COLLECTION = "SENTINEL1_GRD"
COPERNICUS_DEM_COLLECTION = "COPERNICUS_30"
# Sentinel-2 scene-classification (SCL) classes treated as valid pixels when
# masking (presumably vegetation / bare soil / water per the ESA SCL legend —
# TODO confirm against the collection docs).
VALID_SCL_CLASSES = (4, 5, 6)
# Canonical metric keys; every per-cell payload carries all of them (None when
# a metric is unavailable). `soil_vv_db` is derived from `soil_vv`.
METRIC_NAMES = (
    "ndvi",
    "ndwi",
    "lst_c",
    "soil_vv",
    "soil_vv_db",
    "dem_m",
    "slope_deg",
)
class OpenEOServiceError(Exception):
    """Root of the exception hierarchy for openEO service failures."""
class OpenEOAuthenticationError(OpenEOServiceError):
    """Signals that authenticating against the openEO backend did not succeed."""
class OpenEOExecutionError(OpenEOServiceError):
    """Signals that a metric process graph could not be executed successfully."""
@dataclass(frozen=True)
class OpenEOConnectionSettings:
    """Immutable connection/auth configuration for an openEO backend.

    All fields can be populated from `OPENEO_*` environment variables via
    :meth:`from_env`; string values are stripped of surrounding whitespace.
    """

    backend_url: str = DEFAULT_OPENEO_BACKEND_URL
    auth_method: str = "client_credentials"
    client_id: str = ""
    client_secret: str = ""
    provider_id: str = ""
    username: str = ""
    password: str = ""
    allow_interactive_oidc: bool = False

    @classmethod
    def from_env(cls) -> "OpenEOConnectionSettings":
        """Build settings from environment variables, with sensible defaults."""

        def env(name: str, fallback: str = "") -> str:
            return os.environ.get(name, fallback).strip()

        interactive = env("OPENEO_ALLOW_INTERACTIVE_OIDC", "0").lower()
        return cls(
            backend_url=env("OPENEO_BACKEND_URL", DEFAULT_OPENEO_BACKEND_URL),
            auth_method=env("OPENEO_AUTH_METHOD", "client_credentials").lower(),
            client_id=env("OPENEO_AUTH_CLIENT_ID"),
            client_secret=env("OPENEO_AUTH_CLIENT_SECRET"),
            provider_id=env("OPENEO_AUTH_PROVIDER_ID"),
            username=env("OPENEO_USERNAME"),
            password=env("OPENEO_PASSWORD"),
            allow_interactive_oidc=interactive in {"1", "true", "yes", "on"},
        )
def connect_openeo(settings: OpenEOConnectionSettings | None = None):
    """
    Build an authenticated openEO connection using environment-driven configuration.

    Preferred authentication mode in production is OIDC client credentials.

    Args:
        settings: Explicit settings; when omitted they are read from the
            `OPENEO_*` environment variables.

    Returns:
        The authenticated openEO connection object.

    Raises:
        OpenEOServiceError: if the `openeo` client library is not installed.
        OpenEOAuthenticationError: if configuration is incomplete, the auth
            method is unknown, or the backend rejects the credentials.
    """
    settings = settings or OpenEOConnectionSettings.from_env()
    try:
        import openeo
    except ImportError as exc:  # pragma: no cover - runtime dependency guard
        raise OpenEOServiceError("The `openeo` Python client is required for remote sensing jobs.") from exc
    connection = openeo.connect(settings.backend_url)
    try:
        if settings.auth_method == "client_credentials":
            if not settings.client_id or not settings.client_secret:
                raise OpenEOAuthenticationError(
                    "OPENEO_AUTH_CLIENT_ID and OPENEO_AUTH_CLIENT_SECRET must be configured."
                )
            auth_kwargs = {
                "client_id": settings.client_id,
                "client_secret": settings.client_secret,
            }
            if settings.provider_id:
                auth_kwargs["provider_id"] = settings.provider_id
            return connection.authenticate_oidc_client_credentials(**auth_kwargs)
        if settings.auth_method == "password":
            if not settings.username or not settings.password:
                raise OpenEOAuthenticationError(
                    "OPENEO_USERNAME and OPENEO_PASSWORD must be configured for password auth."
                )
            auth_kwargs = {
                "username": settings.username,
                "password": settings.password,
            }
            if settings.provider_id:
                auth_kwargs["provider_id"] = settings.provider_id
            return connection.authenticate_oidc_resource_owner_password_credentials(**auth_kwargs)
        if settings.auth_method == "oidc":
            # Interactive flow is opt-in only; headless workers must not block on it.
            if not settings.allow_interactive_oidc:
                raise OpenEOAuthenticationError(
                    "Interactive OIDC auth is disabled. Use client credentials in Celery workers."
                )
            auth_kwargs = {}
            if settings.provider_id:
                auth_kwargs["provider_id"] = settings.provider_id
            return connection.authenticate_oidc(**auth_kwargs)
        raise OpenEOAuthenticationError(f"Unsupported OPENEO_AUTH_METHOD: {settings.auth_method}")
    except OpenEOServiceError:
        # Our own, already-specific errors pass through unwrapped
        # (replaces the original `isinstance` check inside a broad handler).
        raise
    except Exception as exc:
        raise OpenEOAuthenticationError(f"Failed to authenticate with openEO backend: {exc}") from exc
def build_feature_collection(cells: list[AnalysisGridCell]) -> dict[str, Any]:
    """Wrap analysis grid cells into a GeoJSON FeatureCollection keyed by cell code."""
    return {
        "type": "FeatureCollection",
        "features": [
            {
                "type": "Feature",
                "id": cell.cell_code,
                "properties": {
                    "cell_code": cell.cell_code,
                    "block_code": cell.block_code,
                    "soil_location_id": cell.soil_location_id,
                },
                "geometry": cell.geometry,
            }
            for cell in cells
        ],
    }
def build_spatial_extent(cells: list[AnalysisGridCell]) -> dict[str, float]:
    """Compute the bounding box covering the first ring of every cell geometry.

    Only the first coordinate ring of each (Polygon-style) GeoJSON geometry is
    scanned; missing geometries are tolerated and simply contribute nothing.

    Returns:
        Mapping with `west`/`south`/`east`/`north` floats, suitable for an
        openEO `spatial_extent` argument.

    Raises:
        ValueError: if `cells` is empty or no coordinates could be extracted
            from any geometry (previously this surfaced as an opaque
            `TypeError` from `float(None)`).
    """
    if not cells:
        raise ValueError("At least one analysis grid cell is required.")
    west = east = south = north = None
    for cell in cells:
        # Exterior ring of a GeoJSON Polygon; `or` guards absent geometry/coords.
        coordinates = ((cell.geometry or {}).get("coordinates") or [[]])[0]
        for lon, lat in coordinates:
            west = lon if west is None else min(west, lon)
            east = lon if east is None else max(east, lon)
            south = lat if south is None else min(south, lat)
            north = lat if north is None else max(north, lat)
    if west is None:
        raise ValueError("No coordinates found in the provided grid cell geometries.")
    return {
        "west": float(west),
        "south": float(south),
        "east": float(east),
        "north": float(north),
    }
def build_empty_metric_payload() -> dict[str, Any]:
    """Return a fresh payload with every known metric name mapped to None."""
    return dict.fromkeys(METRIC_NAMES)
def initialize_metric_result_map(cells: list[AnalysisGridCell]) -> dict[str, dict[str, Any]]:
    """Build a cell_code -> empty metric payload mapping for the given cells."""
    result_map: dict[str, dict[str, Any]] = {}
    for cell in cells:
        result_map[cell.cell_code] = build_empty_metric_payload()
    return result_map
def compute_remote_sensing_metrics(
    cells: list[AnalysisGridCell],
    *,
    temporal_start: date | str,
    temporal_end: date | str,
    connection=None,
) -> dict[str, Any]:
    """
    Compute all requested remote sensing metrics in batch mode per metric.

    Returns a normalized structure keyed by `cell_code`, plus execution metadata
    that can be stored by Celery tasks and Django models.

    Args:
        cells: Grid cells to aggregate over; an empty list short-circuits to an
            empty result without contacting the backend.
        temporal_start: Start of the temporal extent (date or ISO string).
        temporal_end: End of the temporal extent (date or ISO string).
        connection: Optional pre-authenticated openEO connection; one is
            created via `connect_openeo()` when omitted.

    Raises:
        OpenEOExecutionError: when any metric other than `slope_deg` fails;
            slope failures are recorded as non-fatal in
            `metadata["failed_metrics"]` instead.
    """
    if not cells:
        return {
            "results": {},
            "metadata": {
                "backend": DEFAULT_OPENEO_PROVIDER,
                "collections_used": [],
                "slope_supported": False,
                "job_refs": {},
                "failed_metrics": [],
            },
        }
    connection = connection or connect_openeo()
    feature_collection = build_feature_collection(cells)
    spatial_extent = build_spatial_extent(cells)
    results = initialize_metric_result_map(cells)
    metadata = {
        "backend": DEFAULT_OPENEO_PROVIDER,
        # NOTE(review): this records the module default even when a caller
        # supplies a connection to a different backend — confirm intent.
        "backend_url": DEFAULT_OPENEO_BACKEND_URL,
        "collections_used": [
            SENTINEL2_COLLECTION,
            SENTINEL3_LST_COLLECTION,
            SENTINEL1_COLLECTION,
            COPERNICUS_DEM_COLLECTION,
        ],
        "slope_supported": True,
        "job_refs": {},
        "failed_metrics": [],
    }
    # `soil_vv_db` is deliberately absent here: it is derived from `soil_vv` below.
    metric_runners = [
        ("ndvi", compute_ndvi),
        ("ndwi", compute_ndwi),
        ("lst_c", compute_lst_c),
        ("soil_vv", compute_soil_vv),
        ("dem_m", compute_dem_m),
        ("slope_deg", compute_slope_deg),
    ]
    for metric_name, runner in metric_runners:
        try:
            metric_payload = runner(
                connection=connection,
                feature_collection=feature_collection,
                spatial_extent=spatial_extent,
                temporal_start=temporal_start,
                temporal_end=temporal_end,
            )
            merge_metric_results(results, metric_payload["results"])
            metadata["job_refs"][metric_name] = metric_payload.get("job_ref")
            if metric_name == "slope_deg" and not metric_payload.get("supported", True):
                metadata["slope_supported"] = False
        except Exception as exc:
            if metric_name == "slope_deg":
                # Slope is best-effort: record the failure and keep going.
                metadata["slope_supported"] = False
                metadata["failed_metrics"].append(
                    {"metric": metric_name, "error": str(exc), "non_fatal": True}
                )
                continue
            raise OpenEOExecutionError(f"Failed to compute metric `{metric_name}`: {exc}") from exc
    # Derive the dB representation from the linear VV backscatter.
    # (`.values()` instead of `.items()`: the keys were never used.)
    for payload in results.values():
        payload["soil_vv_db"] = linear_to_db(payload.get("soil_vv"))
    return {"results": results, "metadata": metadata}
def compute_ndvi(*, connection, feature_collection, spatial_extent, temporal_start, temporal_end) -> dict[str, Any]:
    """Mean NDVI per grid cell from Sentinel-2 L2A, masked to valid SCL classes."""
    temporal_extent = [_normalize_date(temporal_start), _normalize_date(temporal_end)]
    cube = connection.load_collection(
        SENTINEL2_COLLECTION,
        spatial_extent=spatial_extent,
        temporal_extent=temporal_extent,
        bands=["B03", "B04", "B08", "SCL"],
    )
    scene_classes = cube.band("SCL")
    # A pixel is invalid when its SCL class is none of the valid ones.
    invalid_pixels = (
        (scene_classes != VALID_SCL_CLASSES[0])
        & (scene_classes != VALID_SCL_CLASSES[1])
        & (scene_classes != VALID_SCL_CLASSES[2])
    )
    red_reflectance = cube.band("B04") * 0.0001
    nir_reflectance = cube.band("B08") * 0.0001
    ndvi = (nir_reflectance - red_reflectance) / (nir_reflectance + red_reflectance)
    masked_ndvi = ndvi.mask(invalid_pixels.resample_cube_spatial(red_reflectance))
    aggregated = (
        masked_ndvi.mean_time()
        .aggregate_spatial(geometries=feature_collection, reducer="mean")
        .execute()
    )
    return {"results": parse_aggregate_spatial_response(aggregated, "ndvi")}
def compute_ndwi(*, connection, feature_collection, spatial_extent, temporal_start, temporal_end) -> dict[str, Any]:
    """Mean NDWI (green/NIR normalized difference) per grid cell from Sentinel-2 L2A."""
    temporal_extent = [_normalize_date(temporal_start), _normalize_date(temporal_end)]
    cube = connection.load_collection(
        SENTINEL2_COLLECTION,
        spatial_extent=spatial_extent,
        temporal_extent=temporal_extent,
        bands=["B03", "B08", "SCL"],
    )
    scene_classes = cube.band("SCL")
    invalid_pixels = (
        (scene_classes != VALID_SCL_CLASSES[0])
        & (scene_classes != VALID_SCL_CLASSES[1])
        & (scene_classes != VALID_SCL_CLASSES[2])
    )
    green_reflectance = cube.band("B03") * 0.0001
    nir_reflectance = cube.band("B08") * 0.0001
    ndwi = (green_reflectance - nir_reflectance) / (green_reflectance + nir_reflectance)
    masked_ndwi = ndwi.mask(invalid_pixels.resample_cube_spatial(green_reflectance))
    aggregated = (
        masked_ndwi.mean_time()
        .aggregate_spatial(geometries=feature_collection, reducer="mean")
        .execute()
    )
    return {"results": parse_aggregate_spatial_response(aggregated, "ndwi")}
def compute_lst_c(*, connection, feature_collection, spatial_extent, temporal_start, temporal_end) -> dict[str, Any]:
    """Mean land-surface temperature per grid cell, converted from Kelvin to Celsius.

    Uses Sentinel-3 SLSTR L2 LST. The band name is backend-specific, so it is
    inferred from the cube metadata with a preference order.
    """
    cube = connection.load_collection(
        SENTINEL3_LST_COLLECTION,
        spatial_extent=spatial_extent,
        temporal_extent=[_normalize_date(temporal_start), _normalize_date(temporal_end)],
    )
    # Fix: the original preference tuple listed "LST" twice; the duplicate was
    # dead since the first match wins.
    band_name = infer_band_name(cube, preferred=("LST", "LST_in", "band_0"))
    lst_k = cube.band(band_name) if band_name else cube
    lst_c = lst_k - 273.15  # Kelvin -> Celsius
    aggregated = lst_c.mean_time().aggregate_spatial(geometries=feature_collection, reducer="mean").execute()
    return {"results": parse_aggregate_spatial_response(aggregated, "lst_c")}
def compute_soil_vv(*, connection, feature_collection, spatial_extent, temporal_start, temporal_end) -> dict[str, Any]:
    """Mean Sentinel-1 GRD VV backscatter per grid cell (dB conversion happens downstream)."""
    temporal_extent = [_normalize_date(temporal_start), _normalize_date(temporal_end)]
    backscatter_cube = connection.load_collection(
        SENTINEL1_COLLECTION,
        spatial_extent=spatial_extent,
        temporal_extent=temporal_extent,
        bands=["VV"],
    )
    vv_band = backscatter_cube.band("VV")
    aggregated = (
        vv_band.mean_time()
        .aggregate_spatial(geometries=feature_collection, reducer="mean")
        .execute()
    )
    return {"results": parse_aggregate_spatial_response(aggregated, "soil_vv")}
def compute_dem_m(*, connection, feature_collection, spatial_extent, temporal_start, temporal_end) -> dict[str, Any]:
    """Mean elevation per grid cell from the Copernicus 30 DEM collection."""
    elevation_cube = connection.load_collection(
        COPERNICUS_DEM_COLLECTION,
        spatial_extent=spatial_extent,
        temporal_extent=[_normalize_date(temporal_start), _normalize_date(temporal_end)],
    )
    chosen_band = infer_band_name(elevation_cube, preferred=("DEM", "elevation", "band_0"))
    elevation = elevation_cube.band(chosen_band) if chosen_band else elevation_cube
    # No temporal reduction: the DEM cube is aggregated spatially as-is.
    aggregated = elevation.aggregate_spatial(geometries=feature_collection, reducer="mean").execute()
    return {"results": parse_aggregate_spatial_response(aggregated, "dem_m")}
def compute_slope_deg(*, connection, feature_collection, spatial_extent, temporal_start, temporal_end) -> dict[str, Any]:
    """Mean terrain slope (degrees) per grid cell derived from the Copernicus DEM.

    Slope support is backend-specific: any failure yields a payload of None
    values with `supported=False` so callers can degrade gracefully.
    """
    dem_cube = connection.load_collection(
        COPERNICUS_DEM_COLLECTION,
        spatial_extent=spatial_extent,
        temporal_extent=[_normalize_date(temporal_start), _normalize_date(temporal_end)],
    )
    chosen_band = infer_band_name(dem_cube, preferred=("DEM", "elevation", "band_0"))
    elevation = dem_cube.band(chosen_band) if chosen_band else dem_cube
    try:
        degrees_per_radian = 180.0 / math.pi
        slope_in_degrees = elevation.slope() * degrees_per_radian
        aggregated = slope_in_degrees.aggregate_spatial(
            geometries=feature_collection, reducer="mean"
        ).execute()
        return {
            "results": parse_aggregate_spatial_response(aggregated, "slope_deg"),
            "supported": True,
        }
    except Exception:
        # Best-effort: report "unsupported" with empty per-cell payloads.
        empty_payloads = {
            feature["id"]: {"slope_deg": None}
            for feature in feature_collection.get("features", [])
        }
        return {"results": empty_payloads, "supported": False}
def parse_aggregate_spatial_response(payload: Any, metric_name: str) -> dict[str, dict[str, Any]]:
    """
    Parse different JSON shapes returned by openEO aggregate_spatial executions.
    """
    if payload is None:
        return {}
    if isinstance(payload, dict):
        # Both an explicit FeatureCollection type and a bare `features` key
        # take the GeoJSON path; everything else is a plain id->value mapping.
        if payload.get("type") == "FeatureCollection" or "features" in payload:
            return _parse_feature_collection_results(payload, metric_name)
        return _parse_mapping_results(payload, metric_name)
    if isinstance(payload, list):
        return _parse_list_results(payload, metric_name)
    raise OpenEOExecutionError(f"Unsupported openEO aggregate_spatial response type: {type(payload)!r}")
def _parse_feature_collection_results(payload: dict[str, Any], metric_name: str) -> dict[str, dict[str, Any]]:
    """Extract per-feature metric values from a GeoJSON FeatureCollection response.

    Feature identity is resolved from `id`, then `properties.cell_code`, then
    `properties.id`. Features with no usable identifier are skipped.
    """
    results: dict[str, dict[str, Any]] = {}
    for feature in payload.get("features", []):
        properties = feature.get("properties") or {}
        raw_id = (
            feature.get("id")
            or properties.get("cell_code")
            or properties.get("id")
        )
        # Bug fix: previously str() was applied before the emptiness check, so
        # a missing id became the truthy string "None" and was never skipped.
        if raw_id is None:
            continue
        value = _extract_aggregate_value(properties)
        results[str(raw_id)] = {metric_name: _coerce_float(value)}
    return results
def _parse_mapping_results(payload: dict[str, Any], metric_name: str) -> dict[str, dict[str, Any]]:
    """Parse a plain id->value mapping, delegating when values live under `data`."""
    if isinstance(payload.get("data"), (dict, list)):
        return parse_aggregate_spatial_response(payload["data"], metric_name)
    reserved_keys = {"type", "links", "meta"}
    return {
        str(feature_id): {metric_name: _coerce_float(_extract_aggregate_value(value))}
        for feature_id, value in payload.items()
        if feature_id not in reserved_keys
    }
def _parse_list_results(payload: list[Any], metric_name: str) -> dict[str, dict[str, Any]]:
    """Parse a positional list response, keying by explicit ids when present."""
    results: dict[str, dict[str, Any]] = {}
    for position, item in enumerate(payload):
        if not isinstance(item, dict):
            # Bare scalar: key by list position.
            results[str(position)] = {metric_name: _coerce_float(item)}
            continue
        identifier = item.get("id") or item.get("cell_code") or item.get("feature_id") or position
        results[str(identifier)] = {metric_name: _coerce_float(_extract_aggregate_value(item))}
    return results
def _extract_aggregate_value(value: Any) -> Any:
    """Drill into nested dict/list response fragments until a scalar remains.

    Dicts are probed for the keys mean/value/result/average (in that order),
    single-entry dicts are unwrapped, lists yield their first element, and
    anything else is returned as-is. Unresolvable dicts yield None.
    """
    if isinstance(value, dict):
        for candidate_key in ("mean", "value", "result", "average"):
            if candidate_key in value:
                return _extract_aggregate_value(value[candidate_key])
        if len(value) == 1:
            (only_entry,) = value.values()
            return _extract_aggregate_value(only_entry)
        return None
    if isinstance(value, list):
        return _extract_aggregate_value(value[0]) if value else None
    return value
def merge_metric_results(target: dict[str, dict[str, Any]], updates: dict[str, dict[str, Any]]) -> None:
    """Merge per-metric updates into `target` in place, creating payloads as needed."""
    for cell_code, metric_values in updates.items():
        payload = target.setdefault(cell_code, build_empty_metric_payload())
        payload.update(metric_values)
def linear_to_db(value: Any) -> float | None:
    """Convert a linear power value to decibels, rounded to 6 places.

    Returns None when the input is missing, non-numeric, or non-positive
    (log10 is undefined there).
    """
    numeric = _coerce_float(value)
    if numeric is None:
        return None
    if numeric <= 0:
        return None
    return round(10.0 * math.log10(numeric), 6)
def infer_band_name(cube, preferred: tuple[str, ...]) -> str | None:
    """
    Best-effort band name selection for collections with backend-specific naming.

    Args:
        cube: An openEO data cube; only `cube.metadata.band_dimension.bands`
            is read, defensively via `getattr`.
        preferred: Candidate names checked in order; the first match wins.

    Returns:
        The first preferred name that is available, else the first available
        band name, else None when band metadata is missing entirely.
    """
    metadata = getattr(cube, "metadata", None)
    if metadata is None:
        return None
    band_dimension = getattr(metadata, "band_dimension", None)
    bands = getattr(band_dimension, "bands", None)
    if not bands:
        return None
    # Idiom: comprehension instead of the manual append loop (PERF401).
    available = [getattr(band, "name", None) or str(band) for band in bands]
    for candidate in preferred:
        if candidate in available:
            return candidate
    # `available` has one entry per band and bands is non-empty here, so the
    # original trailing `if available else None` was dead code.
    return available[0]
def _coerce_float(value: Any) -> float | None:
    """Convert `value` to float; None and unconvertible inputs yield None."""
    if value is None:
        return None
    if isinstance(value, Decimal):
        return float(value)
    try:
        coerced = float(value)
    except (TypeError, ValueError):
        return None
    return coerced
def _normalize_date(value: date | str) -> str:
    """Render a `date` as ISO-8601; pass anything else through `str` unchanged."""
    return value.isoformat() if isinstance(value, date) else str(value)