2 changes: 2 additions & 0 deletions .gitignore
@@ -1,4 +1,6 @@
.venv
/venv
__pycache__
**/__pycache__
*.egg-info
.pytest_cache
4 changes: 4 additions & 0 deletions changelog_entry.yaml
@@ -0,0 +1,4 @@
- bump: patch
changes:
added:
- Added GCP logs in Household and Metadata services to assist further investigation of the 502 errors.
141 changes: 135 additions & 6 deletions policyengine_api/endpoints/household.py
@@ -11,6 +11,9 @@
import json
import logging
from datetime import date
from policyengine_api.structured_logger import get_logger, log_struct

logger = get_logger()
from policyengine_api.utils.payload_validators import validate_country


@@ -88,14 +91,61 @@ def get_household_under_policy(

api_version = COUNTRY_PACKAGE_VERSIONS.get(country_id)

# Look in computed_households to see if already computed
# Log start of request
log_struct(
event="get_household_under_policy_start",
input_data={
"country_id": country_id,
Collaborator: issue, blocking: Could you create a request_id value (or something like that) that we can then pass all the way through the logs to make debugging the entire flow easier?

Collaborator: This comment applies throughout the PR.

Collaborator Author: Yes, we can generate a request_id.
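A minimal sketch of that idea, assuming Flask's request-scoped g object and uuid4; the helper name get_request_id is illustrative, not part of this PR:

import uuid

from flask import g


def get_request_id() -> str:
    # Generate one id per request and reuse it, so every log line
    # emitted while handling that request carries the same value.
    if not hasattr(g, "request_id"):
        g.request_id = str(uuid.uuid4())
    return g.request_id


# Each log_struct call would then include it alongside the other fields:
# input_data={"request_id": get_request_id(), "country_id": country_id, ...}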
"household_id": household_id,
"policy_id": policy_id,
"api_version": api_version,
"request_path": request.path,
},
message="Started processing household under policy request.",
severity="INFO",
logger=logger, # optional if you've already called get_logger()
)

row = local_database.query(
f"SELECT * FROM computed_household WHERE household_id = ? AND policy_id = ? AND api_version = ?",
(household_id, policy_id, api_version),
).fetchone()
# Look in computed_household cache table
try:
row = local_database.query(
f"SELECT * FROM computed_household WHERE household_id = ? AND policy_id = ? AND api_version = ?",
(household_id, policy_id, api_version),
).fetchone()
except Exception as e:
log_struct(
event="computed_household_query_failed",
input_data={
"household_id": household_id,
"policy_id": policy_id,
"api_version": api_version,
},
message=f"Database query failed: {e}",
severity="ERROR",
)
return Response(
json.dumps(
{
"status": "error",
"message": "Internal server error while querying computed_household.",
}
),
status=500,
mimetype="application/json",
)

if row is not None:
log_struct(
event="cached_computed_household_found",
input_data={
"household_id": household_id,
"policy_id": policy_id,
"api_version": api_version,
},
message="Found precomputed household result in cache.",
severity="INFO",
)

result = dict(
policy_id=row["policy_id"],
household_id=row["household_id"],
@@ -122,7 +172,27 @@ def get_household_under_policy(
if row is not None:
household = dict(row)
household["household_json"] = json.loads(household["household_json"])
log_struct(
event="household_data_loaded",
input_data={
"household_id": household_id,
"country_id": country_id,
Collaborator: suggestion: I'd prefer if we defined all of the values to be included here in one place, then consistently passed them into all logs. E.g., here we have only household_id and country_id, but at another point, some logs don't have country_id and do have policy_id and household_id.

Also, doing so and just deconstructing an object of values into input_data would remove some duplicative code and improve readability.

Collaborator: This comment applies throughout the changes.

Collaborator Author: Noted - we've implemented a centralized context object containing all relevant IDs, which we now pass into input_data for every log, eliminating duplication and improving readability.
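A sketch of that centralized approach; the PR's actual context object isn't shown in this diff, so the log_context name is an assumption:

# Build the shared fields once, near the top of the endpoint...
log_context = {
    "country_id": country_id,
    "household_id": household_id,
    "policy_id": policy_id,
    "api_version": api_version,
}

# ...then deconstruct it into input_data for every log call.
log_struct(
    event="household_data_loaded",
    input_data={**log_context},
    message="Loaded household data from DB.",
    severity="INFO",
)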
},
message="Loaded household data from DB.",
severity="INFO",
)

else:
log_struct(
event="household_not_found",
input_data={
"household_id": household_id,
"country_id": country_id,
},
message=f"Household #{household_id} not found.",
severity="WARNING",
)

response_body = dict(
status="error",
message=f"Household #{household_id} not found.",
@@ -168,7 +238,28 @@ def get_household_under_policy(
household_id,
policy_id,
)

log_struct(
event="calculation_success",
input_data={
"household_id": household_id,
"policy_id": policy_id,
},
message="Household calculation succeeded.",
severity="INFO",
)

except Exception as e:
log_struct(
event="calculation_failed",
input_data={
"household_id": household_id,
"policy_id": policy_id,
},
message=f"Calculation failed: {e}",
severity="ERROR",
)

logging.exception(e)
response_body = dict(
status="error",
@@ -193,7 +284,27 @@ def get_household_under_policy(
api_version,
),
)
except Exception:
log_struct(
event="computed_household_inserted",
input_data={
"household_id": household_id,
"policy_id": policy_id,
},
message="Inserted new computed_household record.",
severity="INFO",
)

except Exception as e:
log_struct(
event="computed_household_insert_failed_updating",
input_data={
"household_id": household_id,
"policy_id": policy_id,
},
message=f"Insert failed; updated existing record instead. Error: {e}",
severity="ERROR",
)

# Update the result if it already exists
local_database.query(
f"UPDATE computed_household SET computed_household_json = ? WHERE country_id = ? AND household_id = ? AND policy_id = ?",
@@ -227,7 +338,25 @@ def get_calculate(country_id: str, add_missing: bool = False) -> dict:

try:
result = country.calculate(household_json, policy_json)
log_struct(
event="calculation_success",
Collaborator: suggestion: Distinguish between endpoint types in the event name. E.g., calculation_success refers to two different events, one with database storage underneath and one without.

Collaborator: This comment applies throughout the PR.

Collaborator Author: Agreed - we've updated the event names to clearly distinguish endpoint types.
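One way the renamed events might look; these names are hypothetical, since the follow-up commit isn't part of this diff:

# Stateful endpoint, where the result is also cached in computed_household:
log_struct(
    event="household_under_policy.calculation_success",
    input_data={"household_id": household_id, "policy_id": policy_id},
    message="Household calculation succeeded.",
    severity="INFO",
)

# Stateless /calculate endpoint, with no database storage underneath:
log_struct(
    event="calculate.calculation_success",
    input_data={"country_id": country_id},
    message="Calculation completed successfully.",
    severity="INFO",
)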
input_data={
"country_id": country_id,
},
message="Calculation completed successfully.",
severity="INFO",
)

except Exception as e:
log_struct(
event="calculation_failed",
input_data={
"country_id": country_id,
},
message=f"Error calculating household under policy: {e}",
severity="ERROR",
)

logging.exception(e)
response_body = dict(
status="error",
60 changes: 55 additions & 5 deletions policyengine_api/services/metadata_service.py
@@ -1,12 +1,62 @@
from policyengine_api.country import COUNTRIES
from policyengine_api.structured_logger import get_logger, log_struct

logger = get_logger()


class MetadataService:
def get_metadata(self, country_id: str) -> dict:
country = COUNTRIES.get(country_id)
if country == None:
raise RuntimeError(
f"Attempted to get metadata for a nonexistant country: '{country_id}'"

# Log the metadata retrieval attempt
log_struct(
event="MetadataService.get_metadata_called",
input_data={
"country_id": country_id,
},
message="Metadata retrieval called.",
severity="INFO",
)

try:
country = COUNTRIES.get(country_id)
if country == None:
error_msg = f"Attempted to get metadata for a nonexistant country: '{country_id}'"
log_struct(
event="MetadataService.get_metadata_failed",
input_data={
"country_id": country_id,
"error": error_msg,
},
message=f"Metadata successfully retrieved for country_id '{country_id}'",
Collaborator: issue, blocking: I believe this error message is incorrect.
severity="ERROR",
)

raise RuntimeError(error_msg)
Collaborator: issue, blocking: I'm not sure I'd raise here. This will return a 500 SERVER ERROR instead of the more apt 404 NOT FOUND. I'd recommend returning a structured response instead.

Collaborator Author: Understood - for now, we'll revert to the existing production code, since changes in /metadata_routes.py are also required; we can implement and test the update once the lower environment is ready.
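A sketch of the structured response the reviewer suggests, reusing the Response pattern from household.py; the helper name and route wiring are assumptions, since metadata_routes.py isn't part of this diff:

import json

from flask import Response


def metadata_not_found(country_id: str) -> Response:
    # Return a structured 404 instead of raising, so an unknown
    # country_id doesn't surface as a 500 SERVER ERROR.
    return Response(
        json.dumps(
            {
                "status": "error",
                "message": f"Country '{country_id}' not found.",
            }
        ),
        status=404,
        mimetype="application/json",
    )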

metadata = country.metadata

log_struct(
event="MetadataService.get_metadata_success",
input_data={
"country_id": country_id,
},
message="Metadata successfully retrieved.",
severity="INFO",
)

return country.metadata
return metadata

except Exception as e:
log_struct(
event="MetadataService.get_metadata_exception",
input_data={
"country_id": country_id,
"error": str(e),
},
message="Exception occurred while retrieving metadata.",
severity="ERROR",
)

raise RuntimeError(
f"Unexpected error retrieving metadata for country_id '{country_id}': {e}"
) from e
58 changes: 58 additions & 0 deletions policyengine_api/structured_logger.py
@@ -0,0 +1,58 @@
import logging
import json
import sys

# Only import if using GCP logging
try:
from google.cloud import logging as gcp_logging
from google.cloud.logging.handlers import CloudLoggingHandler
except ImportError:
gcp_logging = None
CloudLoggingHandler = None


class JsonFormatter(logging.Formatter):
"""Formatter that outputs logs as structured JSON."""

def format(self, record):
log_record = {
"severity": record.levelname,
"event": getattr(record, "event", None),
"input": getattr(record, "input", None),
"message": record.getMessage(),
}
if record.exc_info:
log_record["exception"] = self.formatException(record.exc_info)
return json.dumps(log_record)


def get_logger(name="policyengine-api", level=logging.INFO):
logger = logging.getLogger(name)
logger.setLevel(level)

# If no handlers are set, add a StreamHandler with JSON formatting
if not logger.handlers:
handler = logging.StreamHandler(sys.stdout)
Collaborator: question: I'm curious if this worked in GCP correctly. I believe you said you tested locally and it does; is that correct?

Collaborator Author: I've tested it locally and confirmed the logger outputs JSON in the terminal; if you want, we can also verify the logs in GCP Logs Explorer once the lower environment is set up.

Collaborator: I would argue that creating and sending a GCP log to the prod server is a low-risk activity for the following reasons:

  • It shouldn't impact the service itself
  • If configured properly, it shouldn't delete any logs

Prior to the deployment of any QA environments, and assuming you have the necessary permissions, could you write a Python script using the relevant log-writing snippet to confirm that this structure logs correctly to GCP? I'd have my money on it logging everything as a massive piece of text.

Collaborator Author: @anth-volk - I tested it by sending logs from local and it's working correctly; the logs are showing up as structured JSON with the expected fields instead of one large text string in Logs Explorer. (screenshot: log)
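A sketch of the verification script discussed above, assuming google-cloud-logging is installed and application-default credentials are configured; the logger name is arbitrary:

from google.cloud import logging as gcp_logging

client = gcp_logging.Client()  # resolves the project from the environment
gcp_logger = client.logger("policyengine-api-smoke-test")

# log_struct sends a jsonPayload rather than a flat textPayload, so the
# fields remain individually queryable in Logs Explorer.
gcp_logger.log_struct(
    {
        "event": "structured_logging_smoke_test",
        "input": {"country_id": "us"},
        "message": "Verifying structured JSON logging from local.",
    },
    severity="INFO",
)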
handler.setFormatter(JsonFormatter())
logger.addHandler(handler)

# If using GCP logging, add a CloudLoggingHandler
# For more advanced GCP integration, consider enabling CloudLoggingHandler.
# if gcp_logging and CloudLoggingHandler:
# client = gcp_logging.Client()
# gcp_handler = CloudLoggingHandler(client, name=name)
# gcp_handler.setFormatter(JsonFormatter()) # Optional
# logger.addHandler(gcp_handler)
Collaborator: comment: I'd recommend getting rid of this if not reusing somehow.

Collaborator Author: done

return logger


def log_struct(event, input_data, message, severity="INFO", logger=None):
"""
Implementation-agnostic structured logger.
"""
if logger is None:
logger = get_logger()

log_func = getattr(logger, severity.lower(), logger.info)
log_func(message, extra={"event": event, "input": input_data})
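For reference, a minimal local run of the module as written; each call emits one JSON object per line on stdout:

logger = get_logger()
log_struct(
    event="example_event",
    input_data={"country_id": "uk"},
    message="Hello from the structured logger.",
    severity="INFO",
    logger=logger,
)
# -> {"severity": "INFO", "event": "example_event", "input": {"country_id": "uk"}, "message": "Hello from the structured logger."}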