{
  "model_details": {
    "provider": "vertex",
    "model_requested": "gemini-3-flash-preview",
    "model_for_requests": "google/gemini-3-flash-preview",
    "api_base_url": "https://aiplatform.googleapis.com/v1/projects/gen-lang-client-0461875984/locations/global/endpoints/openapi",
    "chat_completions_endpoint": "https://aiplatform.googleapis.com/v1/projects/gen-lang-client-0461875984/locations/global/endpoints/openapi/chat/completions",
    "vertex_cache_model": "projects/gen-lang-client-0461875984/locations/global/publishers/google/models/gemini-3-flash-preview"
  },
  "cache_padding": {
    "enabled": true,
    "target_shared_prefix_tokens": 1200,
    "calibration_shared_prefix_tokens": 496,
    "target_prompt_tokens": 1200,
    "calibration_prompt_tokens": 496,
    "calibration_example_id": "water-3",
    "applied_padding_tokens_estimate": 302,
    "examples_with_padding_applied": 1200
  },
  "request_control_summary": {
    "configured": {
      "thinking_level": "minimal"
    },
    "attempts_total": 1316,
    "attempts_with_control_telemetry": 1182,
    "per_control": {
      "reasoning_effort": {
        "configured_value": null,
        "requested_attempts": 0,
        "sent_attempts": 0,
        "accepted_attempts": 0,
        "rejected_attempts": 0,
        "missing_from_final_request_attempts": 0,
        "acceptance_rate": null,
        "rejected_reasons": {},
        "rejected_example_ids": []
      },
      "thinking_level": {
        "configured_value": "minimal",
        "requested_attempts": 1182,
        "sent_attempts": 1182,
        "accepted_attempts": 1182,
        "rejected_attempts": 0,
        "missing_from_final_request_attempts": 0,
        "acceptance_rate": 1.0,
        "rejected_reasons": {},
        "rejected_example_ids": []
      },
      "effort": {
        "configured_value": null,
        "requested_attempts": 0,
        "sent_attempts": 0,
        "accepted_attempts": 0,
        "rejected_attempts": 0,
        "missing_from_final_request_attempts": 0,
        "acceptance_rate": null,
        "rejected_reasons": {},
        "rejected_example_ids": []
      },
      "verbosity": {
        "configured_value": null,
        "requested_attempts": 0,
        "sent_attempts": 0,
        "accepted_attempts": 0,
        "rejected_attempts": 0,
        "missing_from_final_request_attempts": 0,
        "acceptance_rate": null,
        "rejected_reasons": {},
        "rejected_example_ids": []
      },
      "prompt_cache_key": {
        "configured_value": null,
        "requested_attempts": 0,
        "sent_attempts": 0,
        "accepted_attempts": 0,
        "rejected_attempts": 0,
        "missing_from_final_request_attempts": 0,
        "acceptance_rate": null,
        "rejected_reasons": {},
        "rejected_example_ids": []
      },
      "gemini_cached_content": {
        "configured_value": null,
        "requested_attempts": 0,
        "sent_attempts": 0,
        "accepted_attempts": 0,
        "rejected_attempts": 0,
        "missing_from_final_request_attempts": 0,
        "acceptance_rate": null,
        "rejected_reasons": {},
        "rejected_example_ids": []
      },
      "requesty_auto_cache": {
        "configured_value": null,
        "requested_attempts": 0,
        "sent_attempts": 0,
        "accepted_attempts": 0,
        "rejected_attempts": 0,
        "missing_from_final_request_attempts": 0,
        "acceptance_rate": null,
        "rejected_reasons": {},
        "rejected_example_ids": []
      }
    }
  },
  "usage_metadata_summary": {
    "attempts_total": 1316,
    "attempts_with_usage_metadata": 1182,
    "attempts_with_cached_token_signals": 0,
    "cached_tokens_total_estimate": 0,
    "cache_read_tokens_total": 0,
    "cache_write_tokens_total": 0,
    "cache_token_fields_totals": {},
    "attempts_with_gemini_cached_content_token_signals": 0,
    "gemini_cached_content_token_count_total": 0,
    "gemini_cached_content_token_fields_totals": {}
  },
  "token_usage_totals": {
    "attempts_total": 1316,
    "attempts_with_token_usage": 1182,
    "attempts_with_output_tokens": 1182,
    "attempts_with_cached_input_tokens": 0,
    "attempts_with_thinking_tokens": 0,
    "input_tokens_total": 1597210,
    "cached_input_tokens_total": 0,
    "non_cached_input_tokens_total": 1597210,
    "output_tokens_total": 184244,
    "thinking_tokens_total": 0,
    "output_tokens_definition": "total_tokens - prompt_tokens (or completion_tokens + thinking_tokens fallback)"
  },
  "truth_label_count": 1200,
  "prediction_count": 1200,
  "evaluated_example_count": 1200,
  "calibration_metrics": {
    "available": true,
    "sample_count": 1182,
    "bin_count": 10,
    "ece": 0.02106598984772024,
    "mce": 0.3416666666666667,
    "brier_score": 0.026831641285956005
  },
  "first_prompt_timestamp": "2026-03-10T20:18:02.213187Z",
  "last_prompt_timestamp": "2026-03-10T20:42:40.400510Z",
  "overall_time_seconds": 1478.187323,
  "overall_time_human": "24m 38s",
  "accuracy": 0.955,
  "macro_precision": 0.6341371824209353,
  "macro_recall": 0.6360927622140594,
  "macro_f1": 0.6349124730020009,
  "per_label": {
    "plural": {
      "precision": 0.9157894736842105,
      "recall": 0.9525547445255474,
      "f1": 0.9338103756708408,
      "support": 274
    },
    "singular": {
      "precision": 0.9866220735785953,
      "recall": 0.9557235421166307,
      "f1": 0.9709270433351619,
      "support": 926
    },
    "unclassified": {
      "precision": 0.0,
      "recall": 0.0,
      "f1": 0.0,
      "support": 0
    }
  },
  "confusion_matrix": {
    "plural": {
      "plural": 261,
      "singular": 12,
      "unclassified": 1
    },
    "singular": {
      "plural": 24,
      "singular": 885,
      "unclassified": 17
    },
    "unclassified": {
      "plural": 0,
      "singular": 0,
      "unclassified": 0
    }
  },
  "labels": [
    "plural",
    "singular",
    "unclassified"
  ],
  "total_examples": 1200,
  "label_metrics_available": true,
  "run_config": {
    "task_name": "OE number",
    "prompt_layout": "standard",
    "task_description": "Determining  grammatical number (sg./pl.) in Old English nouns.",
    "tags": "Old English;morphology;number"
  },
  "source_input_csv": "",
  "source_output_csv": "data/output/OE_number__vertex__gemini3flashpreview__2026-03-10-21-17.csv",
  "source_labels_csv": ""
}
