{
  "model_details": {
    "provider": "e-infra",
    "model_requested": "qwen3.5",
    "model_for_requests": "qwen3.5",
    "api_base_url": "https://llm.ai.e-infra.cz/v1",
    "chat_completions_endpoint": "https://llm.ai.e-infra.cz/v1/chat/completions"
  },
  "run_config": {
    "input": [
      "data/input/prepositions.csv"
    ],
    "labels": "",
    "task_name": "Err. correct. prepositions",
    "task_description": "Correcting errors in prepositions in a transcription of learners' dialogue.",
    "tags": "error;correction;preposition;English",
    "model": "qwen3.5",
    "temperature": null,
    "top_p": null,
    "top_k": null,
    "service_tier": "standard",
    "verbosity": null,
    "reasoning_effort": null,
    "thinking_level": null,
    "effort": null,
    "strict_control_acceptance": true,
    "provider": "e-infra",
    "system_prompt": "You are a meticulous annotator focusing on grammatical errors in the use of prepositions.\nYou will receive a short excerpt of a transcribed dialogue where the node word is a preposition.\nDecide whether it is a correct preposition given the context.\n\nReturn the correct preposition (even if it already is correct). \nIf the preposition should be omitted (i.e. the grammatical correct solution is leaving it out), return 0.\n\nIn your decisions, follow these rules:\n- Do not correct unless necessary: if the preposition is acceptable, even if non-standard (but used in a variety of English) or less idiomatic. In such cases return the preposition as is.\n- Expect spoken language features such as fragments, disfluencies, repetitions, and false starts; treat transcription artifacts (e.g. <B>, </B>, <overlap />, pauses, broken words) as signals of turn structure rather than reliable syntax. If the preposition appears within a short turn delimited by <B> and </B>, prioritize interpreting it within that turn rather than relying on the broader context. \n- If a correct preposition is repeated, which usually signals hesitation, do not correct it. In such cases return the preposition as is. \n- If the speaker self-corrects, evaluate the final intended form.\n- Expect other errors in tense, word choice, or sentence structure, and if the issue is not the preposition itself, do not correct it. In such cases return the preposition as is.\n- If multiple prepositions are possible and none is clearly wrong, do not correct it. In such cases return the preposition as is.",
    "system_prompt_b64": null,
    "few_shot_examples": 0,
    "prompt_layout": "standard",
    "cache_pad_target_tokens": 0,
    "prompt_cache_key": null,
    "gemini_cached_content": null,
    "requesty_auto_cache": null,
    "vertex_auto_adc_login": null,
    "vertex_access_token_refresh_seconds": null,
    "create_gemini_cache": false,
    "gemini_cache_ttl": 3600,
    "gemini_cache_ttl_autoupdate": true,
    "keep_gemini_cache": false,
    "enable_cot": true,
    "no_explanation": false,
    "logprobs": true,
    "calibration": true,
    "confusion_heatmap": true,
    "api_key_var": "E-INFRA_API_KEY",
    "api_base_var": "E-INFRA_BASE_URL",
    "max_retries": 3,
    "retry_delay": 5.0,
    "request_interval_ms": 0,
    "request_timeout_seconds": 600.0,
    "threads": 3,
    "prompt_log_detail": "full",
    "flush_rows": 100,
    "flush_seconds": 2.0,
    "validator_cmd": null,
    "validator_args": "",
    "validator_timeout": 5.0,
    "validator_prompt_max_candidates": 50,
    "validator_prompt_max_chars": 8000,
    "validator_exhausted_policy": "accept_blank_confidence",
    "validator_debug": false,
    "log_level": "INFO"
  },
  "source_input_csv": "data/input/prepositions.csv",
  "source_output_csv": "data/output/prepositions__einfra__qwen35__2026-04-04-12-31.csv",
  "source_labels_csv": "",
  "cache_padding": {
    "enabled": false,
    "target_shared_prefix_tokens": 0,
    "calibration_shared_prefix_tokens": null,
    "target_prompt_tokens": 0,
    "calibration_prompt_tokens": null,
    "calibration_example_id": null,
    "applied_padding_tokens_estimate": 0,
    "examples_with_padding_applied": 0
  },
  "request_control_summary": {
    "configured": {},
    "attempts_total": 1402,
    "attempts_with_control_telemetry": 1375,
    "per_control": {
      "reasoning_effort": {
        "configured_value": null,
        "requested_attempts": 0,
        "sent_attempts": 0,
        "accepted_attempts": 0,
        "rejected_attempts": 0,
        "missing_from_final_request_attempts": 0,
        "acceptance_rate": null,
        "rejected_reasons": {},
        "rejected_example_ids": []
      },
      "thinking_level": {
        "configured_value": null,
        "requested_attempts": 0,
        "sent_attempts": 0,
        "accepted_attempts": 0,
        "rejected_attempts": 0,
        "missing_from_final_request_attempts": 0,
        "acceptance_rate": null,
        "rejected_reasons": {},
        "rejected_example_ids": []
      },
      "effort": {
        "configured_value": null,
        "requested_attempts": 0,
        "sent_attempts": 0,
        "accepted_attempts": 0,
        "rejected_attempts": 0,
        "missing_from_final_request_attempts": 0,
        "acceptance_rate": null,
        "rejected_reasons": {},
        "rejected_example_ids": []
      },
      "verbosity": {
        "configured_value": null,
        "requested_attempts": 0,
        "sent_attempts": 0,
        "accepted_attempts": 0,
        "rejected_attempts": 0,
        "missing_from_final_request_attempts": 0,
        "acceptance_rate": null,
        "rejected_reasons": {},
        "rejected_example_ids": []
      },
      "prompt_cache_key": {
        "configured_value": null,
        "requested_attempts": 0,
        "sent_attempts": 0,
        "accepted_attempts": 0,
        "rejected_attempts": 0,
        "missing_from_final_request_attempts": 0,
        "acceptance_rate": null,
        "rejected_reasons": {},
        "rejected_example_ids": []
      },
      "gemini_cached_content": {
        "configured_value": null,
        "requested_attempts": 0,
        "sent_attempts": 0,
        "accepted_attempts": 0,
        "rejected_attempts": 0,
        "missing_from_final_request_attempts": 0,
        "acceptance_rate": null,
        "rejected_reasons": {},
        "rejected_example_ids": []
      },
      "requesty_auto_cache": {
        "configured_value": null,
        "requested_attempts": 0,
        "sent_attempts": 0,
        "accepted_attempts": 0,
        "rejected_attempts": 0,
        "missing_from_final_request_attempts": 0,
        "acceptance_rate": null,
        "rejected_reasons": {},
        "rejected_example_ids": []
      }
    }
  },
  "usage_metadata_summary": {
    "attempts_total": 1402,
    "attempts_with_usage_metadata": 1375,
    "attempts_with_cached_token_signals": 0,
    "cached_tokens_total_estimate": 0,
    "cache_read_tokens_total": 0,
    "cache_write_tokens_total": 0,
    "cache_token_fields_totals": {},
    "attempts_with_gemini_cached_content_token_signals": 0,
    "gemini_cached_content_token_count_total": 0,
    "gemini_cached_content_token_fields_totals": {}
  },
  "token_usage_totals": {
    "attempts_total": 1402,
    "attempts_with_token_usage": 1375,
    "attempts_with_output_tokens": 1375,
    "attempts_with_cached_input_tokens": 0,
    "attempts_with_thinking_tokens": 0,
    "input_tokens_total": 1205752,
    "cached_input_tokens_total": 0,
    "non_cached_input_tokens_total": 1205752,
    "output_tokens_total": 3889029,
    "thinking_tokens_total": 0,
    "output_tokens_definition": "total_tokens - prompt_tokens (or completion_tokens + thinking_tokens fallback)"
  },
  "truth_label_count": 1283,
  "prediction_count": 1283,
  "evaluated_example_count": 1283,
  "calibration_metrics": {
    "available": true,
    "sample_count": 1237,
    "bin_count": 10,
    "ece": 0.06569118835894076,
    "mce": 0.3916666666666668,
    "brier_score": 0.08632821341956314
  },
  "first_prompt_timestamp": "2026-04-04T10:31:49.198333Z",
  "last_prompt_timestamp": "2026-04-04T12:47:46.833694Z",
  "overall_time_seconds": 8157.635361,
  "overall_time_human": "2h 15m 58s",
  "accuracy": 0.9033515198752923,
  "cohen_kappa": 0.7803725157791852,
  "macro_precision": 0.5803088737271155,
  "macro_recall": 0.4577276302911533,
  "macro_f1": 0.4822783726198404,
  "per_label": {
    "0": {
      "precision": 0.5357142857142857,
      "recall": 0.6,
      "f1": 0.5660377358490566,
      "support": 25
    },
    "about": {
      "precision": 1.0,
      "recall": 0.5,
      "f1": 0.6666666666666666,
      "support": 2
    },
    "around": {
      "precision": 0.0,
      "recall": 0.0,
      "f1": 0.0,
      "support": 1
    },
    "as": {
      "precision": 1.0,
      "recall": 1.0,
      "f1": 1.0,
      "support": 1
    },
    "at": {
      "precision": 0.9312169312169312,
      "recall": 0.8756218905472637,
      "f1": 0.9025641025641026,
      "support": 201
    },
    "behind": {
      "precision": 1.0,
      "recall": 1.0,
      "f1": 1.0,
      "support": 1
    },
    "during": {
      "precision": 0.0,
      "recall": 0.0,
      "f1": 0.0,
      "support": 4
    },
    "from": {
      "precision": 1.0,
      "recall": 0.5,
      "f1": 0.6666666666666666,
      "support": 2
    },
    "in": {
      "precision": 0.9284210526315789,
      "recall": 0.9597388465723613,
      "f1": 0.9438202247191012,
      "support": 919
    },
    "into": {
      "precision": 0.0,
      "recall": 0.0,
      "f1": 0.0,
      "support": 1
    },
    "of": {
      "precision": 0.0,
      "recall": 0.0,
      "f1": 0.0,
      "support": 2
    },
    "on": {
      "precision": 0.7289719626168224,
      "recall": 0.8478260869565217,
      "f1": 0.7839195979899496,
      "support": 92
    },
    "to": {
      "precision": 1.0,
      "recall": 0.125,
      "f1": 0.2222222222222222,
      "support": 32
    },
    "with": {
      "precision": 0.0,
      "recall": 0.0,
      "f1": 0.0,
      "support": 0
    }
  },
  "labels": [
    "0",
    "about",
    "around",
    "as",
    "at",
    "behind",
    "during",
    "from",
    "in",
    "into",
    "of",
    "on",
    "to",
    "with"
  ],
  "label_count": 14,
  "total_examples": 1283,
  "confusion_matrix": {
    "0": {
      "0": 15,
      "about": 0,
      "around": 0,
      "as": 0,
      "at": 1,
      "behind": 0,
      "during": 0,
      "from": 0,
      "in": 7,
      "into": 0,
      "of": 0,
      "on": 2,
      "to": 0,
      "with": 0
    },
    "about": {
      "0": 0,
      "about": 1,
      "around": 0,
      "as": 0,
      "at": 0,
      "behind": 0,
      "during": 0,
      "from": 0,
      "in": 1,
      "into": 0,
      "of": 0,
      "on": 0,
      "to": 0,
      "with": 0
    },
    "around": {
      "0": 0,
      "about": 0,
      "around": 0,
      "as": 0,
      "at": 0,
      "behind": 0,
      "during": 0,
      "from": 0,
      "in": 1,
      "into": 0,
      "of": 0,
      "on": 0,
      "to": 0,
      "with": 0
    },
    "as": {
      "0": 0,
      "about": 0,
      "around": 0,
      "as": 1,
      "at": 0,
      "behind": 0,
      "during": 0,
      "from": 0,
      "in": 0,
      "into": 0,
      "of": 0,
      "on": 0,
      "to": 0,
      "with": 0
    },
    "at": {
      "0": 1,
      "about": 0,
      "around": 0,
      "as": 0,
      "at": 176,
      "behind": 0,
      "during": 0,
      "from": 0,
      "in": 17,
      "into": 0,
      "of": 0,
      "on": 7,
      "to": 0,
      "with": 0
    },
    "behind": {
      "0": 0,
      "about": 0,
      "around": 0,
      "as": 0,
      "at": 0,
      "behind": 1,
      "during": 0,
      "from": 0,
      "in": 0,
      "into": 0,
      "of": 0,
      "on": 0,
      "to": 0,
      "with": 0
    },
    "during": {
      "0": 0,
      "about": 0,
      "around": 0,
      "as": 0,
      "at": 0,
      "behind": 0,
      "during": 0,
      "from": 0,
      "in": 3,
      "into": 0,
      "of": 0,
      "on": 1,
      "to": 0,
      "with": 0
    },
    "from": {
      "0": 0,
      "about": 0,
      "around": 0,
      "as": 0,
      "at": 0,
      "behind": 0,
      "during": 0,
      "from": 1,
      "in": 1,
      "into": 0,
      "of": 0,
      "on": 0,
      "to": 0,
      "with": 0
    },
    "in": {
      "0": 9,
      "about": 0,
      "around": 0,
      "as": 0,
      "at": 11,
      "behind": 0,
      "during": 0,
      "from": 0,
      "in": 882,
      "into": 0,
      "of": 0,
      "on": 17,
      "to": 0,
      "with": 0
    },
    "into": {
      "0": 0,
      "about": 0,
      "around": 0,
      "as": 0,
      "at": 0,
      "behind": 0,
      "during": 0,
      "from": 0,
      "in": 1,
      "into": 0,
      "of": 0,
      "on": 0,
      "to": 0,
      "with": 0
    },
    "of": {
      "0": 0,
      "about": 0,
      "around": 0,
      "as": 0,
      "at": 0,
      "behind": 0,
      "during": 0,
      "from": 0,
      "in": 1,
      "into": 0,
      "of": 0,
      "on": 1,
      "to": 0,
      "with": 0
    },
    "on": {
      "0": 3,
      "about": 0,
      "around": 0,
      "as": 0,
      "at": 0,
      "behind": 0,
      "during": 0,
      "from": 0,
      "in": 11,
      "into": 0,
      "of": 0,
      "on": 78,
      "to": 0,
      "with": 0
    },
    "to": {
      "0": 0,
      "about": 0,
      "around": 0,
      "as": 0,
      "at": 1,
      "behind": 0,
      "during": 0,
      "from": 0,
      "in": 25,
      "into": 0,
      "of": 0,
      "on": 1,
      "to": 4,
      "with": 1
    },
    "with": {
      "0": 0,
      "about": 0,
      "around": 0,
      "as": 0,
      "at": 0,
      "behind": 0,
      "during": 0,
      "from": 0,
      "in": 0,
      "into": 0,
      "of": 0,
      "on": 0,
      "to": 0,
      "with": 0
    }
  },
  "label_metrics_available": true
}