{
  "schema_version": "sensebench-run-v2",
  "run_id": "deepseek-v4-pro-high-reasoning-p002-lexen-v1-20260614",
  "created_at": "2026-06-14T18:31:09.158241+00:00",
  "git_commit": "acc066861d4500c1144a3bb5cea415f8c47b8389",
  "runner": {
    "github_handle": "vassiliphilippov",
    "name": "Vassili Philippov",
    "contact": null
  },
  "dataset": {
    "dataset_id": "lexen",
    "dataset_version": "lexen-v1",
    "dataset_revision": null,
    "content_hash": "sha256:5fd4382b93f19087a1e31f6dd7d1db17c1eb17ff80fcbe1d3fdd55c0c3ecefe8",
    "item_count": 4861
  },
  "prompt": {
    "id": "p002",
    "sensebench_version": "0.1.0"
  },
  "model": {
    "kind": "cloud_llm",
    "display_name": "openrouter/deepseek/deepseek-v4-pro",
    "requested_model": "openrouter/deepseek/deepseek-v4-pro",
    "resolved_model": "deepseek/deepseek-v4-pro-20260423",
    "resolved_model_counts": {
      "deepseek/deepseek-v4-pro-20260423": 4904
    },
    "llm_vendor": "DeepSeek",
    "api_provider": "OpenRouter",
    "source_kind": "open_source",
    "license": null,
    "model_url": null,
    "reasoning_effort": "high",
    "endpoint_base_url": null
  },
  "sampling": {
    "temperature": null,
    "top_p": null,
    "max_tokens": 8192,
    "seed": null,
    "extra": {}
  },
  "policy": {
    "votes_per_item": 1,
    "semantic_reasks_per_invalid_vote": 1,
    "tie_break": "earliest_vote",
    "monosemous_policy": "short_circuit",
    "shuffle_senses_per_vote": false
  },
  "machine": null,
  "execution": {
    "concurrency": 48,
    "warmup_call_count": 0,
    "timing": {
      "benchmark_started_at": "2026-06-14T18:08:04.702911+00:00",
      "benchmark_ended_at": "2026-06-14T18:31:09.155695+00:00",
      "benchmark_seconds": 1384.4682261659764,
      "setup_seconds": 0.9577432500082068
    }
  },
  "totals": {
    "item_count": 4861,
    "correct_count": 4448,
    "accuracy": 0.9150380580127546,
    "call_count": 4904,
    "usage": {
      "input_tokens": 1122876,
      "cached_input_tokens": 128,
      "output_tokens": 2067138,
      "reasoning_output_tokens": 2112679
    },
    "cost": {
      "currency": "USD",
      "total_usd": 6.501680728,
      "input_uncached_usd": 1.387367175,
      "input_cached_usd": null,
      "output_usd": 5.183211195,
      "input_uncached_unit_price_usd": null,
      "input_cached_unit_price_usd": null,
      "output_unit_price_usd": null,
      "source": "provider_reported"
    },
    "elapsed_seconds": 1384.4682261659764
  }
}
