(no commit message)

2026-04-25 15:15:05 -07:00
parent 39990697bb
commit 2946901428
3 changed files with 135 additions and 1 deletions
--- a/README.md
+++ b/README.md
@@ -1,2 +1,10 @@
-# writing-style-judge
+---
 a: 3.537087
 b: -1.616884
 is_arbiter: true
 probe_model: modaic/gpt-oss-120b-probe
 size: large
 supports_reasoning: true
 ---
 # writing-style-judge
--- a/config.json
+++ b/config.json
@@ -0,0 +1,73 @@
 {
  "model": null,
  "signature": {
    "$defs": {
      "Reasoning": {
        "type": "dspy.Reasoning"
      }
    },
    "description": "Evaluate whether this writing is good or bad for the life simulation game.\n\nJudge it as a deeply human problem: whether it is good enough, specific enough, and rewarding enough for the player.\n\nIdentify when the writing is too wordy, too cute with its phrasing, or dangles off into something nonspecific.\n\nPrefer writing that feels specific, meaningful, and reaches a logical arc conclusion rather than stopping at a flat or unrewarding next thing that happens.\n\nReturn a qualitative score, whether it passes overall, and the issues, or none if it passes.",
    "properties": {
      "text": {
        "__dspy_field_type": "input",
        "desc": "The generated writing to evaluate.",
        "prefix": "Text:",
        "title": "Text",
        "type": "string"
      },
      "scenario_context": {
        "__dspy_field_type": "input",
        "desc": "Context about the event, choice, or outcome so the writing can be judged in context.",
        "prefix": "Scenario Context:",
        "title": "Scenario Context",
        "type": "string"
      },
      "writing_quality_score": {
        "__dspy_field_type": "output",
        "desc": "A qualitative score for the writing (0-10).",
        "prefix": "Writing Quality Score:",
        "title": "Writing Quality Score",
        "type": "integer"
      },
      "passes": {
        "__dspy_field_type": "output",
        "desc": "Whether the writing passes overall.",
        "prefix": "Passes:",
        "title": "Passes",
        "type": "boolean"
      },
      "reasoning": {
        "$ref": "#/$defs/Reasoning",
        "__dspy_field_type": "output",
        "desc": "Your reasoning for your answer. Include any uncertainties about your answer or ambiguity in the task.",
        "prefix": "Reasoning:"
      },
      "issues": {
        "__dspy_field_type": "output",
        "desc": "Problems identified in the writing.",
        "enum": [
          "too_wordy",
          "too_cute",
          "nonspecific",
          "poor_writing",
          "weak_outcome",
          "unfulfilled_future",
          "none"
        ],
        "prefix": "Issues:",
        "title": "Issues",
        "type": "string"
      }
    },
    "required": [
      "text",
      "scenario_context",
      "writing_quality_score",
      "passes",
      "reasoning",
      "issues"
    ],
    "title": "StringSignature",
    "type": "object"
  }
 }
--- a/program.json
+++ b/program.json
@@ -0,0 +1,53 @@
 {
  "traces": [],
  "train": [],
  "demos": [],
  "signature": {
    "instructions": "Evaluate whether this writing is good or bad for the life simulation game.\n\nJudge it as a deeply human problem: whether it is good enough, specific enough, and rewarding enough for the player.\n\nIdentify when the writing is too wordy, too cute with its phrasing, or dangles off into something nonspecific.\n\nPrefer writing that feels specific, meaningful, and reaches a logical arc conclusion rather than stopping at a flat or unrewarding next thing that happens.\n\nReturn a qualitative score, whether it passes overall, and the issues, or none if it passes.",
    "fields": [
      {
        "prefix": "Text:",
        "description": "The generated writing to evaluate."
      },
      {
        "prefix": "Scenario Context:",
        "description": "Context about the event, choice, or outcome so the writing can be judged in context."
      },
      {
        "prefix": "Writing Quality Score:",
        "description": "A qualitative score for the writing (0-10)."
      },
      {
        "prefix": "Passes:",
        "description": "Whether the writing passes overall."
      },
      {
        "prefix": "Reasoning:",
        "description": "Your reasoning for your answer. Include any uncertainties about your answer or ambiguity in the task."
      },
      {
        "prefix": "Issues:",
        "description": "Problems identified in the writing."
      }
    ]
  },
  "lm": {
    "model": "openrouter/openai/gpt-oss-120b",
    "model_type": "chat",
    "cache": true,
    "num_retries": 3,
    "finetuning_model": null,
    "launch_kwargs": {},
    "train_kwargs": {},
    "temperature": null,
    "max_tokens": null,
    "base_url": "https://openrouter.ai/api/v1"
  },
  "metadata": {
    "dependency_versions": {
      "python": "3.13",
      "dspy": "3.2.0",
      "cloudpickle": "3.1"
    }
  }
 }