sql_query_env/models.py at main · rajdeepchatale/sql_query_env · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
"""
Pydantic models for the SQL environment's action/observation space.

We tried keeping the observation minimal at first but realized the agent
needs way more context to actually improve between steps - so we added
diagnostics, efficiency notes, history etc. Bit of a chonky payload but
it's all text so doesn't matter much for perf.
"""

from typing import Dict, List, Optional

from openenv.core.env_server.types import Action, Observation
from pydantic import Field


class SqlQueryAction(Action):
    """Agent submits a SQL query string."""

    query: str = Field(
        ...,
        description="SQL query to execute against the database. Must be a valid SELECT statement.",
    )


class SqlQueryObservation(Observation):
    """
    Full observation returned after each step.

    We pack a lot in here because the agent needs to understand what went
    wrong and how to fix it. The alternative was returning just a score,
    but that gives basically zero learning signal.
    """

    # task context
    task_id: str = Field(default="", description="Current task identifier")
    difficulty: str = Field(default="easy", description="easy, medium, or hard")
    database_domain: str = Field(
        default="company", description="Which database domain this task uses"
    )
    question: str = Field(default="", description="Natural language question to answer with SQL")
    schema_description: str = Field(
        default="", description="Full database schema with table definitions"
    )

    # query feedback
    query_result: str = Field(default="", description="Formatted result of the last query")
    query_error: Optional[str] = Field(default=None, description="SQL error message, if any")
    feedback: str = Field(default="", description="Detailed grading feedback")

    # structured diagnostics - these are the key differentiator
    diagnostics: List[Dict] = Field(
        default_factory=list,
        description="Structured error diagnostics: type, severity, message, suggestion",
    )
    efficiency_notes: List[str] = Field(
        default_factory=list,
        description="SQL best-practice tips based on the submitted query",
    )

    # hints to help the agent
    expected_row_count: int = Field(default=0, description="Expected number of result rows")
    expected_columns: List[str] = Field(default_factory=list, description="Expected column names")

    # episode progress
    steps_remaining: int = Field(default=0, description="Attempts left in this episode")
    current_score: float = Field(default=0.0, description="Best score so far (0.0-1.0)")
    history: List[Dict] = Field(default_factory=list, description="Previous queries and scores")