Spaces:

Eishaan
/

sql-migration-env

Sleeping

App Files Community

Eishaan committed about 1 month ago

Commit

ba3f47d

1 Parent(s): 5f32203

final: complete airtight hardening (strict constraints, numerical stability, performance metrics)

Browse files

Files changed (4) hide show

server/__pycache__/environment.cpython-312.pyc +0 -0
server/__pycache__/grader.cpython-312.pyc +0 -0
server/environment.py +12 -2
server/grader.py +58 -13

server/__pycache__/environment.cpython-312.pyc CHANGED Viewed

Binary files a/server/__pycache__/environment.cpython-312.pyc and b/server/__pycache__/environment.cpython-312.pyc differ

server/__pycache__/grader.cpython-312.pyc CHANGED Viewed

Binary files a/server/__pycache__/grader.cpython-312.pyc and b/server/__pycache__/grader.cpython-312.pyc differ

server/environment.py CHANGED Viewed

@@ -351,19 +351,27 @@ class DbMigrationEnvironment(Environment):
                 metadata={"error": "not_initialized"},
             )
         self._step_count += 1
         sql_command = action.sql_command.strip()
         # --- A3: Dangerous SQL Blacklist ---
         sql_lower = sql_command.lower()
         if re.search(r"pragma\s+foreign_keys\s*=\s*(off|0)", sql_lower):
-            execution_result = "Security Error: Disabling PRAGMA foreign_keys is strictly explicitly forbidden."
             action_error = "pragma_off_blocked"
         elif _DANGEROUS_PATTERNS.search(sql_command):
             execution_result = (
                 "Error: This SQL command is not allowed for security reasons. "
                 "ATTACH DATABASE, DETACH DATABASE, LOAD_EXTENSION, and "
-                "PRAGMA writable_schema are blocked."
             )
             action_error = "blocked_command"
         else:
@@ -443,10 +451,12 @@ class DbMigrationEnvironment(Environment):
         self._state.migration_progress = current_score
         # Build metadata with reasoning and debug info
         meta = {
             "reasoning": action.reasoning,
             "sql_executed": action.sql_command,
             "step": self._step_count,
         }
         if action_error:
             meta["error"] = action_error

                 metadata={"error": "not_initialized"},
             )
+        import time
+        start_time = time.time()
         self._step_count += 1
         sql_command = action.sql_command.strip()
         # --- A3: Dangerous SQL Blacklist ---
         sql_lower = sql_command.lower()
         if re.search(r"pragma\s+foreign_keys\s*=\s*(off|0)", sql_lower):
+            execution_result = (
+                "Security Error: Disabling PRAGMA foreign_keys is strictly forbidden. "
+                "Tip: To maintain integrity, perform your migration using temporary tables "
+                "or deferred constraints instead of disabling enforcement."
+            )
             action_error = "pragma_off_blocked"
         elif _DANGEROUS_PATTERNS.search(sql_command):
             execution_result = (
                 "Error: This SQL command is not allowed for security reasons. "
                 "ATTACH DATABASE, DETACH DATABASE, LOAD_EXTENSION, and "
+                "PRAGMA writable_schema are blocked. "
+                "Tip: Use standard DML (INSERT/UPDATE/DELETE) and DDL (CREATE/DROP) within a single database."
             )
             action_error = "blocked_command"
         else:
         self._state.migration_progress = current_score
         # Build metadata with reasoning and debug info
+        execution_ms = int((time.time() - start_time) * 1000)
         meta = {
             "reasoning": action.reasoning,
             "sql_executed": action.sql_command,
             "step": self._step_count,
+            "execution_ms": execution_ms,
         }
         if action_error:
             meta["error"] = action_error

server/grader.py CHANGED Viewed

@@ -47,9 +47,15 @@ def _get_table_names(conn: sqlite3.Connection) -> Set[str]:
 def _get_column_info(conn: sqlite3.Connection, table: str) -> List[dict]:
     """Get column info for a table. Returns list of {name, type, notnull, pk}."""
     try:
-        cursor = conn.execute(f"PRAGMA table_info({table})")
         return [
-            {"name": row[1].lower(), "type": row[2].upper(), "notnull": row[3], "pk": row[5]}
             for row in cursor.fetchall()
         ]
     except Exception:
@@ -61,9 +67,12 @@ def _get_column_names(conn: sqlite3.Connection, table: str) -> Set[str]:
     return {col["name"] for col in _get_column_info(conn, table)}
-def _get_column_signatures(conn: sqlite3.Connection, table: str) -> Set[Tuple[str, str]]:
-    """Get (name, type) tuples for strict schema grading."""
-    return {(col["name"], col["type"]) for col in _get_column_info(conn, table)}
 def _get_row_count(conn: sqlite3.Connection, table: str) -> int:
@@ -158,24 +167,60 @@ def _compare_row_data(
     # Per-row comparison (order-independent for flexibility)
     golden_set = set()
     for row in golden_rows:
-        # Normalize: convert all values to strings for loose comparison
-        golden_set.add(tuple(str(v).strip() if v is not None else "" for v in row))
     matched = 0
     for row in agent_rows:
-        normalized = tuple(str(v).strip() if v is not None else "" for v in row)
-        if normalized in golden_set:
-            matched += 1
-            golden_set.discard(normalized)
     if len(golden_rows) == 0:
-        content_match = 0.0
     else:
         content_match = matched / len(golden_rows)
     # Penalize extra rows (data bloat)
     if len(agent_rows) > len(golden_rows):
-        bloat_penalty = max(0, 1.0 - (len(agent_rows) - len(golden_rows)) / len(golden_rows))
         content_match *= bloat_penalty
     return 0.4 * count_match + 0.6 * content_match

 def _get_column_info(conn: sqlite3.Connection, table: str) -> List[dict]:
     """Get column info for a table. Returns list of {name, type, notnull, pk}."""
     try:
+        cursor = conn.execute(f"PRAGMA table_info([{table}])")
         return [
+            {
+                "name": row[1].lower(),
+                "type": row[2].upper(),
+                "notnull": row[3],
+                "dflt_value": row[4],  # Added check for default values
+                "pk": row[5]
+            }
             for row in cursor.fetchall()
         ]
     except Exception:
     return {col["name"] for col in _get_column_info(conn, table)}
+def _get_column_signatures(conn: sqlite3.Connection, table: str) -> Set[Tuple[str, str, int, Any]]:
+    """Get (name, type, notnull, dflt_value) tuples for absolute schema grading."""
+    return {
+        (col["name"], col["type"], col["notnull"], str(col["dflt_value"]))
+        for col in _get_column_info(conn, table)
+    }
 def _get_row_count(conn: sqlite3.Connection, table: str) -> int:
     # Per-row comparison (order-independent for flexibility)
     golden_set = set()
     for row in golden_rows:
+        # Normalize: try numerical comparison first, fallback to string
+        normalized_golden = []
+        for v in row:
+            if v is None: normalized_golden.append("")
+            else:
+                try:
+                    normalized_golden.append(float(v))
+                except (ValueError, TypeError):
+                    normalized_golden.append(str(v).strip())
+        golden_set.add(tuple(normalized_golden))
     matched = 0
     for row in agent_rows:
+        # Normalize: try numerical comparison first, fallback to string
+        normalized_agent = []
+        for v in row:
+            if v is None: normalized_agent.append("")
+            else:
+                try: # If it looks like a number, treat as a float for comparison
+                    normalized_agent.append(float(v))
+                except (ValueError, TypeError):
+                    normalized_agent.append(str(v).strip())
+        normalized_agent = tuple(normalized_agent)
+        # Look for match in golden set with numerical tolerance
+        found = False
+        for g_row in list(golden_set):
+            # Compare rows with float tolerance where applicable
+            match = True
+            if len(normalized_agent) != len(g_row): continue
+            for a_val, g_val in zip(normalized_agent, g_row):
+                if isinstance(a_val, float) and isinstance(g_val, float):
+                    if abs(a_val - g_val) > 1e-7:
+                        match = False; break
+                elif str(a_val) != str(g_val):
+                    match = False; break
+            if match:
+                matched += 1
+                golden_set.discard(g_row)
+                found = True
+                break
     if len(golden_rows) == 0:
+        content_match = 1.0 # Logic fix: if golden has no rows, agent with 0 rows is 1.0
     else:
         content_match = matched / len(golden_rows)
     # Penalize extra rows (data bloat)
     if len(agent_rows) > len(golden_rows):
+        # 1% penalty per extra row to prevent "guessing" by dumping all possible data
+        bloat_penalty = max(0.5, 1.0 - (len(agent_rows) - len(golden_rows)) * 0.01)
         content_match *= bloat_penalty
     return 0.4 * count_match + 0.6 * content_match