saadkhi committed
Commit 60e496e · verified · 1 Parent(s): a93df3d

Update app.py

Files changed (1):
  1. app.py +7 -2
app.py CHANGED

@@ -26,9 +26,12 @@ print("Loading model...")
 # Load base model
 # ─────────────────────────
 
-# load config first and REMOVE quantization
+# Load config
 config = AutoConfig.from_pretrained(BASE_MODEL, trust_remote_code=True)
-config.quantization_config = None # 🔴 important fix
+
+# 🔴 IMPORTANT FIX
+# Replace quantization config with empty dict (NOT None)
+config.quantization_config = {}
 
 model = AutoModelForCausalLM.from_pretrained(
     BASE_MODEL,
@@ -46,9 +49,11 @@ print("Merging LoRA...")
 model = model.merge_and_unload()
 
 tokenizer = AutoTokenizer.from_pretrained(BASE_MODEL)
+
 model.eval()
 print("Model ready")
 
+
 # ─────────────────────────
 # Inference
 # ─────────────────────────
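For context, the sketch below reconstructs the load-and-merge flow around the patched lines, with the commit's empty-dict fix in place. It is an assumption-laden sketch, not the actual app.py: it assumes transformers, peft, and torch are installed; BASE_MODEL and ADAPTER_MODEL are placeholder repo ids; and the torch_dtype / device_map arguments are illustrative choices not taken from the original file.

# Minimal sketch (assumptions, not the actual app.py): load a base model whose
# saved config declares quantization, clear that config as in the commit, merge
# a LoRA adapter, and prepare for inference.
import torch
from transformers import AutoConfig, AutoModelForCausalLM, AutoTokenizer
from peft import PeftModel

BASE_MODEL = "org/base-model"          # placeholder repo id
ADAPTER_MODEL = "org/lora-adapter"     # placeholder repo id

print("Loading model...")

# Load config
config = AutoConfig.from_pretrained(BASE_MODEL, trust_remote_code=True)

# 🔴 IMPORTANT FIX (as in the commit)
# Replace quantization config with empty dict (NOT None)
config.quantization_config = {}

model = AutoModelForCausalLM.from_pretrained(
    BASE_MODEL,
    config=config,                # pass the patched config
    torch_dtype=torch.float16,    # illustrative dtype
    device_map="auto",            # illustrative device placement
    trust_remote_code=True,
)

# Attach the LoRA adapter, then fold its weights into the base model
model = PeftModel.from_pretrained(model, ADAPTER_MODEL)
print("Merging LoRA...")
model = model.merge_and_unload()

tokenizer = AutoTokenizer.from_pretrained(BASE_MODEL)

model.eval()
print("Model ready")

Note that the only functional change in the commit is the value assigned to config.quantization_config ({} instead of None); the remaining added and removed lines are comment and blank-line adjustments.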