feat: use larger model
app.py (CHANGED)
@@ -11,8 +11,8 @@ from transformers import (
 # ▸ For a causal code model (no T5 errors):
 # MODEL_ID = "Salesforce/codegen-350M-multi"
 # ▸ Or, for a seq‑to‑seq model:
-
-MODEL_ID = "google/flan-t5-small"
+MODEL_ID = "google/flan-t5-base"
+# MODEL_ID = "google/flan-t5-small"
 # MODEL_ID = "Salesforce/codegen-350M-multi"

 # ── 2) Load tokenizer + model ────────────────────────────────────────
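The hunk above only swaps the checkpoint name. For context, here is a minimal sketch of how the "2) Load tokenizer + model" section referenced in the last context line might build `pipe`, assuming a seq‑to‑seq setup with AutoModelForSeq2SeqLM and the text2text-generation task; everything except MODEL_ID and pipe (the tokenizer/model variable names and the max_new_tokens value) is an assumption, not taken from app.py.

# Sketch only: assumed shape of the "2) Load tokenizer + model" section.
from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, pipeline

MODEL_ID = "google/flan-t5-base"

tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
model = AutoModelForSeq2SeqLM.from_pretrained(MODEL_ID)  # flan-t5 is encoder-decoder

# A seq-to-seq checkpoint needs the "text2text-generation" task; the commented
# Salesforce/codegen-350M-multi alternative would instead need
# AutoModelForCausalLM and the "text-generation" task (hence "no T5 errors").
pipe = pipeline(
    "text2text-generation",
    model=model,
    tokenizer=tokenizer,
    max_new_tokens=256,  # assumed value, not shown in the diff
)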
@@ -46,10 +46,17 @@ def review_code(diff: str, guidelines: str):
         f"DIFF:\n{diff}\n\n"
         f"GUIDELINES:\n{guidelines}\n\n"
         "OUTPUT FORMAT EXAMPLE:\n"
-        '[{"line":12,"comment":"…"}]\n'
+        '[{"line":12,"comment":"…"}]\n\n'
+        "<<<END_JSON>>>\n"
     )

+    # Run the model
     out = pipe(prompt)[0]["generated_text"]
+
+    # Truncate at our stop marker, if present
+    if "<<<END_JSON>>>" in out:
+        out = out.split("<<<END_JSON>>>")[0]
+
     start = out.find("[")
     end = out.rfind("]") + 1
     if start < 0 or end < 0:
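The new <<<END_JSON>>> marker gives the post-processing a cheap stop signal before the bracket-slicing step. The hunk cuts off mid-parse; a sketch of how the rest of that step might look is below, with the helper name extract_review_comments and the empty-list fallbacks being assumptions. Note that because end is out.rfind("]") + 1, a missing "]" yields end == 0 rather than a negative value, so the guard in the sketch checks end <= 0.

import json

def extract_review_comments(out: str) -> list:
    """Parse model output into a list of {"line": int, "comment": str} dicts."""
    # Drop anything the model produced after the stop marker.
    if "<<<END_JSON>>>" in out:
        out = out.split("<<<END_JSON>>>")[0]

    # Slice out the outermost JSON array.
    start = out.find("[")
    end = out.rfind("]") + 1      # 0 when "]" is absent, since rfind returns -1
    if start < 0 or end <= 0:
        return []                 # assumed fallback; app.py is truncated here

    try:
        return json.loads(out[start:end])
    except json.JSONDecodeError:
        return []                 # assumed fallback for malformed JSON

In the committed file this logic sits inline inside review_code (per the hunk header) rather than in a separate helper; the function form here is only for illustration.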