osmankoc committed
Commit 8358801 · 1 Parent(s): 039fbc1

fix according to zoa llm

Files changed (1): app.py (+19 -16)
app.py CHANGED
@@ -18,25 +18,28 @@ def generate(prompt):
      {"role": "system", "content": "You are an HTML Web Developer. Generate HTML code using the Tailwind CSS framework and Shadcn UI components. Add HTML tags to the code. Don't forget to use the correct classes. Don't write inline styles and descriptions."},
      {"role": "user", "content": prompt}
  ]
- text = tokenizer.apply_chat_template(
-     messages,
-     tokenize=False,
-     add_generation_prompt=True
- )
- model_inputs = tokenizer([text], return_tensors="pt").to("cuda")
-
- # output = model.generate(**inputs, max_length=2500)
- # response = tokenizer.decode(output[0], skip_special_tokens=True)
-
- generated_ids = model.generate(
-     **model_inputs,
-     max_new_tokens=512
- )
- generated_ids = [
-     output_ids[len(input_ids):] for input_ids, output_ids in zip(model_inputs.input_ids, generated_ids)
- ]
-
- response = tokenizer.batch_decode(generated_ids, skip_special_tokens=True)[0]
+ # text = tokenizer.apply_chat_template(
+ #     messages,
+ #     tokenize=False,
+ #     add_generation_prompt=True
+ # )
+
+ inputs = tokenizer(messages, return_tensors="pt").to("cuda")
+
+ output = model.generate(**inputs, max_length=2500)
+ response = tokenizer.decode(output[0], skip_special_tokens=True)
+
+ # model_inputs = tokenizer([text], return_tensors="pt").to("cuda")
+
+ # generated_ids = model.generate(
+ #     **model_inputs,
+ #     max_new_tokens=512
+ # )
+ # generated_ids = [
+ #     output_ids[len(input_ids):] for input_ids, output_ids in zip(model_inputs.input_ids, generated_ids)
+ # ]
+
+ # response = tokenizer.batch_decode(generated_ids, skip_special_tokens=True)[0]

  return response
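For reference, the path this commit comments out is the pattern the transformers documentation recommends for chat models: render `messages` with `tokenizer.apply_chat_template` before tokenizing. The new `inputs = tokenizer(messages, return_tensors="pt")` line passes a list of role/content dicts straight to the tokenizer, which Hugging Face tokenizers generally reject, since they expect strings. Below is a minimal sketch of the chat-template path, reassembled from the lines this commit removes; the checkpoint name is a placeholder assumption, as app.py's model loading is not shown in this diff.

```python
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

# Placeholder checkpoint; the actual model used by app.py is not in this diff.
MODEL_ID = "Qwen/Qwen2-7B-Instruct"

tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
model = AutoModelForCausalLM.from_pretrained(
    MODEL_ID, torch_dtype=torch.float16
).to("cuda")

def generate(prompt):
    messages = [
        {"role": "system", "content": "You are an HTML Web Developer. Generate HTML code using the Tailwind CSS framework and Shadcn UI components."},
        {"role": "user", "content": prompt},
    ]
    # Render the chat into the model's expected prompt string; tokenizers
    # cannot consume a list of role/content dicts directly.
    text = tokenizer.apply_chat_template(
        messages, tokenize=False, add_generation_prompt=True
    )
    model_inputs = tokenizer([text], return_tensors="pt").to("cuda")
    # max_new_tokens bounds only the completion, unlike max_length,
    # which also counts the prompt tokens.
    generated_ids = model.generate(**model_inputs, max_new_tokens=512)
    # Drop the echoed prompt tokens so only the completion is decoded.
    generated_ids = [
        out[len(inp):] for inp, out in zip(model_inputs.input_ids, generated_ids)
    ]
    return tokenizer.batch_decode(generated_ids, skip_special_tokens=True)[0]
```

One trade-off worth noting between the two versions: `max_new_tokens=512` reserves a fixed budget for the generated HTML, while `max_length=2500` counts the prompt tokens as well, so a long prompt silently shrinks the space left for output.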