akash418 committed
Commit cabea5c · 1 Parent(s): 6972c11
__pycache__/screenshot.cpython-37.pyc ADDED
Binary file (2.97 kB).
 
__pycache__/spaces_info.cpython-37.pyc ADDED
Binary file (2.99 kB).
 
app.py CHANGED
@@ -2,6 +2,7 @@ import gradio as gr
 import requests
 import json
 import os
+from transformers import
 from screenshot import (
     before_prompt,
     prompt_to_generation,
@@ -10,11 +11,13 @@ from screenshot import (
     js_load_script,
 )
 from spaces_info import description, examples, initial_prompt_value
+from transformers import pipeline, AutoModelForCausalLM, AutoTokenizer, set_seed
+
 
 #API_URL = os.getenv("API_URL")
 #HF_API_TOKEN = os.getenv("HF_API_TOKEN")
 
-API_URL = "https://api-inference.huggingface.co/models/bigscience/bloom-560m"
+API_URL = "https://api-inference.huggingface.co/models/hf-internal-testing/tiny-random-bloom"
 HF_API_TOKEN = "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"
 
 def query(payload):
@@ -30,7 +33,7 @@ def inference(input_sentence, max_length, sample_or_greedy, seed=42):
             "max_new_tokens": max_length,
             "top_p": 0.9,
             "do_sample": True,
-            "seed": seed,
+            #"seed": seed,
             "early_stopping": False,
             "length_penalty": 0.0,
             "eos_token_id": None,
@@ -39,29 +42,43 @@ def inference(input_sentence, max_length, sample_or_greedy, seed=42):
         parameters = {
             "max_new_tokens": max_length,
             "do_sample": False,
-            "seed": seed,
+            #"seed": seed,
             "early_stopping": False,
             "length_penalty": 0.0,
             "eos_token_id": None,
         }
 
     payload = {"inputs": input_sentence, "parameters": parameters,"options" : {"use_cache": False} }
+    model_name = 'bigscience/bloomz-560m'
+    pipe = pipeline("text-generation",
+                    model = model_name,
+                    tokenizer = model_name,
+                    max_new_tokens = max_length,
+                    do_sample = False,
+                    length_penalty = 0.0,
+                    early_stopping = False,
+                    eos_token_id = None
+                    )
+    res = pipe(input_sentence)
+    generation = res["generated_text"]
 
-    data = query(payload)
+    #data = query(payload)
 
-    if "error" in data:
-        return (None, None, f"<span style='color:red'>ERROR: {data['error']} </span>")
+    #if "error" in data:
+    #    return (None, None, f"<span style='color:red'>ERROR: {data['error']} </span>")
 
-    generation = data[0]["generated_text"].split(input_sentence, 1)[1]
-    return (
-        before_prompt
-        + input_sentence
-        + prompt_to_generation
-        + generation
-        + after_generation,
-        data[0]["generated_text"],
-        "",
-    )
+    #generation = data[0]["generated_text"].split(input_sentence, 1)[1]
+
+    # return (
+    #     before_prompt
+    #     + input_sentence
+    #     + prompt_to_generation
+    #     + generation
+    #     + after_generation,
+    #     data[0]["generated_text"],
+    #     "",
+    # )
+    return generation
 
 
 if __name__ == "__main__":
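Two details in the new code path are easy to trip over: the import added by the first hunk (`from transformers import`) is incomplete as rendered, and a transformers text-generation pipeline returns a list of dicts (one per generated sequence), so `res["generated_text"]` on that list raises a `TypeError`. A minimal sketch of the new local-generation path with both points addressed, assuming the `bigscience/bloomz-560m` checkpoint named in the diff:

from transformers import pipeline

# Build the pipeline once at module load; constructing it inside
# inference(), as the committed code does, reloads the model on every call.
model_name = "bigscience/bloomz-560m"
pipe = pipeline("text-generation", model=model_name, tokenizer=model_name)

def inference(input_sentence, max_length=64):
    # Greedy decoding, mirroring the do_sample=False parameters in the diff.
    res = pipe(input_sentence, max_new_tokens=max_length, do_sample=False)
    # The pipeline returns [{"generated_text": ...}]; index the first result.
    return res[0]["generated_text"]

print(inference("The weather today is"))

Hoisting the pipeline out of inference() also keeps the Gradio request path responsive once the model has loaded.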
requirements.txt ADDED
@@ -0,0 +1,2 @@
+transformers
+accelerate
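These two requirements back the local-pipeline path added to app.py. For completeness, the hosted Inference API path that the commit comments out (`data = query(payload)`) works roughly as below; the body of `query()` is not shown in the diff, so this is a sketch assuming the standard Inference API request shape, with the token read from the environment as the commented-out `os.getenv` lines in app.py intend:

import os
import requests

API_URL = "https://api-inference.huggingface.co/models/hf-internal-testing/tiny-random-bloom"
headers = {"Authorization": f"Bearer {os.getenv('HF_API_TOKEN')}"}

def query(payload):
    # POST the prompt and generation parameters to the hosted model endpoint.
    response = requests.post(API_URL, headers=headers, json=payload)
    return response.json()

# Same payload shape the diff builds in inference().
payload = {
    "inputs": "Hello, my name is",
    "parameters": {"max_new_tokens": 10},
    "options": {"use_cache": False},
}
print(query(payload))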