futranbg committed on
Commit
4517722
·
1 Parent(s): 7c99e18

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +9 -9
app.py CHANGED
@@ -47,20 +47,20 @@ llm1 = HuggingFaceHub(repo_id=llama_repo, task="text-generation", model_kwargs=m
47
  llm2 = HuggingFaceHub(repo_id=starchat_repo, task="text-generation", model_kwargs=model_kwargs)
48
  llm3 = HuggingFaceHub(repo_id=bloom_repo, task="text-generation", model_kwargs=bloom_model_kwargs)
49
 
50
def split_text_into_chunks(text, chunk_size=800):
    """Greedily pack whole lines of *text* into chunks of roughly *chunk_size* characters.

    Lines are taken in order via str.splitlines(); each kept line gets a trailing
    '\n'. A chunk is flushed as soon as the next line would push it past
    chunk_size, so chunks may slightly exceed the limit by the added newlines.
    Always returns at least one (possibly empty) chunk.
    """
    pieces = []
    current = ""
    for row in text.splitlines():
        if len(current) + len(row) > chunk_size:
            # Current chunk is full: flush it and start a fresh one with this line.
            pieces.append(current)
            current = row + '\n'
        else:
            current += row + '\n'
    # Flush whatever is left over (may be "" when text had no lines).
    pieces.append(current)
    return pieces
65
 
66
  def translation(source, target, text):
@@ -70,7 +70,7 @@ def translation(source, target, text):
70
  try:
71
  input_prompt = bloom_template.replace("{source}", source)
72
  input_prompt = input_prompt.replace("{target}", target)
73
- input_prompt = input_prompt.replace("{query}", chunk.strip())
74
  stchunk = llm3(input_prompt)
75
  for eot in bloom_model_kwargs['stop']:
76
  stchunk = stchunk.replace(eot,"")
 
47
  llm2 = HuggingFaceHub(repo_id=starchat_repo, task="text-generation", model_kwargs=model_kwargs)
48
  llm3 = HuggingFaceHub(repo_id=bloom_repo, task="text-generation", model_kwargs=bloom_model_kwargs)
49
 
50
def split_text_into_chunks(text, chunk_size=1000):
    """Split *text* into chunks of at most *chunk_size* characters, on line boundaries.

    Lines (split on '\n') are packed greedily in order; each line keeps a
    trailing '\n' in its chunk. Fixes vs. the previous version:
    - the size check now counts the appended newline, so no chunk exceeds
      chunk_size (except a single line that is itself longer than chunk_size,
      which becomes its own oversized chunk — it cannot be split further here);
    - empty input returns [] instead of ["\n"];
    - empty intermediate chunks are never emitted.

    Returns a list of newline-terminated string chunks.
    """
    if not text:
        return []
    chunks = []
    chunk = ""
    for line in text.split('\n'):
        # +1 accounts for the '\n' appended below, keeping chunks <= chunk_size.
        if len(chunk) + len(line) + 1 <= chunk_size:
            chunk += line + '\n'
        else:
            # Line would overflow the current chunk: flush and start a new one.
            if chunk:
                chunks.append(chunk)
            chunk = line + '\n'
    # Flush the final chunk (non-empty here because text is non-empty).
    if chunk:
        chunks.append(chunk)
    return chunks
65
 
66
  def translation(source, target, text):
 
70
  try:
71
  input_prompt = bloom_template.replace("{source}", source)
72
  input_prompt = input_prompt.replace("{target}", target)
73
+ input_prompt = input_prompt.replace("{query}", chunk)
74
  stchunk = llm3(input_prompt)
75
  for eot in bloom_model_kwargs['stop']:
76
  stchunk = stchunk.replace(eot,"")