Spaces: Running on Zero
Update app.py
app.py CHANGED
@@ -15,6 +15,8 @@ tokenizer = None
 
 @spaces.GPU(duration=60, enable_queue=True)
 def predict(title, abstract):
+    title = title.replace("\n", " ").strip()
+    abstract = abstract.replace("\n", " ").strip()
     global model, tokenizer
     if model is None:
         model = AutoModelForSequenceClassification.from_pretrained(
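The two lines added to predict() normalize pasted input before it is tokenized: titles and abstracts copied out of PDFs typically carry hard line breaks, and space-based splitting treats "\n" as part of a token rather than as a separator. A quick illustration in plain Python (not part of app.py):

# Effect of the added normalization on text pasted with hard line breaks.
title = "A Study of\nCitation Dynamics"
print(title.split(' '))
# ['A', 'Study', 'of\nCitation', 'Dynamics']  -> 4 tokens, two words glued together
print(title.replace("\n", " ").strip().split(' '))
# ['A', 'Study', 'of', 'Citation', 'Dynamics']  -> 5 clean tokens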
@@ -86,13 +88,10 @@ examples = [
 ]
 
 def validate_input(title, abstract):
-    """Validate whether the input meets the requirements."""
-
-    # Blacklist: block non-Latin characters
     non_latin_pattern = re.compile(r'[^\u0000-\u007F]')
-    if len(title.split(' '))<3:
+    if len(title.strip().split(' '))<3:
         return False, "The title must be at least 3 words long."
-    if len(abstract.split(' ')) < 50:
+    if len(abstract.strip().split(' ')) < 50:
         return False, "The abstract must be at least 50 words long."
     if len((title + abstract).split(' '))>1024:
         return True, "Warning, The input length is approaching tokenization limits (1024) and may be truncated without further warning!"
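The change to validate_input() adds .strip() before splitting. Without it, a stray leading or trailing space becomes an empty token when splitting on ' ', which silently inflates the word count used by the minimum-length checks. A minimal demonstration (plain Python, not from the app):

# Empty tokens from stray whitespace inflate the space-split word count.
print(" A Title".split(' '))            # ['', 'A', 'Title'] -> length 3, passes the 3-word check
print(" A Title".strip().split(' '))    # ['A', 'Title']     -> length 2, correctly rejected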
@@ -104,7 +103,7 @@ def validate_input(title, abstract):
     return True, "Inputs are valid! Good to go!"
 
 def update_button_status(title, abstract):
-
+
     valid, message = validate_input(title, abstract)
     if not valid:
         return gr.update(value="Error: " + message), gr.update(interactive=False)
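update_button_status() returns two gr.update() objects, so it is meant to drive two components: a status display and the predict button's interactivity. This hunk does not show how the function is wired into the UI; the sketch below is one plausible wiring, where the component names (title_input, abstract_input, status_box, predict_btn) are hypothetical and update_button_status from app.py is assumed to be in scope.

import gradio as gr

# Assumes update_button_status(title, abstract) from app.py is importable or already defined.
with gr.Blocks() as demo:
    title_input = gr.Textbox(label="Title")
    abstract_input = gr.Textbox(label="Abstract", lines=10)
    status_box = gr.Textbox(label="Status", interactive=False)
    predict_btn = gr.Button("Predict", interactive=False)

    # Re-validate on every edit; the two returned gr.update() values map onto
    # (status_box, predict_btn) in order.
    for box in (title_input, abstract_input):
        box.change(
            update_button_status,
            inputs=[title_input, abstract_input],
            outputs=[status_box, predict_btn],
        )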
@@ -116,6 +115,7 @@ with gr.Blocks() as iface:
     # 🧠 Predict Academic Impact of Newly Published Paper!
     ### Estimate the future academic impact of a paper using LLM
     [Read the full paper](https://arxiv.org/abs/2408.03934)
+    Please note that due to the characteristics of ZeroGPU, quantized models cannot be preloaded. Each time you click "Predict," the model will need to be reinitialized, which may take additional time (usually less than 20s).
     """)
     with gr.Row():
         with gr.Column():
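The new note in the header explains the cold-start cost: on ZeroGPU the GPU is only attached while a @spaces.GPU-decorated call runs, so a quantized model cannot sit preloaded in memory and is rebuilt on demand. A minimal sketch of that pattern follows; the checkpoint id, the 8-bit quantization config, and the way title and abstract are combined are all assumptions, since the actual from_pretrained() arguments are truncated in this diff.

import spaces
import torch
from transformers import (AutoModelForSequenceClassification, AutoTokenizer,
                          BitsAndBytesConfig)

model, tokenizer = None, None

@spaces.GPU(duration=60)
def predict(title, abstract):
    """Lazily (re)build the quantized model inside the GPU-attached call."""
    global model, tokenizer
    if model is None:  # first click of a session pays the load cost the note warns about
        name = "some-org/impact-predictor"  # hypothetical checkpoint id
        model = AutoModelForSequenceClassification.from_pretrained(
            name,
            quantization_config=BitsAndBytesConfig(load_in_8bit=True),  # assumed quantization
            device_map="auto",
        )
        tokenizer = AutoTokenizer.from_pretrained(name)
    inputs = tokenizer(title + " " + abstract, return_tensors="pt",
                       truncation=True, max_length=1024).to(model.device)
    with torch.no_grad():
        logits = model(**inputs).logits
    return logits.squeeze().item()  # assumes a single regression-style output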