Spaces:

shrey-14
/

text-summarizer

Sleeping

App Files Files Community

shrey-14 committed on Jul 27, 2024

Commit

a274d7c

verified ·

1 Parent(s): 242eda4

Final commit

Browse files

Files changed (4) hide show

app.py +82 -0
rouge_scores.csv +5 -0
summaries_results.csv +0 -0
text-summarization.ipynb +0 -0

app.py ADDED Viewed

	@@ -0,0 +1,82 @@

import re

import gradio as gr
from transformers import AutoModelForSeq2SeqLM, AutoTokenizer, pipeline

# Identifier passed to from_pretrained() for both the model and its tokenizer.
# NOTE(review): presumably a checkpoint directory shipped next to this
# script -- confirm against the deployment layout.
model_link = "text_summary_model"

# Load the weights and tokenizer once at import time so that every request
# reuses the same objects.
model = AutoModelForSeq2SeqLM.from_pretrained(model_link)
tokenizer = AutoTokenizer.from_pretrained(model_link)
pipe = pipeline(task='summarization', model=model, tokenizer=tokenizer)

# Generation settings that dummy_summarize() forwards to the pipeline.
gen_kwargs = dict(length_penalty=0.8, num_beams=8, min_length=30)
def dummy_summarize(text):
    """Summarize *text* with the module-level summarization pipeline.

    The input is normalized with ``clean_text`` before it is handed to
    ``pipe``. Input that is ``None``, empty, or whitespace-only -- or that
    becomes empty after cleaning -- yields an empty string without calling
    the model, since ``gen_kwargs`` requests a minimum output length and
    there is nothing meaningful to summarize.

    Args:
        text: Raw text entered by the user.

    Returns:
        The generated summary, or ``""`` when there is nothing to summarize.
    """
    # Cheap guard first: avoids touching the model for blank submissions.
    if not text or not text.strip():
        return ""
    text = clean_text(text)
    # Cleaning strips non-ASCII characters, so the text may now be empty.
    if not text:
        return ""
    return pipe(text, **gen_kwargs)[0]['summary_text']
def clean_text(text):
    """Normalize raw input into single-spaced, printable ASCII text.

    Steps, in order:

    1. Drop byte order marks.
    2. Collapse every run of whitespace (newlines, carriage returns, tabs,
       form feeds, non-breaking spaces, ...) into one space. This happens
       *before* control characters are stripped so that words separated
       only by a tab or similar character are not glued together.
    3. Remove backslashes.
    4. Remove everything outside printable ASCII (non-ASCII characters and
       control characters).
    5. Collapse whitespace again, because the removals above can leave
       doubled spaces behind.

    Args:
        text: The string to clean.

    Returns:
        The cleaned string with no leading or trailing whitespace.
    """
    # Remove Byte Order Marks (BOM)
    text = text.replace('\ufeff', '')
    # Turn all whitespace into single spaces while it is still recognisable
    text = ' '.join(text.split())
    # Remove backslashes
    text = text.replace('\\', '')
    # Remove non-ASCII and non-printable characters in one pass
    text = re.sub(r'[^\x20-\x7E]', '', text)
    # Normalize whitespace left over from the removals
    return ' '.join(text.split())
# Heading and tagline markup; passed to the interface as its description.
title_html = """
<h1 style="font-size: 40px; text-align: center; color: white;">Text Summarization</h1>
<p style="text-align: center; color: white; font-size:20px">Enter text to summarize it using a pretrained model.</p>
"""

# Stylesheet for the page: blue background with white text, and darker blue
# text boxes and buttons outlined in white.
css = """
body {
    background-color: #007BFF;
    color: white;
}
.gr-textbox textarea {
    background-color: #0056b3;
    color: white;
    border: 2px solid white;
}
.gr-button {
    background-color: #0056b3;
    color: white;
    border: 2px solid white;
}
.gr-button:hover {
    background-color: #004080;
}
.gr-textbox input {
    background-color: #0056b3;
    color: white;
    border: 2px solid white;
}
"""
# Tall multi-line widgets: one for the source text, one for the summary.
input_box = gr.Textbox(lines=15, placeholder="Enter text here...")
output_box = gr.Textbox(lines=15, placeholder="Summary will appear here...")

# Single-input / single-output UI around the summarizer function.
interface = gr.Interface(
    fn=dummy_summarize,
    inputs=input_box,
    outputs=output_box,
    description=title_html,
    theme="compact",  # compact theme, chosen to reduce padding
    css=css,
)

# Start serving the app.
interface.launch()

rouge_scores.csv ADDED Viewed

	@@ -0,0 +1,5 @@

+metric,score
+rouge1,"Score(precision=0.5240761726639174, recall=0.5164609406411964, fmeasure=0.48813699709755287)"
+rouge2,"Score(precision=0.2750003463132431, recall=0.26328277298441694, fmeasure=0.2498681871552253)"
+rougeL,"Score(precision=0.4338563417029981, recall=0.42507261340158575, fmeasure=0.40241707690768413)"
+rougeLsum,"Score(precision=0.4330077769824946, recall=0.42511422355384887, fmeasure=0.4021251370419605)"

summaries_results.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

text-summarization.ipynb ADDED Viewed

The diff for this file is too large to render. See raw diff