Spaces:

Hafizhzpa
/

Indonesian_News_Analytic

Build error

Hafizhzpa committed on Aug 4, 2024

Commit

aecb12d

verified ·

1 Parent(s): 6bab979

add status

Files changed (1) hide show

app.py CHANGED Viewed

@@ -13,7 +13,7 @@ class NewsAnalytic():
         self.model = T5ForZeroShotClassification.from_pretrained('knowledgator/comprehend_it-multilingual-t5-base')
         self.tokenizer = T5Tokenizer.from_pretrained('knowledgator/comprehend_it-multilingual-t5-base')
         self.classifier = ZeroShotClassificationPipeline(model=self.model, tokenizer=self.tokenizer,ypothesis_template = '{}', encoder_decoder = True)
-        nltk.download('punkt')
     def anoted_sentence(self,content,candidate_labels):
         sentences = nltk.sent_tokenize(content)
         sentences = [sent for sent in sentences if "simak" not in sent.lower()]
@@ -24,6 +24,7 @@ class NewsAnalytic():
         else:
             summary_result="neutral"
         pair_result=[(res['sequence'],res['labels'][0]) if res['labels'][0]!="neutral" else res['sequence'] for res in result]
         return pair_result, summary_result
     def get_news_content(self,url):
         response = requests.get(url)
@@ -40,7 +41,7 @@ class NewsAnalytic():
         paragraphs = soup.find_all('p')
         content = ' '.join([p.get_text() for p in paragraphs])
         content = ' '.join([text for text in content.split("\n") if len(text)>100])
         return {'title': title.strip(), 'content': content.strip()}
     def streamlit_run(self):
         st.markdown("<h2 style='text-align: center;'>Indonesian News Analytic </h2>", unsafe_allow_html=True)

         self.model = T5ForZeroShotClassification.from_pretrained('knowledgator/comprehend_it-multilingual-t5-base')
         self.tokenizer = T5Tokenizer.from_pretrained('knowledgator/comprehend_it-multilingual-t5-base')
         self.classifier = ZeroShotClassificationPipeline(model=self.model, tokenizer=self.tokenizer,ypothesis_template = '{}', encoder_decoder = True)
+        print("load model berhasil!")
     def anoted_sentence(self,content,candidate_labels):
         sentences = nltk.sent_tokenize(content)
         sentences = [sent for sent in sentences if "simak" not in sent.lower()]
         else:
             summary_result="neutral"
         pair_result=[(res['sequence'],res['labels'][0]) if res['labels'][0]!="neutral" else res['sequence'] for res in result]
+        print("sentiment per sentence berhasil!")
         return pair_result, summary_result
     def get_news_content(self,url):
         response = requests.get(url)
         paragraphs = soup.find_all('p')
         content = ' '.join([p.get_text() for p in paragraphs])
         content = ' '.join([text for text in content.split("\n") if len(text)>100])
+        print("mendapatkan konten berita berhasil!")
         return {'title': title.strip(), 'content': content.strip()}
     def streamlit_run(self):
         st.markdown("<h2 style='text-align: center;'>Indonesian News Analytic </h2>", unsafe_allow_html=True)