Spaces:

Joshua1808
/

PaginaWeb

Runtime error

App Files Files Community

Joshua1808 committed on Feb 4, 2023

Commit

bb0de7f

1 Parent(s): d5291cb

Update app.py

Browse files

Files changed (1) hide show

app.py +60 -57

app.py CHANGED Viewed

@@ -80,95 +80,98 @@ with colT2:
     font-size:16px ; font-family: 'Times New Roman'; color: #3358ff;}
     </style> """, unsafe_allow_html=True)
 def analizar_tweets(search_words, number_of_tweets):
     """Classify a user's recent tweets and render the predictions as a table.

     Args:
         search_words: Screen name passed to ``api.user_timeline``.
         number_of_tweets: Value passed as ``count`` to the timeline request.

     Returns:
         The object returned by ``st.table`` for the rendered predictions
         (at most the first 30 rows are shown).
     """
     tweets = api.user_timeline(screen_name=search_words, tweet_mode="extended", count=number_of_tweets)
     # Preprocess with a plain comprehension: the former DataFrame round-trip
     # indexed column 0, which does not exist when the timeline is empty.
     textos = [preprocess(tweet.full_text) for tweet in tweets]
     result = []
     for texto in textos:
         # Texts that still start with 'RT' after preprocessing are skipped.
         if texto.startswith('RT'):
             continue
         for predic in pipeline_nlp(texto):
             result.append({'Tweets': texto, 'Prediccion': predic['label'], 'Probabilidad': predic['score']})
     # Explicit columns keep 'Prediccion' addressable even when nothing was
     # classified, so the relabelling below cannot raise KeyError.
     df = pd.DataFrame(result, columns=['Tweets', 'Prediccion', 'Probabilidad'])
     df['Prediccion'] = np.where(df['Prediccion'] == 'LABEL_1', 'Sexista', 'No Sexista')
     tabla = st.table(df.reset_index(drop=True).head(30).style.applymap(color_survived, subset=['Prediccion']))
     return tabla
def analizar_frase(frase):
    """Classify a single sentence and render the prediction(s) as a table.

    Args:
        frase: Text handed unchanged to ``pipeline_nlp``.

    Returns:
        The object returned by ``st.table`` for the rendered predictions.
    """
    # One row per prediction emitted by the pipeline.
    filas = []
    for salida in pipeline_nlp(frase):
        filas.append({
            'Texto': frase,
            'Prediccion': salida['label'],
            'Probabilidad': salida['score'],
        })
    marco = pd.DataFrame(filas)
    # 'LABEL_1' is displayed as 'Sexista'; any other label as 'No Sexista'.
    es_sexista = marco['Prediccion'] == 'LABEL_1'
    marco['Prediccion'] = np.where(es_sexista, 'Sexista', 'No Sexista')
    primeras = marco.reset_index(drop=True).head(30)
    con_estilo = primeras.style.applymap(color_survived, subset=['Prediccion'])
    return st.table(con_estilo)
 def tweets_localidad(buscar_localidad):
     """Show high-confidence 'Sexista' tweets found around a locality.

     The locality name is geocoded, tweets in Spanish within a 10 km radius
     are fetched and classified, and rows labelled 'Sexista' with a score
     above 0.8 are rendered as a table followed by a pie chart.

     Args:
         buscar_localidad: Free-text place name passed to the geocoder.

     Returns:
         A list holding the ``st.table`` element that was rendered; empty
         when the locality could not be resolved.
     """
     tabla = []
     geolocator = Nominatim(user_agent="nombre_del_usuario")
     location = geolocator.geocode(buscar_localidad)
     # Test the lookup result directly instead of catching AttributeError
     # around the whole body, which also hid unrelated attribute errors.
     # NOTE(review): presumably geocode yields None for unknown places.
     if location is None:
         st.text("No existe ninguna localidad con ese nombre")
         return tabla
     radius = "10km"
     tweets = api.search_tweets(q="", lang="es", geocode=f"{location.latitude},{location.longitude},{radius}", count=30, tweet_mode="extended")
     # A comprehension avoids indexing column 0 of an empty DataFrame when
     # the search returns nothing.
     textos = [preprocess_tweet(tweet.full_text) for tweet in tweets]
     result = []
     for texto in textos:
         # Skip retweets and texts left blank by preprocessing.
         if texto.startswith('RT') or not texto.strip():
             continue
         for predic in pipeline_nlp(texto):
             result.append({'Tweets': texto, 'Prediccion': predic['label'], 'Probabilidad': predic['score']})
     # Explicit columns keep the frame usable when no tweet was classified.
     df = pd.DataFrame(result, columns=['Tweets', 'Prediccion', 'Probabilidad'])
     df['Prediccion'] = np.where(df['Prediccion'] == 'LABEL_1', 'Sexista', 'No Sexista')
     # 'RT|@' is an alternation, so request regex matching explicitly rather
     # than relying on the library default.
     df['Tweets'] = df['Tweets'].str.replace('RT|@', '', regex=True)
     df = df[df["Prediccion"] == 'Sexista']
     df = df[df["Probabilidad"] > 0.8]
     muestra = st.table(df.reset_index(drop=True).head(30).style.applymap(color_survived, subset=['Prediccion']))
     tabla.append(muestra)
     if df.empty:
         # Nothing to plot; a pie chart of no data is meaningless.
         return tabla
     resultado = df.groupby('Prediccion')['Probabilidad'].sum()
     colores = ["#aae977", "#EE3555"]
     # Set font defaults before drawing so they apply to this chart.
     plt.rcParams.update({'font.size': 8, 'font.weight': 'bold'})
     fig, ax = plt.subplots(figsize=(4, 4))
     ax.pie(resultado, labels=resultado.index, autopct='%1.1f%%', colors=colores)
     ax.set_title("Porcentajes por Categorias", fontsize=8, fontweight="bold")
     ax.legend()
     # Hand the figure to Streamlit explicitly (no global pyplot state), then
     # close it so figures do not accumulate across calls.
     st.pyplot(fig)
     plt.close(fig)
     return tabla
 def run():
  with st.form("my_form"):
    col,buff1, buff2 = st.columns([2,2,1])

     font-size:16px ; font-family: 'Times New Roman'; color: #3358ff;}
     </style> """, unsafe_allow_html=True)
 def analizar_tweets(search_words, number_of_tweets):
     """Show a user's high-confidence 'Sexista' tweets as a table and chart.

     Retweets and blank tweets are skipped; the remaining texts are
     preprocessed and classified, and only rows labelled 'Sexista' with a
     score above 0.80 are kept.

     Args:
         search_words: Screen name passed to ``api.user_timeline``.
         number_of_tweets: Value passed as ``count`` to the timeline request.

     Returns:
         The object returned by ``st.table`` for the rendered predictions
         (at most the first 30 rows are shown).
     """
     tweets = api.user_timeline(screen_name=search_words, tweet_mode="extended", count=number_of_tweets)
     result = []
     for tweet in tweets:
         texto = tweet.full_text
         # Skip retweets and blank tweets before doing any model work.
         if texto.startswith('RT') or not texto.strip():
             continue
         datos = preprocess(texto)
         for predic in pipeline_nlp(datos):
             result.append({'Tweets': datos, 'Prediccion': predic['label'], 'Probabilidad': predic['score']})
     # Explicit columns keep 'Prediccion' addressable even when every tweet
     # was skipped, so the relabelling below cannot raise KeyError.
     df = pd.DataFrame(result, columns=['Tweets', 'Prediccion', 'Probabilidad'])
     df['Prediccion'] = np.where(df['Prediccion'] == 'LABEL_1', 'Sexista', 'No Sexista')
     df = df[df["Prediccion"] == 'Sexista']
     df = df[df["Probabilidad"] > 0.80]
     tabla = st.table(df.reset_index(drop=True).head(30).style.applymap(color_survived, subset=['Prediccion']))
     if df.empty:
         # Nothing to plot; a pie chart of no data is meaningless.
         return tabla
     resultado = df.groupby('Prediccion')['Probabilidad'].sum()
     colores = ["#aae977", "#EE3555"]
     # Set font defaults before drawing so they apply to this chart.
     plt.rcParams.update({'font.size': 8, 'font.weight': 'bold'})
     fig, ax = plt.subplots(figsize=(2, 2))
     ax.pie(resultado, labels=resultado.index, autopct='%1.1f%%', colors=colores)
     ax.set_title("Porcentajes por Categorias", fontsize=8, fontweight="bold")
     ax.legend()
     # Hand the figure to Streamlit explicitly (no global pyplot state), then
     # close it so figures do not accumulate across calls.
     st.pyplot(fig)
     plt.close(fig)
     return tabla
 def tweets_localidad(buscar_localidad):
     """Show high-confidence 'Sexista' tweets found around a locality.

     The locality name is geocoded, tweets in Spanish within a 10 km radius
     are fetched and classified, and rows labelled 'Sexista' with a score
     above 0.80 are rendered as a table (first 5 rows) and a pie chart.

     Args:
         buscar_localidad: Free-text place name passed to the geocoder.

     Returns:
         A list holding the Streamlit element that was rendered (the table,
         or the "nothing found" text); empty when the locality could not be
         resolved.
     """
     tabla = []
     geolocator = Nominatim(user_agent="nombre_del_usuario")
     location = geolocator.geocode(buscar_localidad)
     # Test the lookup result directly instead of catching AttributeError
     # around the whole body, which also hid unrelated attribute errors.
     # NOTE(review): presumably geocode yields None for unknown places.
     if location is None:
         st.text("No existe ninguna localidad con ese nombre")
         return tabla
     radius = "10km"
     tweets = api.search_tweets(q="", lang="es", geocode=f"{location.latitude},{location.longitude},{radius}", count=50, tweet_mode="extended")
     result = []
     for tweet in tweets:
         texto = tweet.full_text
         # The retweet test must call startswith('RT'); testing the bare
         # method object is always true and discarded every tweet.
         if texto.startswith('RT') or not texto.strip():
             continue
         datos = preprocess(texto)
         # Classify and record the preprocessed text (the former code used
         # an undefined name here).
         for predic in pipeline_nlp(datos):
             result.append({'Tweets': datos, 'Prediccion': predic['label'], 'Probabilidad': predic['score']})
     df = pd.DataFrame(result, columns=['Tweets', 'Prediccion', 'Probabilidad'])
     df['Prediccion'] = np.where(df['Prediccion'] == 'LABEL_1', 'Sexista', 'No Sexista')
     df = df[df["Prediccion"] == 'Sexista']
     df = df[df["Probabilidad"] > 0.80]
     # Check emptiness after filtering: tweets may have been classified
     # without any of them passing the 'Sexista' / score filters.
     if df.empty:
         # A plain message is text, not tabular data, so use st.text.
         muestra = st.text("No se encontraron tweets sexistas dentro de la localidad")
         tabla.append(muestra)
         return tabla
     muestra = st.table(df.reset_index(drop=True).head(5).style.applymap(color_survived, subset=['Prediccion']))
     tabla.append(muestra)
     resultado = df.groupby('Prediccion')['Probabilidad'].sum()
     colores = ["#aae977", "#EE3555"]
     # Set font defaults before drawing so they apply to this chart.
     plt.rcParams.update({'font.size': 8, 'font.weight': 'bold'})
     fig, ax = plt.subplots(figsize=(4, 4))
     ax.pie(resultado, labels=resultado.index, autopct='%1.1f%%', colors=colores)
     ax.set_title("Porcentajes por Categorias", fontsize=8, fontweight="bold")
     ax.legend()
     # Hand the figure to Streamlit explicitly (no global pyplot state), then
     # close it so figures do not accumulate across calls.
     st.pyplot(fig)
     plt.close(fig)
     return tabla
def analizar_frase(frase):
    """Classify a single sentence and render the prediction(s) as a table.

    Args:
        frase: Text handed unchanged to ``pipeline_nlp``.

    Returns:
        The object returned by ``st.table`` for the rendered predictions.
    """
    # One row per prediction emitted by the pipeline.
    filas = []
    for salida in pipeline_nlp(frase):
        filas.append({
            'Texto': frase,
            'Prediccion': salida['label'],
            'Probabilidad': salida['score'],
        })
    marco = pd.DataFrame(filas)
    # 'LABEL_1' is displayed as 'Sexista'; any other label as 'No Sexista'.
    es_sexista = marco['Prediccion'] == 'LABEL_1'
    marco['Prediccion'] = np.where(es_sexista, 'Sexista', 'No Sexista')
    primeras = marco.reset_index(drop=True).head(5)
    con_estilo = primeras.style.applymap(color_survived, subset=['Prediccion'])
    return st.table(con_estilo)
 def run():
  with st.form("my_form"):
    col,buff1, buff2 = st.columns([2,2,1])