Spaces:

Kuautli
/

ProyectoDS-AnalizaTube

Runtime error

App Files Community

Kuautli committed on Jan 28

Commit

97e7318

verified ·

1 Parent(s): 0b29bd8

Update app.py

Browse files

Files changed (1) hide show

app.py +9 -7

app.py CHANGED Viewed

@@ -34,21 +34,23 @@ def index():
     sentiment_count = None
     current_directory = os.getcwd()
-    print("Directorio de trabajo actual:", current_directory)
     if request.method == "POST":
         url = request.form["url"]
         if url:
             video_details = clustering.get_youtube_video_details(url, api_key)
             comments_df = clustering.get_youtube_comments(api_key, url)
             comments_df = clustering.add_normalized_embeddings_to_dataframe(
                 comments_df, "comment"
             )
             comments_df["published_at"] = pd.to_datetime(
                 comments_df["published_at"]
             ).dt.date
             comments_df = clustering.classify_sentiment_df(comments_df)
             comments_df.to_pickle(
                 "./data/Comentarios-Youtube/comments_df.pkl"
@@ -64,14 +66,14 @@ def index():
             umap_df, min_eps, max_eps = clustering.transform_embeddings(
                 comments_df, embeddings_col="embeddings"
             )
             image_path = os.path.join("static", "wordcloud.png")
             clustering.plot_wordcloud(comments_df, text_column="comment", output_filename=image_path)
             total = comments_df.shape[0]
             min_items_by_cluster = clustering.determine_min_items_by_cluster(total)
             (
                 cluster_assignments,
                 cluster_counts,
@@ -84,7 +86,7 @@ def index():
                 threshold_values=[0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9],
                 embeddings_col="embeddings"
             )
             labels, source, target, values, comments = clustering.build_sankey_data(
                 cluster_assignments,
                 cluster_counts,

     sentiment_count = None
     current_directory = os.getcwd()
+    print("Iniciando procesamiento...")
     if request.method == "POST":
         url = request.form["url"]
         if url:
+            print("Obteniendo datos")
             video_details = clustering.get_youtube_video_details(url, api_key)
             comments_df = clustering.get_youtube_comments(api_key, url)
+            print("Generando embeddings")
             comments_df = clustering.add_normalized_embeddings_to_dataframe(
                 comments_df, "comment"
             )
+            print("Procesamiento de los datos")
             comments_df["published_at"] = pd.to_datetime(
                 comments_df["published_at"]
             ).dt.date
+            print("Clasificación de los sentimientos")
             comments_df = clustering.classify_sentiment_df(comments_df)
             comments_df.to_pickle(
                 "./data/Comentarios-Youtube/comments_df.pkl"
             umap_df, min_eps, max_eps = clustering.transform_embeddings(
                 comments_df, embeddings_col="embeddings"
             )
+            print("Generación de wordcloud")
             image_path = os.path.join("static", "wordcloud.png")
             clustering.plot_wordcloud(comments_df, text_column="comment", output_filename=image_path)
             total = comments_df.shape[0]
+            print("Evaluación de métricas")
             min_items_by_cluster = clustering.determine_min_items_by_cluster(total)
+            print("Modelado")
             (
                 cluster_assignments,
                 cluster_counts,
                 threshold_values=[0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9],
                 embeddings_col="embeddings"
             )
+            print("Creación de gráfico de Sankey")
             labels, source, target, values, comments = clustering.build_sankey_data(
                 cluster_assignments,
                 cluster_counts,