Spaces:

mabzak
/

Youtube-Comment-Sentimen-Analisis

Runtime error

App Files Community

mabzak committed on Nov 1, 2023

Commit

251ffe3

•

1 Parent(s): 5a8fbe1

Update app.py

Browse files

Files changed (1) hide show

app.py +19 -7

app.py CHANGED Viewed

@@ -17,7 +17,7 @@ tokenizer = AutoTokenizer.from_pretrained(pretrained)
 sentiment_analysis = pipeline("sentiment-analysis", model=model, tokenizer=tokenizer)
 label_index = {'LABEL_0': 'positive', 'LABEL_1': 'neutral', 'LABEL_2': 'negative'}
-st.title("Youtube Comment Sentimen Analisis Indonesia")
 st.write("Program ini akan menganalisis komentar dalam sebuah video di youtube menggunakan sentiment analysis, tidak termasuk komentar dalam komentar dan khusus untuk komentar bahasa indonesia")
 # Input URL video
@@ -34,6 +34,8 @@ def analisis_sentimen(text):
     return label, score
 if st.button("Mulai Analisis"):
     # Inisialisasi YoutubeCommentDownloader
     downloader = YoutubeCommentDownloader()
@@ -63,22 +65,32 @@ if st.button("Mulai Analisis"):
     st.info("Memulai analisis sentimen....")
     # List untuk menyimpan hasil analisis sentimen
-    hasil_analisis = []
     # Membaca data dari file CSV
     with open('comments.csv', mode='r', encoding='utf-8') as file:
         reader = csv.DictReader(file)
         for row in tqdm(reader):
             comment_text = row['text']
-            label, score = analisis_sentimen(comment_text)
-            hasil_analisis.append((comment_text, label, score))
     # Menampilkan hasil analisis sentimen
     st.subheader("Hasil Analisis Sentimen")
-    #st.write(hasil_analisis)
     # Menampilkan histogram
-    labels, scores = zip(*[(label, score) for _, label, score in hasil_analisis])
     plt.hist(labels, bins=30, color='blue', alpha=0.7, edgecolor='black')
     plt.xlabel('Skor Sentimen')
     plt.ylabel('Jumlah Komentar')

 sentiment_analysis = pipeline("sentiment-analysis", model=model, tokenizer=tokenizer)
 label_index = {'LABEL_0': 'positive', 'LABEL_1': 'neutral', 'LABEL_2': 'negative'}
+st.title("Indonesia Youtube Comment Sentiment Analysis")
 st.write("Program ini akan menganalisis komentar dalam sebuah video di youtube menggunakan sentiment analysis, tidak termasuk komentar dalam komentar dan khusus untuk komentar bahasa indonesia")
 # Input URL video
     return label, score
 if st.button("Mulai Analisis"):
+    #Memulai Download Komentar
+    st.info("Memulai Download Komentar....")
     # Inisialisasi YoutubeCommentDownloader
     downloader = YoutubeCommentDownloader()
     st.info("Memulai analisis sentimen....")
     # List untuk menyimpan hasil analisis sentimen
+    scores = []
+    labels = []
+    # hasil_analisis = []
     # Membaca data dari file CSV
     with open('comments.csv', mode='r', encoding='utf-8') as file:
         reader = csv.DictReader(file)
         for row in tqdm(reader):
             comment_text = row['text']
+            # Split the text into chunks of at most 512 characters (character slices, not tokenizer tokens)
+            parts = [comment_text[i:i+512] for i in range(0, len(comment_text), 512)]
+            for part in parts:
+                # Analisis sentimen
+                result = sentiment_analysis(part)
+                label = label_index[result[0]['label']]
+                score = result[0]['score'] * 100
+                labels.append(label)
+                scores.append(score)
+                # hasil_analisis.append((comment_text, label, score))
     # Menampilkan hasil analisis sentimen
     st.subheader("Hasil Analisis Sentimen")
+    # st.write(hasil_analisis)
     # Menampilkan histogram
+    # labels, scores = zip(*[(label, score) for _, label, score in hasil_analisis])
     plt.hist(labels, bins=30, color='blue', alpha=0.7, edgecolor='black')
     plt.xlabel('Skor Sentimen')
     plt.ylabel('Jumlah Komentar')