ahmadluay committed on
Commit
4d91248
•
1 Parent(s): 1ed79ac

update dataset now 50000 data,model,eda add more analysis

Browse files
best_model.h5 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d8856473cb9906cc5a5c1ebb2292e5b7b39b0a3b6e79f14f208a8d735909a996
3
- size 78004048
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f619954d49dfbaf511d493e8da74073896a5f10142fb52f2bf5fb61669946cbb
3
+ size 77868880
dataset_20000_rows.csv → dataset_50000_rows.csv RENAMED
The diff for this file is too large to render. See raw diff
 
eda.py CHANGED
@@ -35,7 +35,7 @@ def run():
35
  st.write('Dataset used is amazon review dataset from [kaggle]("https://www.kaggle.com/datasets/yacharki/amazon-reviews-for-sa-binary-negative-positive-csv").')
36
 
37
  # show dataframe
38
- df2 = pd.read_csv('dataset_20000_rows.csv')
39
  df2 = df2.drop(['Unnamed: 0'],axis=1)
40
  st.dataframe(df2)
41
  # add description of Dataset
@@ -57,7 +57,7 @@ def run():
57
  fig = px.pie(review,values='class_index', names='index',color_discrete_sequence=['red','blue'])
58
  fig.update_layout(title_text = "Type of Review")
59
  st.plotly_chart(fig)
60
- st.write('Based on the table and visualization above, it can be seen that both negative and positive reviews consist of 10,000 reviews each.')
61
  elif select_eda == 'Example of Positive and Negative Review':
62
  # Print sample reviews
63
  pd.set_option('display.width', None)
@@ -77,6 +77,10 @@ def run():
77
  for i in range(0,20):
78
  st.write(sample_positive_review.iloc[i,2])
79
  st.write('-'*100)
 
 
 
 
80
 
81
  elif select_eda == 'Number of Words':
82
  # Count the number of words in each review
 
35
  st.write('Dataset used is amazon review dataset from [kaggle]("https://www.kaggle.com/datasets/yacharki/amazon-reviews-for-sa-binary-negative-positive-csv").')
36
 
37
  # show dataframe
38
+ df2 = pd.read_csv('dataset_50000_rows.csv')
39
  df2 = df2.drop(['Unnamed: 0'],axis=1)
40
  st.dataframe(df2)
41
  # add description of Dataset
 
57
  fig = px.pie(review,values='class_index', names='index',color_discrete_sequence=['red','blue'])
58
  fig.update_layout(title_text = "Type of Review")
59
  st.plotly_chart(fig)
60
+ st.write('Based on the table and visualization above, it can be seen that both negative and positive reviews consist of 25,000 reviews each.')
61
  elif select_eda == 'Example of Positive and Negative Review':
62
  # Print sample reviews
63
  pd.set_option('display.width', None)
 
77
  for i in range(0,20):
78
  st.write(sample_positive_review.iloc[i,2])
79
  st.write('-'*100)
80
+ st.write('Based on the examples of various reviews above, what distinguishes between positive reviews and negative reviews :')
81
+ st.write('1. **Positive reviews** generally express satisfaction with a product, service, or experience, highlighting the positive aspects and benefits that were experienced. They often use positive language and may include specific examples of what the reviewer liked about the product or service. They may also mention the quality, value for money, or ease of use.')
82
+ st.write('2. **Negative reviews**, on the other hand, typically express dissatisfaction or disappointment with a product, service, or experience. They often highlight specific problems or issues that the reviewer experienced, such as poor quality, bad customer service, or difficulty using the product. Negative reviews may use negative language and may also include suggestions for how the product or service could be improved.')
83
+ st.write('Overall, the key difference between positive and negative reviews is the attitude of the reviewer and their overall satisfaction with the product or service. Positive reviews reflect a positive experience, while negative reviews reflect a negative experience.')
84
 
85
  elif select_eda == 'Number of Words':
86
  # Count the number of words in each review
t.pickle CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:81511b93c63c33d81015ede057cb169ca619cc49c3c8a83cbe8e5b78c651a9af
3
- size 2066705
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:942c8fa939686e4632a7964cc2a9e222db65c203a0eaed24032a6a6438751426
3
+ size 2062767