Spaces:

Faisalaldwaish1
/

Sentiment-Analysis-of-Restaurant-Reviews

Sleeping

App Files Files Community

Faisalaldwaish1 committed on Sep 11, 2024

Commit

248d873

verified ·

1 Parent(s): 38f87e8

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -32

app.py CHANGED Viewed

@@ -8,89 +8,72 @@ from fuzzywuzzy import fuzz
 # Load the data
 reviews_df = pd.read_csv('Restaurant_reviews.csv')
-# Load the sentiment classification model from Hugging Face (distilbert-base-uncased-finetuned-sst-2-english)
 sentiment_model = pipeline("sentiment-analysis", model="distilbert-base-uncased-finetuned-sst-2-english")
-# Function to classify the review based on the rating or using the Hugging Face model
 def classify_review(user_review):
     try:
-        # Check that the input contains text
         if not user_review.strip():
             return "Please enter a valid review."
-        # Search for the review in the dataset using fuzzy matching
         best_match = None
         best_score = 0
-        # Iterate over every review in the dataset
         for _, row in reviews_df.iterrows():
-            # Make sure the review column holds text and not a missing value
             if pd.isna(row['Review']):
                 continue
-            # Compute the match score between the user's review and the dataset review
             score = fuzz.token_sort_ratio(user_review.lower(), str(row['Review']).lower())
             if score > best_score:
                 best_score = score
                 best_match = row
-        # If a review with a good match was found
-        if best_score > 80:  # use an 80% threshold to make sure the match is accurate
             rating = best_match['Rating']
-            # Classify the review based on the rating
-            if int(rating) >= 4:
-                rating_based_classification = f"Positive review based on rating: {rating}"
-            else:
-                rating_based_classification = f"Negative review based on rating: {rating}"
-            # Analyze the review using the Hugging Face model
             sentiment_result = sentiment_model(user_review)[0]
             sentiment = sentiment_result['label']
             confidence = sentiment_result['score']
             sentiment_based_classification = f"Model prediction: {sentiment} with confidence: {confidence:.2f}"
-            # Return the results
             return f"{rating_based_classification}\n{sentiment_based_classification}\nMatching Score: {best_score}%"
         else:
             return "Review not found in the dataset."
     except Exception as e:
-        # Return the error text to give more information about the failure
         return f"An error occurred: {str(e)}"
 # Function to plot the rating distribution
 def plot_rating_distribution():
     plt.figure(figsize=(8, 6))
-    sns.countplot(x='Rating', data=reviews_df, order=[1, 2, 3, 4, 5])  # order the ratings ascending
     plt.title('Distribution of Ratings')
     plt.xlabel('Rating')
     plt.ylabel('Count')
     plt.tight_layout()
     return plt.gcf()
-# Create a Gradio interface for classifying reviews
-interface = gr.Interface(
     fn=classify_review,
     inputs=gr.Textbox(lines=2, placeholder="Enter your review here", label="Reviews"),
     outputs="text",
     title="Review Classifier Based on Rating and Hugging Face Model",
-    description="Enter a restaurant review. The system will classify it based on the dataset rating and use a sentiment analysis model if found. If not found, it will notify you."
 )
-# Create a Gradio interface for the charts
-plot_interface_ratings = gr.Interface(
     fn=plot_rating_distribution,
     inputs=[],
     outputs="plot",
     title="Rating Distribution",
     description="Shows the distribution of ratings in the dataset."
 )
-# Launch the interfaces
-interface.launch()
-plot_interface_ratings.launch()

 # Load the data
 # The CSV is read once at module import, from a path relative to the working directory.
 reviews_df = pd.read_csv('Restaurant_reviews.csv')
+# Load the sentiment classification model
 # The pipeline is built once here and reused by classify_review on every request.
 sentiment_model = pipeline("sentiment-analysis", model="distilbert-base-uncased-finetuned-sst-2-english")
+# Function to classify the review
 # Takes the user's review text and always returns one display string:
 #   - a prompt to enter a review when the input is empty or whitespace-only,
 #   - the rating-based label, the model prediction and the match score when a
 #     dataset review matches closely enough,
 #   - "Review not found in the dataset." otherwise,
 #   - "An error occurred: ..." if anything inside raises.
 def classify_review(user_review):
     try:
         # Reject empty or whitespace-only input before doing any matching.
         if not user_review.strip():
             return "Please enter a valid review."
         # Linear scan over every dataset row, keeping the row whose review text
         # has the highest token_sort_ratio against the user's text. Both sides
         # are lower-cased first; on ties the earliest row wins (strict ">").
         best_match = None
         best_score = 0
         for _, row in reviews_df.iterrows():
             # Skip rows whose Review cell is missing.
             if pd.isna(row['Review']):
                 continue
             score = fuzz.token_sort_ratio(user_review.lower(), str(row['Review']).lower())
             if score > best_score:
                 best_score = score
                 best_match = row
         # Only a match scoring strictly above 80 counts as "found".
+        if best_score > 80:
             rating = best_match['Rating']
             # Ratings of 4 or more are labelled positive, anything lower negative.
             # NOTE(review): int(rating) raises if the Rating cell is not
             # int-convertible; the broad except below turns that into the
             # "An error occurred" string - confirm the column is clean.
+            rating_based_classification = f"Positive review based on rating: {rating}" if int(rating) >= 4 else f"Negative review based on rating: {rating}"
             # The model is run on the user's own text, not on the matched dataset review.
             sentiment_result = sentiment_model(user_review)[0]
             sentiment = sentiment_result['label']
             confidence = sentiment_result['score']
             sentiment_based_classification = f"Model prediction: {sentiment} with confidence: {confidence:.2f}"
             return f"{rating_based_classification}\n{sentiment_based_classification}\nMatching Score: {best_score}%"
         else:
             return "Review not found in the dataset."
     except Exception as e:
         # Failures are reported back as text instead of being raised to the caller.
         return f"An error occurred: {str(e)}"
 # Function to plot the rating distribution
 # Draws a count plot of the 'Rating' column of reviews_df and returns the figure.
 def plot_rating_distribution():
     # A new figure is created on every call.
     # NOTE(review): the figure is not closed in this function - confirm the
     # caller releases it, otherwise figures may accumulate across calls.
     plt.figure(figsize=(8, 6))
     # The category order is fixed to 1..5 regardless of which ratings occur.
+    sns.countplot(x='Rating', data=reviews_df, order=[1, 2, 3, 4, 5])
     plt.title('Distribution of Ratings')
     plt.xlabel('Rating')
     plt.ylabel('Count')
     plt.tight_layout()
     # Return the current figure, i.e. the one created above.
     return plt.gcf()
+# Create the Gradio interfaces
 # Text-in / text-out interface wrapping classify_review.
+review_interface = gr.Interface(
     fn=classify_review,
     inputs=gr.Textbox(lines=2, placeholder="Enter your review here", label="Reviews"),
     outputs="text",
     title="Review Classifier Based on Rating and Hugging Face Model",
+    description="Enter a restaurant review. The system will classify it based on the dataset rating and use a sentiment analysis model."
 )
 # No-input interface that renders the figure returned by plot_rating_distribution.
+plot_interface = gr.Interface(
     fn=plot_rating_distribution,
     inputs=[],
     outputs="plot",
     title="Rating Distribution",
     description="Shows the distribution of ratings in the dataset."
 )
+# Combine the two interfaces using tabs
+tabbed_interface = gr.TabbedInterface([review_interface, plot_interface], ["Review Classifier", "Rating Distribution"])
+# Launch the interfaces
 # A single launch() call serves both tabs.
+tabbed_interface.launch()