0% found this document useful (0 votes)

4 views3 pages

f12

The document outlines a customer preference analysis focusing on the relationship between cuisine types and restaurant ratings. It includes steps to analyze average ratings, popularity based on votes, and the percentage of high-rated restaurants for various cuisines, along with visualizations for better understanding. The analysis aims to identify top cuisines by rating, votes, and high rating percentages while exploring the relationship between popularity and ratings.

Uploaded by

sambhaviasingh

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

4 views3 pages

f12

Uploaded by

sambhaviasingh

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

You are on page 1/ 3

# LEVEL 3 - TASK 2: CUSTOMER PREFERENCE ANALYSIS
print("LEVEL 3 - TASK 2: CUSTOMER PREFERENCE ANALYSIS")
print("============================================")

# 1. Analyze the relationship between the type of cuisine and the restaurant's
#    rating.
#
# The 'Cuisines' column holds a comma-separated list per restaurant, so build
# a long-form frame with one row per (restaurant, cuisine) pair. Each row
# carries that restaurant's 'Aggregate rating' (as 'Rating') and 'Votes'.
# Restaurants whose 'Cuisines' value is missing are skipped.
#
# This reads `df_processed`, which must already be defined earlier in the
# script and provide the 'Cuisines', 'Aggregate rating' and 'Votes' columns.
cuisine_df = (
    df_processed.loc[
        df_processed['Cuisines'].notna(),
        ['Cuisines', 'Aggregate rating', 'Votes'],
    ]
    .rename(columns={'Cuisines': 'Cuisine', 'Aggregate rating': 'Rating'})
    # Turn "A, B" into ['A', ' B'] so explode() can emit one row per cuisine.
    .assign(Cuisine=lambda frame: frame['Cuisine'].str.split(','))
    .explode('Cuisine')
    # explode() repeats the source index label for every emitted row; use a
    # fresh 0..n-1 index so the frame looks like one built row by row.
    .reset_index(drop=True)
    # Drop the padding around each name left over from ", " separators.
    .assign(Cuisine=lambda frame: frame['Cuisine'].str.strip())
)

# Calculate, for each cuisine: the average rating, the total number of votes
# and the number of rows (restaurants listing that cuisine).
# Named aggregation yields the final column names directly; 'size' counts the
# rows in each group, so there is no need to aggregate the grouping column and
# rename it afterwards.
cuisine_ratings = (
    cuisine_df.groupby('Cuisine')
    .agg(
        Rating=('Rating', 'mean'),
        Votes=('Votes', 'sum'),
        Count=('Rating', 'size'),
    )
    .reset_index()
)

# Filter cuisines with at least 10 restaurants so that an average based on a
# handful of restaurants cannot top the ranking, then rank by average rating.
cuisine_ratings_filtered = cuisine_ratings[
    cuisine_ratings['Count'] >= 10
].sort_values('Rating', ascending=False)

print("\nTop 20 Cuisines by Average Rating (min 10 restaurants):")
print(cuisine_ratings_filtered.head(20))

# Visualize top cuisines by rating (horizontal bars, best-rated first).
# NOTE(review): seaborn >= 0.13 emits a FutureWarning when `palette` is passed
# without `hue` -- confirm against the seaborn version this project pins.
plt.figure(figsize=(14, 10))
sns.barplot(
    x='Rating',
    y='Cuisine',
    data=cuisine_ratings_filtered.head(20),
    palette='viridis',
)
plt.title('Top 20 Cuisines by Average Rating', fontsize=16)
plt.xlabel('Average Rating', fontsize=14)
plt.ylabel('Cuisine', fontsize=14)
plt.xticks(fontsize=12)
plt.yticks(fontsize=12)
plt.grid(axis='x', alpha=0.3)
plt.tight_layout()
plt.show()

# 2. Identify the most popular cuisines among customers based on the number of
#    votes.
# Popularity here is the total vote count summed over every restaurant that
# lists the cuisine; no minimum-restaurant filter is applied to this ranking.
cuisine_popularity = cuisine_ratings.sort_values('Votes', ascending=False)

print("\nTop 20 Most Popular Cuisines by Total Votes:")
print(cuisine_popularity.head(20))

# Visualize top cuisines by votes
plt.figure(figsize=(14, 10))
sns.barplot(
    x='Votes',
    y='Cuisine',
    data=cuisine_popularity.head(20),
    palette='viridis',
)
plt.title('Top 20 Most Popular Cuisines by Total Votes', fontsize=16)
plt.xlabel('Total Votes', fontsize=14)
plt.ylabel('Cuisine', fontsize=14)
plt.xticks(fontsize=12)
plt.yticks(fontsize=12)
plt.grid(axis='x', alpha=0.3)
plt.tight_layout()
plt.show()

# Calculate average votes per restaurant for each cuisine.
# Dividing the summed votes by the restaurant count gives a per-restaurant
# figure, so a cuisine does not rank high merely because many restaurants
# serve it. Note that this adds a column to `cuisine_ratings` in place.
cuisine_ratings['Avg_Votes_Per_Restaurant'] = (
    cuisine_ratings['Votes'] / cuisine_ratings['Count']
)

# Keep cuisines with at least 10 restaurants and rank by the new column.
cuisine_avg_votes = cuisine_ratings[
    cuisine_ratings['Count'] >= 10
].sort_values('Avg_Votes_Per_Restaurant', ascending=False)

print("\nTop 20 Cuisines by Average Votes per Restaurant (min 10 restaurants):")
print(cuisine_avg_votes.head(20))

# Visualize top cuisines by average votes per restaurant
plt.figure(figsize=(14, 10))
sns.barplot(
    x='Avg_Votes_Per_Restaurant',
    y='Cuisine',
    data=cuisine_avg_votes.head(20),
    palette='viridis',
)
plt.title('Top 20 Cuisines by Average Votes per Restaurant', fontsize=16)
plt.xlabel('Average Votes per Restaurant', fontsize=14)
plt.ylabel('Cuisine', fontsize=14)
plt.xticks(fontsize=12)
plt.yticks(fontsize=12)
plt.grid(axis='x', alpha=0.3)
plt.tight_layout()
plt.show()

# 3. Determine if there are any specific cuisines that tend to receive higher
#    ratings.
# Calculate the percentage of high-rated restaurants (4.0+ stars) for each
# cuisine.
high_rating_threshold = 4.0

# Boolean flag per (restaurant, cuisine) row; adds a column to `cuisine_df`.
cuisine_df['Is_High_Rating'] = cuisine_df['Rating'] >= high_rating_threshold

# Summing the boolean flag counts the high-rated rows, while counting it gives
# the number of rows in the group. Named aggregation assigns the final column
# names directly instead of overwriting MultiIndex columns by position.
cuisine_high_ratings = cuisine_df.groupby('Cuisine').agg(
    High_Rating_Count=('Is_High_Rating', 'sum'),
    Total_Count=('Is_High_Rating', 'count'),
    Avg_Rating=('Rating', 'mean'),
)

cuisine_high_ratings['High_Rating_Percentage'] = (
    cuisine_high_ratings['High_Rating_Count']
    / cuisine_high_ratings['Total_Count']
) * 100
cuisine_high_ratings = cuisine_high_ratings.reset_index()

# Filter cuisines with at least 10 restaurants, then rank by the share of
# high-rated restaurants.
cuisine_high_ratings_filtered = cuisine_high_ratings[
    cuisine_high_ratings['Total_Count'] >= 10
].sort_values('High_Rating_Percentage', ascending=False)

print(
    f"\nTop 20 Cuisines by Percentage of High Ratings "
    f"({high_rating_threshold}+ stars, min 10 restaurants):"
)
print(cuisine_high_ratings_filtered.head(20))

# Visualize top cuisines by percentage of high ratings
plt.figure(figsize=(14, 10))
sns.barplot(
    x='High_Rating_Percentage',
    y='Cuisine',
    data=cuisine_high_ratings_filtered.head(20),
    palette='viridis',
)
plt.title(
    f'Top 20 Cuisines by Percentage of High Ratings '
    f'({high_rating_threshold}+ stars)',
    fontsize=16,
)
plt.xlabel('Percentage of High-Rated Restaurants', fontsize=14)
plt.ylabel('Cuisine', fontsize=14)
plt.xticks(fontsize=12)
plt.yticks(fontsize=12)
plt.grid(axis='x', alpha=0.3)
plt.tight_layout()
plt.show()

# Create a scatter plot to visualize the relationship between popularity and
# rating. Each point is one cuisine with at least 10 restaurants: x is its
# total votes, y its average rating, and the marker size scales with the
# number of restaurants serving it.
plt.figure(figsize=(14, 10))
sns.scatterplot(
    x='Votes',
    y='Rating',
    size='Count',
    sizes=(50, 500),
    alpha=0.7,
    data=cuisine_ratings[cuisine_ratings['Count'] >= 10],
)

# Annotate some interesting points: the ten best-rated cuisines among those
# with at least 50 restaurants. The stricter threshold keeps the labels on
# well-represented cuisines; every labelled cuisine is also a plotted point,
# because 50 >= 10.
label_candidates = (
    cuisine_ratings[cuisine_ratings['Count'] >= 50]
    .sort_values('Rating', ascending=False)
    .head(10)
)
for _, row in label_candidates.iterrows():
    plt.annotate(
        row['Cuisine'],
        xy=(row['Votes'], row['Rating']),
        xytext=(5, 0),  # nudge the label 5 points to the right of the marker
        textcoords='offset points',
        fontsize=10,
    )

plt.title('Relationship Between Cuisine Popularity and Rating', fontsize=16)
plt.xlabel('Total Votes (Popularity)', fontsize=14)
plt.ylabel('Average Rating', fontsize=14)
plt.xticks(fontsize=12)
plt.yticks(fontsize=12)
plt.grid(alpha=0.3)
plt.tight_layout()
plt.show()

Foodhub Project Full Code .HTML
88% (8)
Foodhub Project Full Code .HTML
30 pages
Zomato Restaurant Clustering & Sentiment Analysis - Ipynb - Colaboratory
No ratings yet
Zomato Restaurant Clustering & Sentiment Analysis - Ipynb - Colaboratory
27 pages
Pandas
No ratings yet
Pandas
43 pages
Capstone Project Final Report
No ratings yet
Capstone Project Final Report
13 pages
Erikson Identity Youth and Crisis PDF
0% (2)
Erikson Identity Youth and Crisis PDF
2 pages
Connectivity Service PDF
0% (1)
Connectivity Service PDF
368 pages
Zomoto Data analysis using python
No ratings yet
Zomoto Data analysis using python
10 pages
f14
No ratings yet
f14
3 pages
Zomoto Data Analysis Using Python_1
No ratings yet
Zomoto Data Analysis Using Python_1
10 pages
f13
No ratings yet
f13
3 pages
Zomato Data Analysis Presentation
No ratings yet
Zomato Data Analysis Presentation
16 pages
Final Project Report DA
No ratings yet
Final Project Report DA
3 pages
EDA Zomato 1681401606
No ratings yet
EDA Zomato 1681401606
15 pages
f7
No ratings yet
f7
2 pages
f9
No ratings yet
f9
2 pages
Food Recommendation System
No ratings yet
Food Recommendation System
13 pages
Zomato Data Analysis (1) (1)
No ratings yet
Zomato Data Analysis (1) (1)
11 pages
RESTAURANT RECOMMANDATION SYSTEM(1)
No ratings yet
RESTAURANT RECOMMANDATION SYSTEM(1)
15 pages
f10
No ratings yet
f10
3 pages
DA - Project 1
No ratings yet
DA - Project 1
12 pages
Data report
No ratings yet
Data report
7 pages
PANDAS_LEC_2
No ratings yet
PANDAS_LEC_2
21 pages
Zomato Rating Prediction
No ratings yet
Zomato Rating Prediction
11 pages
Understanding Indian Cuisine: A Data-Driven Study
No ratings yet
Understanding Indian Cuisine: A Data-Driven Study
15 pages
Zomato Data Aanalysis Using Machine Learning Algorithms
No ratings yet
Zomato Data Aanalysis Using Machine Learning Algorithms
7 pages
Project Template Notebook Ipynb 1
No ratings yet
Project Template Notebook Ipynb 1
23 pages
Restaurants Rating Prediction Using Machine Learning Algorithms
No ratings yet
Restaurants Rating Prediction Using Machine Learning Algorithms
4 pages
Restaurants Rating Prediction Using Machine Learning Algorithms
No ratings yet
Restaurants Rating Prediction Using Machine Learning Algorithms
4 pages
Project Presentation
No ratings yet
Project Presentation
34 pages
PYF_Project_LearnerNotebook_LowCode
No ratings yet
PYF_Project_LearnerNotebook_LowCode
6 pages
Task 1 - Data preparation and customer analytics - Jupyter Notebook
No ratings yet
Task 1 - Data preparation and customer analytics - Jupyter Notebook
64 pages
Zomato Problem Statement
No ratings yet
Zomato Problem Statement
2 pages
DWM Project
No ratings yet
DWM Project
16 pages
Project Report1
No ratings yet
Project Report1
9 pages
Finalproj Aml
No ratings yet
Finalproj Aml
69 pages
Tasks
No ratings yet
Tasks
2 pages
Zomato Ishani Abhi
No ratings yet
Zomato Ishani Abhi
33 pages
Swiggy Food Restaurant Analysis Using SQL: BY Akhilesh Maurya
No ratings yet
Swiggy Food Restaurant Analysis Using SQL: BY Akhilesh Maurya
12 pages
BCD3002 Business Intelligence and Analytics
No ratings yet
BCD3002 Business Intelligence and Analytics
5 pages
上海餐饮情况分析
No ratings yet
上海餐饮情况分析
17 pages
Yelp Vs Zomato Analysis
No ratings yet
Yelp Vs Zomato Analysis
8 pages
The Location Recommendation To New Restaurants: Foursquare API
No ratings yet
The Location Recommendation To New Restaurants: Foursquare API
4 pages
Introduction To Text Mining
No ratings yet
Introduction To Text Mining
54 pages
Project Detailed Review
No ratings yet
Project Detailed Review
9 pages
Data Mining Capstone Project Report
No ratings yet
Data Mining Capstone Project Report
15 pages
Restaurant Performance Analysis for Burgerville USA
No ratings yet
Restaurant Performance Analysis for Burgerville USA
3 pages
Data Visualization 2
No ratings yet
Data Visualization 2
12 pages
Swiggy_project_ppt
No ratings yet
Swiggy_project_ppt
13 pages
The Location Recommendatio Ntonew Restaurants: Eva Li
No ratings yet
The Location Recommendatio Ntonew Restaurants: Eva Li
9 pages
FINAL_PROJECT
No ratings yet
FINAL_PROJECT
17 pages
food_hub_businees_report
No ratings yet
food_hub_businees_report
15 pages
Exercise#9 Instructions 2021
No ratings yet
Exercise#9 Instructions 2021
5 pages
Evaluation of Customer Ratings On Restaurant by Clustering Techniques Using R
No ratings yet
Evaluation of Customer Ratings On Restaurant by Clustering Techniques Using R
8 pages
Report-Converted Sip
No ratings yet
Report-Converted Sip
14 pages
f5
No ratings yet
f5
2 pages
Swiggy Analysis Using MYSQL Report
No ratings yet
Swiggy Analysis Using MYSQL Report
5 pages
lab6_67c1438e2e100fc6064332edf210c414
No ratings yet
lab6_67c1438e2e100fc6064332edf210c414
3 pages
SMDM Guided Project Ashish
No ratings yet
SMDM Guided Project Ashish
25 pages
Restaurant Case Study PDF
No ratings yet
Restaurant Case Study PDF
6 pages
PHYTON
No ratings yet
PHYTON
7 pages
Documentation Final
No ratings yet
Documentation Final
53 pages
How to Start a Catering Business
From Everand
How to Start a Catering Business
J.H. Dies
No ratings yet
Rockwell Hardness Testing
No ratings yet
Rockwell Hardness Testing
5 pages
Silva Miranda Diana Irina Act11
No ratings yet
Silva Miranda Diana Irina Act11
8 pages
Madhurya Alankaar (RJ Maddy)
No ratings yet
Madhurya Alankaar (RJ Maddy)
3 pages
PLSQL
No ratings yet
PLSQL
131 pages
CentOS 5 QmailToaster Install
No ratings yet
CentOS 5 QmailToaster Install
15 pages
Students' Orientation
100% (1)
Students' Orientation
123 pages
[FREE PDF sample] Presence Volume II The Intimacy of All Experience Rupert Spira ebooks
100% (2)
[FREE PDF sample] Presence Volume II The Intimacy of All Experience Rupert Spira ebooks
47 pages
GRasd
No ratings yet
GRasd
11 pages
Seismic Acquisition
100% (1)
Seismic Acquisition
88 pages
Amandaresume
No ratings yet
Amandaresume
1 page
Kernels Cover Letter
No ratings yet
Kernels Cover Letter
1 page
Shubham Agnihotri - Random Motors Project
No ratings yet
Shubham Agnihotri - Random Motors Project
11 pages
Angle of Deppression and Elevation
No ratings yet
Angle of Deppression and Elevation
2 pages
MNL Still No Flying Cars The Future Promises Something Better Adv
No ratings yet
MNL Still No Flying Cars The Future Promises Something Better Adv
5 pages
Ic6601 C0HBB0000057 Eveke2f3524b
No ratings yet
Ic6601 C0HBB0000057 Eveke2f3524b
1 page
Higgs (2005)
No ratings yet
Higgs (2005)
6 pages
Element of Landscape: Natural (Earth Form, Water, Vegetation), Manmade
100% (3)
Element of Landscape: Natural (Earth Form, Water, Vegetation), Manmade
55 pages
Legendre Polynomials
No ratings yet
Legendre Polynomials
8 pages
DEMO LESSON PLAN IN SCIENCE 6
No ratings yet
DEMO LESSON PLAN IN SCIENCE 6
11 pages
Untitled
No ratings yet
Untitled
2 pages
Struktur Organisasi Stasiun
No ratings yet
Struktur Organisasi Stasiun
5 pages
Ed Unit 1
100% (1)
Ed Unit 1
25 pages
UDS Protocol Implementation in Automotiv PDF
No ratings yet
UDS Protocol Implementation in Automotiv PDF
6 pages
HIPAA Basics
100% (5)
HIPAA Basics
38 pages
Stressors and Coping Mechanisms
No ratings yet
Stressors and Coping Mechanisms
1 page
Reflection English 2010
No ratings yet
Reflection English 2010
2 pages
Bio-Engineering Erosion Control in Nepal
No ratings yet
Bio-Engineering Erosion Control in Nepal
7 pages
FRFFRR
No ratings yet
FRFFRR
1 page

f12

Uploaded by

f12

Uploaded by

# LEVEL 3 - TASK 2: CUSTOMER PREFERENCE ANALYSIS

print("LEVEL 3 - TASK 2: CUSTOMER PREFERENCE ANALYSIS")

for _, row in df_processed.iterrows():

cuisines = [cuisine.strip() for cuisine in row['Cuisines'].split(',')]

for cuisine in cuisines:

# Calculate average rating for each cuisine

# Filter cuisines with at least 10 restaurants

print("\nTop 20 Cuisines by Average Rating (min 10 restaurants):")

# Visualize top cuisines by rating

print("\nTop 20 Most Popular Cuisines by Total Votes:")

# Calculate average votes per restaurant for each cuisine

print("\nTop 20 Cuisines by Average Votes per Restaurant (min 10 restaurants):")

# Visualize top cuisines by average votes per restaurant

cuisine_df['Is_High_Rating'] = cuisine_df['Rating'] >= high_rating_threshold

cuisine_high_ratings.columns = ['High_Rating_Count', 'Total_Count', 'Avg_Rating']

# Filter cuisines with at least 10 restaurants

print(f"\nTop 20 Cuisines by Percentage of High Ratings ({high_rating_threshold}+

# Visualize top cuisines by percentage of high ratings

# Annotate some interesting points

plt.title('Relationship Between Cuisine Popularity and Rating', fontsize=16)

You might also like