
Dev Lab Practicals

Ques 1.
import numpy as np

# Part A
print("=== Part A ===")
arr_A = np.arange(50, 100, 5).reshape(5, 2)
print("Original 5x2 Array:\n", arr_A)

reshaped_arr_A = arr_A.reshape(10, 1)
print("Reshaped 10x1 Array:\n", reshaped_arr_A)

# Part B
print("\n=== Part B ===")
arr_B = np.random.randint(1, 101, size=30)
print("Random Array:\n", arr_B)

min_val = np.min(arr_B)
max_val = np.max(arr_B)
mean_val = np.mean(arr_B)
median_val = np.median(arr_B)
std_dev = np.std(arr_B)
unique_vals, counts = np.unique(arr_B, return_counts=True)
most_frequent = unique_vals[np.argmax(counts)]

print(f"Min: {min_val}")
print(f"Max: {max_val}")
print(f"Mean: {mean_val}")
print(f"Median: {median_val}")
print(f"Standard Deviation: {std_dev}")
print(f"Number of Unique Values: {len(unique_vals)}")
unique_counts = {int(k): int(v) for k, v in zip(unique_vals, counts)}
print(f"Count of Unique Values: {unique_counts}")
print(f"Most Frequent Value: {most_frequent}")

# Part C
print("\n=== Part C ===")
identity_matrix = np.identity(5) * 5
print("5x5 Identity Matrix with Diagonal = 5:\n",
identity_matrix)

# Part D
print("\n=== Part D ===")

# a.
heights = np.array([165, 170, 175, 168, 172, 180, 160, 169, 176, 171,
                    174, 182, 158, 167, 173, 179, 163, 166, 177, 181])
weights = np.array([60, 65, 70, 75, 80, 85, 55, 58, 63, 68,
                    72, 77, 50, 62, 67, 74, 52, 57, 69, 73])

# b.
combined = np.column_stack((heights, weights))
print("Combined Array (20x2):\n", combined)

# c.
mean_height = np.mean(heights)
mean_weight = np.mean(weights)
print(f"Mean Height: {mean_height}")
print(f"Mean Weight: {mean_weight}")

# d.
shortest_idx = np.argmin(heights)
tallest_idx = np.argmax(heights)
print(f"Index of Shortest Individual: {shortest_idx}")
print(f"Index of Tallest Individual: {tallest_idx}")

# e.
sorted_by_height = combined[combined[:, 0].argsort()]
print("Sorted by Height:\n", sorted_by_height)

# f.
swapped = combined[:, ::-1]
print("Swapped Columns (Weight, Height):\n",
swapped)

# g.
below_70 = combined[combined[:, 1] < 70]
print("Individuals with Weight < 70kg:\n", below_70)

Ques 2.
import pandas as pd
import seaborn as sns

print("=== Penguins Dataset Analysis ===")

# A.
df = sns.load_dataset("penguins")

# B.
num_rows, num_cols = df.shape
print(f"\nNumber of Observations (Rows):
{num_rows}")
print(f"Number of Attributes (Columns): {num_cols}")

# C.
print("\nAttribute Names:", df.columns.tolist())
print(f"Row Index starts at {df.index.start} and ends at
{df.index.stop - 1}")
'''We could also use:
df.index.tolist() --> returns every index value, which gets too long to print.
df.index --> works, but the raw RangeIndex repr is harder to read.
'''

print("\nData Types of Each Attribute:\n", df.dtypes)

# D.
print("\nFirst 5 Records:\n", df.head())
print("\nLast 5 Records:\n", df.tail())

# E.
second_col = df.columns[1]
values_3rd_4th = df.iloc[[2, 3], 1]
print(f"\nValues in 2nd Column ({second_col}) for 3rd &
4th records:\n", values_3rd_4th)

# F.
print("\nSummary of Data Distribution:\n",
df.describe(include="all"))

# G.
print("\nPairwise Correlation:\n",
df.corr(numeric_only=True))
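
One caveat worth knowing: the penguins dataset ships with a few missing values, and describe() and corr() silently skip them. A quick check (not part of the original question) makes that visible:

# How many values are missing per column (penguins has a handful of NaNs)
print("\nMissing Values per Attribute:\n", df.isnull().sum())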

Ques 3.
import seaborn as sns
import pandas as pd

#A
df = sns.load_dataset('titanic')

#B.
Dup_count = df.duplicated().sum()
print(f"Total duplicate values : {Dup_count}")
New_df = df.drop_duplicates()
print(f'Records before removing duplicates : {df.shape}')
print(f'Records after removing duplicates : {New_df.shape}')
Miss_count = df.isnull().sum()
print(f"Total missing values : \n {Miss_count}")
New_df1 = New_df.dropna()
print(f'Records after removing missing values : {New_df1.shape}\n')
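
dropna() removes a large share of rows here, mostly because titanic's 'deck' column is largely missing. If keeping rows mattered, one common alternative (a sketch, not what the exercise asks for) drops only the sparse column and imputes age:

# Alternative to dropna(): drop the mostly-empty 'deck' column and fill missing ages
New_df2 = New_df.drop(columns=['deck'])
New_df2['age'] = New_df2['age'].fillna(New_df2['age'].median())
print(f'Records after imputation instead of dropping : {New_df2.shape}')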

#C.
df_C1 = df.loc[df['survived'] == 1]
print(f'Total Number of passengers who survived : {len(df_C1)}')

df_C2 = df.loc[df['survived'] == 0]
print(f'Total Number of passengers who did not survive : {len(df_C2)} \n')

#D.
df_D = df.loc[df['age'] < 18]
print(f'Passengers with age under 18 : {len(df_D)} \n')

#E.
print("Average age of Passengers from each Class : ")
df_E = df.groupby('pclass')['age'].mean()
print(df_E)
print()

#F.
print("New DataFrame inluding Famaily Size : ")
df['Family Size'] = df['sibsp'] + df['parch'] + 1
print(df)

#G.
print(f"Correlation b/w age and fare : {df['age'].corr(df['fare'])} \n")

#H.
print("Contingency table : ")
DataTab = pd.crosstab(df['class'], df['survived'])
print(DataTab)
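
The raw contingency table shows counts; normalizing by row turns it into survival rates per class, which is often the more readable view (an optional extension to Part H):

# Optional: survival rate per class (each row sums to 1)
print(pd.crosstab(df['class'], df['survived'], normalize='index'))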

Ques 4.
import pandas as pd
import seaborn as sns
import matplotlib.pyplot as plt
from sklearn.datasets import load_iris

iris = load_iris()
df = pd.DataFrame(data=iris.data, columns=iris.feature_names)
df['species'] = iris.target
df['species'] = df['species'].map(dict(zip(range(3), iris.target_names)))

# A.
plt.figure(figsize=(8, 6))
sns.scatterplot(data=df, x='petal length (cm)', y='petal width (cm)',
                hue='species', palette='Set2')
plt.title("Petal Length vs Petal Width")
plt.xlabel("Petal Length (cm)")
plt.ylabel("Petal Width (cm)")
plt.legend(title='Species')
plt.grid(True)
plt.tight_layout()
plt.show()

# B.
df.drop('species', axis=1).hist(bins=15, figsize=(10, 6),
                                edgecolor='black', color='skyblue')
plt.suptitle("Histograms of Iris Features", fontsize=14)
plt.tight_layout()
plt.show()

# C.
species_counts = df['species'].value_counts()
plt.figure(figsize=(6, 6))
plt.pie(species_counts, labels=species_counts.index, autopct='%1.1f%%',
        startangle=140, colors=['#66c2a5', '#fc8d62', '#8da0cb'])
plt.title("Distribution of Iris Species")
plt.axis('equal')
plt.tight_layout()
plt.show()

# D.
sns.pairplot(df, hue='species', palette='husl', diag_kind='hist')
plt.suptitle("Pair Plot of Iris Dataset", y=1.02)
plt.show()
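
A small detail on Part D: sns.pairplot builds its own figure and returns a PairGrid, so titling through the returned grid is slightly more explicit than plt.suptitle on the current figure (both work here):

# Equivalent, using the PairGrid that pairplot returns
g = sns.pairplot(df, hue='species', palette='husl', diag_kind='hist')
g.fig.suptitle("Pair Plot of Iris Dataset", y=1.02)
plt.show()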

Ques 5.
import pandas as pd
import plotly.express as px
from sklearn.datasets import load_iris

iris = load_iris()
df = pd.DataFrame(data=iris.data, columns=iris.feature_names)
df['species'] = iris.target
df['species'] = df['species'].map(dict(zip(range(3), iris.target_names)))

# A.
fig_scatter = px.scatter(
    df,
    x='petal length (cm)',
    y='petal width (cm)',
    color='species',
    title='Petal Length vs Petal Width (Iris Dataset)',
    labels={'petal length (cm)': 'Petal Length (cm)',
            'petal width (cm)': 'Petal Width (cm)'},
    symbol='species'
)
fig_scatter.show()

# C.
fig_pie = px.pie(
    df,
    names='species',
    title='Distribution of Iris Species',
    color_discrete_sequence=px.colors.qualitative.Set3
)
fig_pie.update_traces(textposition='inside', textinfo='percent+label')
fig_pie.show()
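
Ques 5 jumps from Part A to Part C; assuming the missing Part B mirrors Ques 4's Part B (feature histograms), a minimal Plotly sketch might look like this (an assumption, since the original Part B is absent):

# Assumed Part B: histogram of one feature, split by species
fig_hist = px.histogram(
    df,
    x='petal length (cm)',
    color='species',
    nbins=15,
    title='Histogram of Petal Length (Iris Dataset)'
)
fig_hist.show()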
