Python Data Science Practical Complete
Python Data Science Practical Complete
Question 1.a:
# Build one array per dimensionality from nested list literals, then
# display them in order of increasing rank.
array_1d = np.array([1, 2, 3, 4, 5])  # 5 elements
array_2d = np.array([
    [1, 2, 3],
    [4, 5, 6],
])  # 2 rows x 3 columns
array_3d = np.array([
    [[1, 2], [3, 4]],
    [[5, 6], [7, 8]],
])  # 2 blocks, each 2 x 2

print("1D Array:", array_1d)
print("2D Array:\n", array_2d)
print("3D Array:\n", array_3d)
# NumPy's built-in array constructors.
# The four names printed below were never assigned in this snippet, so the
# prints raised NameError. The assignments are restored here; the shapes and
# ranges are illustrative choices -- adjust them to the exercise's wording.
import numpy as np

zeros = np.zeros((2, 3))               # 2 x 3 array filled with 0.0
ones = np.ones((2, 3))                 # 2 x 3 array filled with 1.0
arange_array = np.arange(0, 10, 2)     # 0, 2, 4, 6, 8 (stop is exclusive)
linspace_array = np.linspace(0, 1, 5)  # 5 evenly spaced points, 0 to 1 inclusive

print("Zeros:\n", zeros)
print("Ones:\n", ones)
print("Arange:\n", arange_array)
print("Linspace:\n", linspace_array)
Python for Data Science Practical Codes
Question 1.b:
# Bivariate analysis: pairwise plots across the columns of `data`,
# coloured by the 'Outcome' column.
sns.pairplot(data=data, hue='Outcome')
plt.show()

# Logistic regression inputs: every column except 'Outcome' is a feature,
# and 'Outcome' itself is the target. (Model fitting is not part of this
# snippet.)
X = data.drop(columns='Outcome')
y = data['Outcome']
Question 2.a:
# Element-wise arithmetic on two equal-length vectors, spelled with the
# NumPy functions equivalent to the infix operators.
a = np.array([1, 2, 3])
b = np.array([4, 5, 6])

print("Addition:", np.add(a, b))
print("Subtraction:", np.subtract(a, b))
print("Multiplication:", np.multiply(a, b))
print("Division:", np.divide(a, b))  # true division: result is floating point
print("Power:", np.power(a, 2))
Python for Data Science Practical Codes
Question 2.b:
# Density plot: filled kernel-density curves of 'age', one per 'income' value.
sns.kdeplot(x='age', hue='income', fill=True, data=data)
# Title the current axes, i.e. the one the plot was just drawn on.
plt.gca().set_title('Density Plot of Age by Income')
plt.show()
Question 3.a:
Question 3.b:
Question 4.a:
# Column-oriented records: each key becomes a DataFrame column and each
# list supplies that column's values, one per row.
data = dict(
    Name=['Alice', 'Bob', 'Charlie'],
    Age=[25, 30, 35],
    City=['New York', 'Los Angeles', 'Chicago'],
)
df = pd.DataFrame.from_dict(data)  # default orient: dict keys are columns
print(df)
Python for Data Science Practical Codes
Question 4.b:
# Load the iris data and combine its feature matrix and labels in one frame.
# NOTE(review): load_iris is not imported in the visible part of this file --
# presumably sklearn.datasets.load_iris; confirm.
iris = load_iris()
df = pd.DataFrame(iris.data, columns=iris.feature_names).assign(
    target=iris.target,  # appended as the last column
)
Question 5.a:
Question 5.b:
# Summary statistics of `data`, followed by how often each 'Outcome'
# value occurs.
print(data.describe())
outcome_counts = data['Outcome'].value_counts()
print("\nOutcome Counts:\n", outcome_counts)
Python for Data Science Practical Codes
Question 6.a:
# Simple linear regression: fit 'Glucose' as a function of the single
# feature 'BMI', then report the fitted slope and intercept.
# NOTE(review): LinearRegression is not imported in the visible part of this
# file -- presumably sklearn.linear_model.LinearRegression; confirm.
X = data[['BMI']]    # list-of-columns selection (one column)
y = data['Glucose']
model = LinearRegression().fit(X, y)  # fit() returns the estimator itself
print("Coefficient:", model.coef_)
print("Intercept:", model.intercept_)
Python for Data Science Practical Codes
Question 6.b:
# 6.b Creation of different types of NumPy arrays and displaying basic information
import numpy as np
Question 7.a:
Question 7.b:
# 7.b Descriptive Analytics with Pandas on Iris Dataset (from path or web)
import pandas as pd
# NOTE(review): `df` is not loaded in this snippet and must contain a
# 'species' column -- confirm the dataset is read before this point.
summary_stats = df.describe()
print(summary_stats)
species_counts = df['species'].value_counts()  # rows per species label
print(species_counts)
Python for Data Science Practical Codes
Question 8.a:
# 3D scatter of three columns of `df`: age (x), hours-per-week (y) and
# education-num (z), drawn in red on a single 3D axes.
fig, ax = plt.subplots(subplot_kw={'projection': '3d'})
ax.scatter(df['age'], df['hours-per-week'], df['education-num'], c='red')
ax.set(xlabel='Age', ylabel='Hours per Week', zlabel='Education Num')
plt.show()
Python for Data Science Practical Codes
Question 8.b:
Question 9.a:
# Histogram of the 'age' column using 20 bins.
df['age'].hist(bins=20)
# Label the current axes in a single call.
plt.gca().set(title='Histogram of Age', xlabel='Age', ylabel='Frequency')
plt.show()
Python for Data Science Practical Codes
Question 9.b:
# Basic statistics on the integers 1..5 (arange's stop value is exclusive).
array = np.arange(1, 6)
print("Array:", array)
print("Squared:", np.square(array))
print("Mean:", array.mean())
print("Standard Deviation:", array.std())  # NumPy default: population std (ddof=0)
Python for Data Science Practical Codes
Question 10.a:
Question 10.b:
# Two more constructors: evenly spaced samples and a constant-filled array.
a = np.linspace(start=1, stop=10, num=5)  # 5 points from 1 to 10 inclusive
b = np.full(shape=(2, 2), fill_value=7)   # 2 x 2 array where every entry is 7
print("Linspace Array:", a)
print("Full Array:\n", b)
Python for Data Science Practical Codes
Question 11.a:
# Scatter plot of 'hours-per-week' against 'age' from `df`.
sns.scatterplot(x='age', y='hours-per-week', data=df)
# Title the current axes, i.e. the one the plot was just drawn on.
plt.gca().set_title("Scatter Plot: Age vs Hours-per-week")
plt.show()
Python for Data Science Practical Codes
Question 11.b: