Machine learning Lab Assignment 1
Machine learning Lab Assignment 1
1. Linear Regression
Code:
# Import required libraries
import pandas as pd
import numpy as np
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_absolute_error, mean_squared_error, r2_score
from sklearn.preprocessing import LabelEncoder, StandardScaler

# Load dataset
data = pd.read_csv('dataset.csv')

# NOTE(review): this section ends after loading the data. The preprocessing,
# training, and evaluation steps suggested by the imports above are not
# present here -- confirm against the original lab sheet.
Input:
Output:
2. Logistic Regression
Code:
import numpy as np
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import accuracy_score, confusion_matrix

# Read the dataset using pandas (replace 'studyhours.csv' with your actual
# file path).
data = pd.read_csv('studyhours.csv')
print(data)

# The target column is 'status'; all other columns are used as features.
X = data.drop(columns=['status'])  # Drop the target column to get features
y = data['status']  # Target variable

# Split the data into training (60%) and testing (40%) sets. The fixed
# random_state keeps the split the same from run to run.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.4, random_state=20
)

# Initialize the Logistic Regression model with its default settings
model = LogisticRegression()

# Train the model
model.fit(X_train, y_train)

# Make predictions on the test data
y_pred = model.predict(X_test)

# Evaluate the model
accuracy = accuracy_score(y_test, y_pred)
conf_matrix = confusion_matrix(y_test, y_pred)

# Print results
print("Accuracy.", accuracy)
print("Confusion Matrix.")
print(conf_matrix)
Dataset:
Input:
Output:
3. Random Forest Classification
Code:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import (
    accuracy_score,
    confusion_matrix,
    classification_report,
)
from sklearn.preprocessing import LabelEncoder

# Load the Titanic dataset
file_path = 'titanic.csv'  # Replace with your Titanic dataset file path
data = pd.read_csv(file_path)

# Display the first few rows of the dataset
print("Dataset Preview:")
print(data.head())

# Drop columns not relevant for the model. errors='ignore' skips any of these
# columns that are absent from the CSV instead of raising.
data = data.drop(
    ['PassengerId', 'Name', 'Ticket', 'Cabin'], axis=1, errors='ignore'
)

# Fill missing values. The result is assigned back to the column rather than
# calling fillna(..., inplace=True) on the selected column: that chained
# in-place form is deprecated in pandas and does not update `data` when
# Copy-on-Write is enabled.
data['Age'] = data['Age'].fillna(data['Age'].median())
data['Embarked'] = data['Embarked'].fillna(data['Embarked'].mode()[0])

# NOTE(review): the steps that should sit here are missing from this section:
# encoding the categorical columns, building X / y, splitting into train and
# test sets, fitting the RandomForestClassifier, and computing `accuracy`,
# `conf_matrix`, and `class_report`. None of `model`, `X_test`, `accuracy`,
# `conf_matrix`, or `class_report` is assigned anywhere in this section, so
# the code below cannot produce random-forest results until those steps are
# restored -- confirm against the original lab sheet.

# Make predictions
y_pred = model.predict(X_test)

# Display results
print("\nModel Evaluation:")
print(f"Accuracy: {accuracy:.2f}")
print("\nConfusion Matrix:")
print(conf_matrix)
print("\nClassification Report:")
print(class_report)
Dataset:
Input:
Output:
4. Decision Tree (ID3)
Code:
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
from sklearn.tree import DecisionTreeClassifier, plot_tree
from sklearn.preprocessing import LabelEncoder
from sklearn.model_selection import train_test_split
Output: