AI Assignment-6

The document contains multiple Python scripts that demonstrate various machine learning techniques using libraries like pandas and scikit-learn. It includes generating synthetic datasets, training models such as K-Nearest Neighbors, Naive Bayes, and Decision Trees, and evaluating their performance with metrics like accuracy and F1 score. Additionally, it shows how to save datasets and results to CSV files for further analysis.


Q1

import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import StandardScaler
from sklearn.neighbors import KNeighborsRegressor

# Step 1: Generate synthetic dataset


data = {
'Experience': [5, 8, 3, 10, 2, 7],
'Written_Score': [8, 7, 6, 9, 5, 8],
'Interview_Score': [10, 6, 7, 8, 9, 5],
'Salary': [60000, 80000, 45000, 90000, 35000, 75000]
}

df = pd.DataFrame(data)

# Step 2: Save dataset to a .csv file


df.to_csv('candidates_dataset.csv', index=False)

# Step 3: Load dataset


df = pd.read_csv('candidates_dataset.csv')

# Step 4: Split dataset into features and target


X = df.drop('Salary', axis=1)
y = df['Salary']

# Step 5: Split dataset into training and testing sets


X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Step 6: Standardize features (recommended for distance-based models like KNN)


scaler = StandardScaler()
X_train_scaled = scaler.fit_transform(X_train)
X_test_scaled = scaler.transform(X_test)

# Step 7: Build KNN model


knn_model = KNeighborsRegressor(n_neighbors=3)  # Specify the value of K
# Step 8: Train the model
knn_model.fit(X_train_scaled, y_train)

# Step 9: Make predictions on the testing set


y_pred = knn_model.predict(X_test_scaled)

# Step 10: Use the trained model to predict salaries for new candidates
new_candidates = pd.DataFrame({
'Experience': [5, 8],
'Written_Score': [8, 7],
'Interview_Score': [10, 6]
})

# Standardize the new candidate data


new_candidates_scaled = scaler.transform(new_candidates)

# Predict salaries for new candidates


predicted_salaries = knn_model.predict(new_candidates_scaled)
print("Predicted salaries for new candidates:")
for i, salary in enumerate(predicted_salaries):
    print(f"Candidate {i+1}: ${salary:.2f}")
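Q1 makes test-set predictions in Step 9 but never scores them. Below is a minimal evaluation sketch; it assumes it is appended to the Q1 script, so y_test and y_pred are already in scope (the test set here holds only two rows, so the numbers are illustrative rather than reliable).

from sklearn.metrics import mean_absolute_error, mean_squared_error

# Score the held-out predictions from Step 9 (y_test and y_pred come from
# the Q1 script above).
mae = mean_absolute_error(y_test, y_pred)
mse = mean_squared_error(y_test, y_pred)
print(f"Test MAE: {mae:.2f}")
print(f"Test MSE: {mse:.2f}")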

Q2
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.naive_bayes import GaussianNB
from sklearn.metrics import accuracy_score, precision_score, recall_score, f1_score

# Create dataset
data = {
'Graduation_Percentage': [80, 85, 70, 75, 90, 95, 85, 88, 92, 78,
83, 87, 79, 84, 91, 86, 93, 89, 76, 81, 74, 77, 82, 88, 94],
'Experience': [5, 8, 3, 6, 9, 2, 4, 7, 10, 2, 6, 3, 5, 7, 4, 8, 10,
9, 3, 7, 4, 6, 2, 8, 5],
'Written_Score': [8, 7, 6, 9, 5, 8, 7, 6, 9, 5, 8, 7, 6, 9, 5, 8,
7, 6, 9, 5, 8, 7, 6, 9, 5],
'Interview_Score': [10, 6, 7, 8, 9, 5, 8, 7, 6, 9, 5, 8, 7, 6, 9,
5, 8, 7, 6, 9, 5, 8, 7, 6, 9],
'Selection': [1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0,
1, 0, 1, 0, 1, 0, 1] # 1 for selected, 0 for not selected
}

df = pd.DataFrame(data)

# Save dataset to a .csv file


df.to_csv('candidates_dataset.csv', index=False)

# Load dataset
df = pd.read_csv('candidates_dataset.csv')

# Split dataset into features and target


X = df.drop('Selection', axis=1)
y = df['Selection']
# Split dataset into training and testing sets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Build Bayesian learning model


bayes_model = GaussianNB()

# Train the model


bayes_model.fit(X_train, y_train)

# Make predictions on testing data


y_pred = bayes_model.predict(X_test)

# Calculate classification metrics


accuracy = accuracy_score(y_test, y_pred)
precision = precision_score(y_test, y_pred)
recall = recall_score(y_test, y_pred)
f1 = f1_score(y_test, y_pred)

# Print classification metrics


print("Classification Metrics:")
print("Accuracy:", accuracy)
print("Precision:", precision)
print("Recall:", recall)
print("F1 Score:", f1)

# Predict status for unseen data


unseen_data = pd.DataFrame({
'Graduation_Percentage': [90, 75],
'Experience': [5, 8],
'Written_Score': [8, 7],
'Interview_Score': [10, 6]
})

# Make predictions for unseen data


unseen_predictions = bayes_model.predict(unseen_data)

# Save classification metrics to a .csv file


metrics_data = {
'Metric': ['Accuracy', 'Precision', 'Recall', 'F1 Score'],
'Value': [accuracy, precision, recall, f1]
}

metrics_df = pd.DataFrame(metrics_data)
metrics_df.to_csv('classification_metrics.csv', index=False)

# Save predictions for unseen data to a .csv file


unseen_data['Selection'] = unseen_predictions
unseen_data.to_csv('unseen_predictions.csv', index=False)
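With only 25 rows, the single 80/20 split above leaves just 5 test samples, so the printed metrics can swing widely. As a sanity check, the sketch below cross-validates the same model over the whole dataset; it assumes X and y from the Q2 script are still in scope.

from sklearn.model_selection import cross_val_score
from sklearn.naive_bayes import GaussianNB

# 5-fold cross-validated F1 on the full dataset; averaging over folds
# gives a steadier estimate than a single 5-sample test set.
scores = cross_val_score(GaussianNB(), X, y, cv=5, scoring='f1')
print("F1 per fold:", scores)
print(f"Mean F1: {scores.mean():.2f}")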

Q3
from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split
from sklearn.tree import DecisionTreeClassifier
from sklearn.metrics import accuracy_score, precision_score, recall_score, f1_score

# Load the IRIS dataset


iris = load_iris()
X = iris.data
y = iris.target

# Define function to evaluate model performance


def evaluate_model(X_train, X_test, y_train, y_test):
    clf = DecisionTreeClassifier(criterion='entropy')
    clf.fit(X_train, y_train)
    y_pred = clf.predict(X_test)
    accuracy = accuracy_score(y_test, y_pred)
    precision = precision_score(y_test, y_pred, average='weighted')
    recall = recall_score(y_test, y_pred, average='weighted')
    f1 = f1_score(y_test, y_pred, average='weighted')
    return accuracy, precision, recall, f1

# Vary percentage of training data


percentages = [0.6, 0.7, 0.8, 0.9]
for percentage in percentages:
    X_train, X_test, y_train, y_test = train_test_split(X, y, train_size=percentage, random_state=42)
    accuracy, precision, recall, f1 = evaluate_model(X_train, X_test, y_train, y_test)
    print(f"Percentage of training data: {percentage}")
    print(f"Accuracy: {accuracy:.2f}, Precision: {precision:.2f}, Recall: {recall:.2f}, F1 Score: {f1:.2f}")
    print()

# Explore effect of other decision tree parameters


# Note: this reuses the train/test split from the final iteration of the
# loop above (train_size=0.9).
parameters = {'max_depth': [None, 3, 5, 10], 'min_samples_split': [2, 5, 10]}
for max_depth in parameters['max_depth']:
    for min_samples_split in parameters['min_samples_split']:
        clf = DecisionTreeClassifier(criterion='entropy',
                                     max_depth=max_depth, min_samples_split=min_samples_split)
        clf.fit(X_train, y_train)
        y_pred = clf.predict(X_test)
        accuracy = accuracy_score(y_test, y_pred)
        precision = precision_score(y_test, y_pred, average='weighted')
        recall = recall_score(y_test, y_pred, average='weighted')
        f1 = f1_score(y_test, y_pred, average='weighted')
        print(f"Max Depth: {max_depth}, Min Samples Split: {min_samples_split}")
        print(f"Accuracy: {accuracy:.2f}, Precision: {precision:.2f}, Recall: {recall:.2f}, F1 Score: {f1:.2f}")
        print()
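The manual nested loops above score each parameter combination on a single split. scikit-learn's GridSearchCV cross-validates every combination instead; a minimal sketch using the same estimator and grid:

from sklearn.datasets import load_iris
from sklearn.model_selection import GridSearchCV
from sklearn.tree import DecisionTreeClassifier

# Cross-validated search over the same parameter grid as the loops above.
iris = load_iris()
param_grid = {'max_depth': [None, 3, 5, 10], 'min_samples_split': [2, 5, 10]}
search = GridSearchCV(DecisionTreeClassifier(criterion='entropy'),
                      param_grid, cv=5, scoring='f1_weighted')
search.fit(iris.data, iris.target)
print("Best parameters:", search.best_params_)
print(f"Best cross-validated F1: {search.best_score_:.2f}")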

Q4
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.neighbors import KNeighborsClassifier
from sklearn.naive_bayes import GaussianNB
from sklearn.tree import DecisionTreeClassifier
from sklearn.metrics import accuracy_score, precision_score, recall_score, f1_score

# Load the Classified Data


classified_data = pd.read_csv('classified_data.csv')

# Prepare data
X = classified_data.drop('TARGET CLASS', axis=1)
y = classified_data['TARGET CLASS']
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=42)

# Define functions to evaluate models


def evaluate_knn(n_neighbors):
    clf = KNeighborsClassifier(n_neighbors=n_neighbors)
    clf.fit(X_train, y_train)
    y_pred = clf.predict(X_test)
    accuracy = accuracy_score(y_test, y_pred)
    precision = precision_score(y_test, y_pred)
    recall = recall_score(y_test, y_pred)
    f1 = f1_score(y_test, y_pred)
    return accuracy, precision, recall, f1

def evaluate_nb():
    clf = GaussianNB()
    clf.fit(X_train, y_train)
    y_pred = clf.predict(X_test)
    accuracy = accuracy_score(y_test, y_pred)
    precision = precision_score(y_test, y_pred)
    recall = recall_score(y_test, y_pred)
    f1 = f1_score(y_test, y_pred)
    return accuracy, precision, recall, f1

def evaluate_decision_tree(max_depth, min_samples_split):
    clf = DecisionTreeClassifier(max_depth=max_depth,
                                 min_samples_split=min_samples_split)
    clf.fit(X_train, y_train)
    y_pred = clf.predict(X_test)
    accuracy = accuracy_score(y_test, y_pred)
    precision = precision_score(y_test, y_pred)
    recall = recall_score(y_test, y_pred)
    f1 = f1_score(y_test, y_pred)
    return accuracy, precision, recall, f1

# Vary parameters for each model


knn_parameters = [1, 3, 5, 7, 9]
nb_parameters = []  # GaussianNB has no hyperparameters varied here
decision_tree_parameters = [{'max_depth': None, 'min_samples_split': 2},
                            {'max_depth': 5, 'min_samples_split': 2},
                            {'max_depth': 10, 'min_samples_split': 2}]

# Evaluate models and save results to CSV


results = []
for n_neighbors in knn_parameters:
    accuracy, precision, recall, f1 = evaluate_knn(n_neighbors)
    results.append(['KNN', n_neighbors, accuracy, precision, recall, f1])

accuracy, precision, recall, f1 = evaluate_nb()
results.append(['Naive Bayes', 'N/A', accuracy, precision, recall, f1])

for params in decision_tree_parameters:
    accuracy, precision, recall, f1 = evaluate_decision_tree(
        params['max_depth'], params['min_samples_split'])
    results.append(['Decision Tree',
                    f"Max Depth: {params['max_depth']}, Min Samples Split: {params['min_samples_split']}",
                    accuracy, precision, recall, f1])

# Create DataFrame and save to CSV


df = pd.DataFrame(results, columns=['Model', 'Parameters', 'Accuracy',
                                    'Precision', 'Recall', 'F1 Score'])
df.to_csv('model_comparison_results.csv', index=False)
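Once the comparison file exists, the quickest way to spot the best configuration is to sort it by F1 score. A short sketch, assuming the script above has already written model_comparison_results.csv:

import pandas as pd

# Rank the saved comparison results by F1 score, best first.
results_df = pd.read_csv('model_comparison_results.csv')
print(results_df.sort_values('F1 Score', ascending=False).to_string(index=False))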

The script below generates the classified_data.csv file required by the code above. Note that because both the features and the target labels are random, the classifiers should score close to chance level (around 0.5) on this data.
import pandas as pd
import numpy as np

# Generate random data


np.random.seed(42)
data = pd.DataFrame(np.random.rand(100, 5),
                    columns=['Feature1', 'Feature2', 'Feature3', 'Feature4', 'Feature5'])

# Generate random target class (0 or 1)


data['TARGET CLASS'] = np.random.randint(0, 2, size=len(data))

# Save data to CSV file


data.to_csv('classified_data.csv', index=False)
