1. Implement word count / frequency programs
import string
def word_count(file_path):
    # Initialize an empty dictionary to store word counts
    word_counts = {}
    try:
        # Open the file in read mode
        with open(file_path, 'r') as file:
            # Read the entire content of the file
            text = file.read()
            # Remove punctuation and convert text to lowercase
            text = text.translate(str.maketrans('', '', string.punctuation)).lower()
            # Split the text into individual words
            words = text.split()
            # Count the frequency of each word
            for word in words:
                if word in word_counts:
                    word_counts[word] += 1
                else:
                    word_counts[word] = 1
        return word_counts
    except FileNotFoundError:
        print(f"Error: The file at {file_path} was not found.")
        return None
# Example usage
file_path = 'example.txt'  # Replace this with the path to your text file
word_counts = word_count(file_path)
# Display the word counts if the dictionary is populated
if word_counts is not None:
    for word, count in word_counts.items():
        print(f"{word}: {count}")
Output
2. Implement a Python program that processes a weather dataset
import pandas as pd
# Read CSV file into a pandas DataFrame
df = pd.read_csv('weather.csv')
# Print the DataFrame to see the content
print(df)
Output
3. Implement SVM / Decision tree classification techniques.
3a) SVM
import matplotlib.pyplot as plt
from sklearn import datasets, svm
from sklearn.inspection import DecisionBoundaryDisplay
# import some data to play with
iris = datasets.load_iris()
# Take the first two features. We could avoid this by using a two-dim dataset
X = iris.data[:, :2]
y = iris.target
# We create an instance of SVM and fit our data. We do not scale our
# data since we want to plot the support vectors.
C = 1.0 # SVM regularization parameter
models = (
    svm.SVC(kernel="linear", C=C),
    svm.LinearSVC(C=C, max_iter=10000),
    svm.SVC(kernel="rbf", gamma=0.7, C=C),
    svm.SVC(kernel="poly", degree=3, gamma="auto", C=C),
models = (clf.fit(X, y) for clf in models)
# title for the plots
titles = (
    "SVC with linear kernel",
    "LinearSVC (linear kernel)",
    "SVC with RBF kernel",
    "SVC with polynomial (degree 3) kernel",
# Set-up 2x2 grid for plotting.
fig, sub = plt.subplots(2, 2)
plt.subplots_adjust(wspace=0.4, hspace=0.4)
X0, X1 = X[:, 0], X[:, 1]
for clf, title, ax in zip(models, titles, sub.flatten()):
    disp = DecisionBoundaryDisplay.from_estimator(
        clf,
        X,
        response_method="predict",
        cmap=plt.cm.coolwarm,
        alpha=0.8,
        ax=ax,
        xlabel=iris.feature_names[0],
        ylabel=iris.feature_names[1],
    )
    ax.scatter(X0, X1, c=y, cmap=plt.cm.coolwarm, s=20, edgecolors="k")
    ax.set_xticks(())
    ax.set_yticks(())
    ax.set_title(title)
plt.show()
3b) Decision tree
# Import necessary libraries
from sklearn.datasets import load_iris
from sklearn.tree import DecisionTreeClassifier
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score
# Load the Iris dataset
data = load_iris()
X = data.data # Features
y = data.target # Labels
# Split the data into training and testing sets
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=42)
# Create and train the Decision Tree Classifier with optimized hyperparameters
clf = DecisionTreeClassifier(
    criterion='entropy', # Use 'entropy' for Information Gain
    max_depth=5,            # Limit the depth of the tree
    random_state=42
)
clf.fit(X_train, y_train)
# Make predictions on the test set
y_pred = clf.predict(X_test)
# Evaluate the performance
accuracy = accuracy_score(y_test, y_pred)
print("Accuracy:", accuracy)
# Optional: Visualize the Decision Tree
from sklearn.tree import plot_tree
import matplotlib.pyplot as plt
plt.figure(figsize=(12, 8))
plot_tree(clf, feature_names=data.feature_names, class_names=data.target_names, filled=True)
plt.show()
4. Visualize data using any plotting framework
import seaborn as sns
import matplotlib.pyplot as plt
from sklearn.datasets import load_iris
import pandas as pd
# Load the Iris dataset
data = load_iris()
# Convert it into a pandas DataFrame for easier visualization
df = pd.DataFrame(data.data, columns=data.feature_names)
df['species'] = data.target
df['species'] = df['species'].map({0: 'setosa', 1: 'versicolor', 2: 'virginica'})
# Pairplot to visualize relationships between features
sns.pairplot(df, hue='species', diag_kind='kde', corner=True)
plt.show()
# Heatmap to visualize feature correlations
plt.figure(figsize=(8, 6))
sns.heatmap(df.iloc[:, :-1].corr(), annot=True, cmap='coolwarm')
plt.title("Feature Correlation Heatmap")
plt.show()
# Boxplot to show feature distributions
plt.figure(figsize=(10, 6))
sns.boxplot(data=df.iloc[:, :-1], orient='h', palette='Set2')
plt.title("Boxplot of Features")
plt.show()
# Scatter plot for specific features
plt.figure(figsize=(8, 6))
sns.scatterplot(
    data=df,
    x='sepal length (cm)',
    y='petal length (cm)',
    hue='species',
    style='species',
    palette='deep',
    s=100
)
plt.title("Scatterplot of Sepal Length vs Petal Length")
plt.show()