
# Speech Emotion Recognition (SER) Project - Step-by-Step Code

# STEP 1: Project Setup + Objective


# - Setup folders: data/, models/, utils/, notebooks/
# - Create requirements.txt with basic libraries
# - Create README.md
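# A minimal sketch of the scaffold described above, assuming it is run from the
# project root. Folder names come from the comments; the package list written
# to requirements.txt is an assumption (it mirrors the imports used later).
import os

def create_project_scaffold():
    for folder in ['data', 'models', 'utils', 'notebooks']:
        os.makedirs(folder, exist_ok=True)
    with open('requirements.txt', 'w') as f:
        f.write('\n'.join(['numpy', 'pandas', 'scipy', 'scikit-learn',
                           'matplotlib', 'seaborn', 'tensorflow', 'tqdm',
                           'streamlit']) + '\n')
    with open('README.md', 'w') as f:
        f.write('# Speech Emotion Recognition (SER)\n')

# create_project_scaffold()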

# STEP 2: Dataset Collection & Cleaning


import os
import shutil
import numpy as np
import pandas as pd
from tqdm import tqdm
from scipy.io import wavfile
from scipy.signal import resample
from sklearn.preprocessing import LabelEncoder
from sklearn.model_selection import train_test_split
import matplotlib.pyplot as plt
from sklearn.metrics import classification_report, confusion_matrix
import seaborn as sns
import tensorflow as tf
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Conv1D, MaxPooling1D, LSTM, Dense, Dropout

def create_data_folder():
    os.makedirs('data/RAVDESS', exist_ok=True)
    os.makedirs('data/TESS', exist_ok=True)
    os.makedirs('data/CREMA-D', exist_ok=True)
    print("Folders for datasets created.")

create_data_folder()
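# A small sanity check for the "cleaning" half of this step: count the .wav
# files under each dataset folder so missing or misplaced downloads show up
# early. Folder names match create_data_folder() above; this is only a sketch.
def summarize_datasets(base='data'):
    for name in ['RAVDESS', 'TESS', 'CREMA-D']:
        folder = os.path.join(base, name)
        wav_count = sum(f.endswith('.wav')
                        for _, _, files in os.walk(folder) for f in files)
        print(f"{name}: {wav_count} .wav files")

# summarize_datasets()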

# STEP 3: Audio Preprocessing + Feature Extraction (MFCC replacement)


SAMPLE_RATE = 22050
MAX_LEN = 5 # seconds

def extract_features(file_path):
    try:
        sr, audio = wavfile.read(file_path)
        audio = audio.astype(np.float32)
        if audio.ndim > 1:
            audio = audio[:, 0]  # Convert to mono
        # Pad or truncate to MAX_LEN seconds at the file's own sample rate
        desired_len = sr * MAX_LEN
        if len(audio) > desired_len:
            audio = audio[:desired_len]
        elif len(audio) < desired_len:
            audio = np.pad(audio, (0, desired_len - len(audio)), 'constant')
        # Resample so every clip ends up with the same number of samples
        audio_resampled = resample(audio, SAMPLE_RATE * MAX_LEN)
        # Crude feature vector: mean of consecutive 100-sample frames
        # (trim so the length divides evenly by the frame size)
        usable = (len(audio_resampled) // 100) * 100
        return np.mean(audio_resampled[:usable].reshape(-1, 100), axis=1)
    except Exception as e:
        print(f"Error processing {file_path}: {e}")
        return None

def extract_emotion_label(filename, emotion_map):
    try:
        # RAVDESS-style filenames encode the emotion as the third dash-separated field
        emotion_code = int(filename.split('-')[2])
        return emotion_map.get(emotion_code)
    except (IndexError, ValueError):
        return None

def process_dataset(dataset_path, emotion_map):
    data = []
    for root, _, files in os.walk(dataset_path):
        for file in tqdm(files):
            if file.endswith('.wav'):
                path = os.path.join(root, file)
                emotion = extract_emotion_label(file, emotion_map)
                if emotion:
                    features = extract_features(path)
                    if features is not None:
                        data.append([features, emotion])
    return pd.DataFrame(data, columns=['features', 'label'])

# Emotion map for RAVDESS
ravdess_emotion_map = {
    1: 'neutral', 2: 'calm', 3: 'happy', 4: 'sad',
    5: 'angry', 6: 'fearful', 7: 'disgust', 8: 'surprised'
}
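# Quick illustration of the mapping: in a RAVDESS filename such as
# "03-01-05-01-02-01-12.wav" (hypothetical example) the third dash-separated
# field is the emotion code, so code 5 maps to 'angry'.
# extract_emotion_label('03-01-05-01-02-01-12.wav', ravdess_emotion_map)  # -> 'angry'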

# df_ravdess = process_dataset('data/RAVDESS', ravdess_emotion_map)
# df_ravdess.to_pickle('data/features_ravdess.pkl')
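# The feature above is a crude stand-in for MFCCs (hence "MFCC replacement").
# If librosa is available -- an extra dependency, not imported above -- a real
# MFCC extractor could be dropped in with the same return-shape convention.
# Sketch only:
#
# import librosa
#
# def extract_mfcc(file_path, n_mfcc=40):
#     audio, sr = librosa.load(file_path, sr=SAMPLE_RATE, duration=MAX_LEN)
#     mfcc = librosa.feature.mfcc(y=audio, sr=sr, n_mfcc=n_mfcc)
#     return np.mean(mfcc, axis=1)  # one mean value per MFCC coefficient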

# STEP 4: Label Encoding + Data Split

def load_all_data():
    df_ravdess = pd.read_pickle('data/features_ravdess.pkl')
    df_tess = pd.read_pickle('data/features_tess.pkl')
    df_crema = pd.read_pickle('data/features_crema.pkl')
    df_all = pd.concat([df_ravdess, df_tess, df_crema], ignore_index=True)
    return df_all

data_df = load_all_data()
X = np.array(data_df['features'].tolist())
le = LabelEncoder()  # keep the fitted encoder so class indices map back to emotion names
y = le.fit_transform(data_df['label'])

X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2,
                                                    random_state=42)
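# The Step 7 demo only sees an integer class index, so it helps to persist the
# label names alongside the model. A sketch -- the file path is an assumption:
# np.save('models/label_classes.npy', le.classes_)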

# STEP 5: Model Building - CNN + LSTM


X_train_reshaped = X_train.reshape(X_train.shape[0], X_train.shape[1], 1)
X_test_reshaped = X_test.reshape(X_test.shape[0], X_test.shape[1], 1)

model = Sequential()
model.add(Conv1D(64, kernel_size=3, activation='relu',
input_shape=(X_train.shape[1], 1)))
model.add(MaxPooling1D(pool_size=2))
model.add(Dropout(0.3))
model.add(LSTM(128))
model.add(Dense(64, activation='relu'))
model.add(Dropout(0.3))
model.add(Dense(len(np.unique(y)), activation='softmax'))

model.compile(loss='sparse_categorical_crossentropy', optimizer='adam',
metrics=['accuracy'])
model.summary()
model.fit(X_train_reshaped, y_train, epochs=50, batch_size=32,
validation_split=0.1)
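# Optional guard against overfitting with the fixed 50-epoch budget above: an
# EarlyStopping callback, shown as a sketch (the patience value is an assumption).
# early_stop = tf.keras.callbacks.EarlyStopping(monitor='val_loss', patience=5,
#                                               restore_best_weights=True)
# model.fit(X_train_reshaped, y_train, epochs=50, batch_size=32,
#           validation_split=0.1, callbacks=[early_stop])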

# STEP 6: Evaluation
y_pred = np.argmax(model.predict(X_test_reshaped), axis=1)
print(classification_report(y_test, y_pred))

cm = confusion_matrix(y_test, y_pred, labels=np.arange(len(le.classes_)))
sns.heatmap(cm, annot=True, fmt='d', xticklabels=le.classes_,
            yticklabels=le.classes_)
plt.xlabel('Predicted')
plt.ylabel('True')
plt.title('Confusion Matrix')
plt.show()
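# Per-class recall (diagonal of the confusion matrix over each row sum) as a
# quick complement to the classification report above.
per_class_recall = cm.diagonal() / cm.sum(axis=1)
for name, recall in zip(le.classes_, per_class_recall):
    print(f"{name}: {recall:.2f}")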

# STEP 7: App Demo (Streamlit/Gradio)


# Note: You'd use scipy.io.wavfile + resample here as well
# Save model: model.save("ser_model.h5")

# streamlit_app.py
'''
import streamlit as st
import numpy as np
from scipy.io import wavfile
from scipy.signal import resample
from tensorflow.keras.models import load_model

model = load_model("ser_model.h5")

st.title("Speech Emotion Recognizer")


uploaded_file = st.file_uploader("Upload an audio file", type=[".wav"])

if uploaded_file:
    sr, audio = wavfile.read(uploaded_file)
    audio = audio.astype(np.float32)
    if audio.ndim > 1:
        audio = audio[:, 0]
    # Mirror the training preprocessing: 5 s at the file's own rate, resample
    # to 22050 * 5 samples, then average consecutive 100-sample frames
    desired_len = sr * 5
    audio = np.pad(audio, (0, max(0, desired_len - len(audio))), 'constant')[:desired_len]
    audio = resample(audio, 22050 * 5)
    usable = (len(audio) // 100) * 100
    features = np.mean(audio[:usable].reshape(-1, 100), axis=1).reshape(1, -1, 1)
    prediction = model.predict(features)
    emotion = np.argmax(prediction)  # class index; map back with the LabelEncoder fitted in training
    st.write(f"Predicted Emotion: {emotion}")
'''
# Run using: streamlit run streamlit_app.py
