0% found this document useful (0 votes)

0 views

app.py

This document is a Flask application for text classification using pre-trained machine learning models. It includes routes for classifying individual text inputs and CSV file uploads, where the text is cleaned, vectorized, and predictions are made for labels and subclasses. The results can be displayed on a webpage or downloaded as a new CSV file containing the predictions.

Uploaded by

niraj21it

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

0 views

app.py

Uploaded by

niraj21it

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 7

from flask import Flask, request, render_template, redirect, url_for, send_file

import pandas as pd
import pickle
import os
import re

# Create the Flask application object that the route decorators below attach to.
app = Flask(__name__)


def _load_pickle(path):
    """Return the object unpickled from the binary file at *path*."""
    with open(path, 'rb') as handle:
        return pickle.load(handle)


# Load both prediction models and the vectorizer once, at import time.
# NOTE: unpickling runs arbitrary code, so these files must come from a
# trusted source.
lr_label_model = _load_pickle('models/lr_label_model.pkl')
lr_subclass_model = _load_pickle('models/lr_subclass_model.pkl')
tfidf_vectorizer = _load_pickle('models/tfidf_vectorizer.pkl')

# Patterns are compiled once at import time rather than on every call.
# U+0900-U+097F is the Devanagari Unicode block (the script Marathi is
# written in); everything outside it that is not whitespace is removed.
_NON_DEVANAGARI_RE = re.compile(r'[^\u0900-\u097F\s]')
_WHITESPACE_RUN_RE = re.compile(r'\s+')


def clean_marathi_text(text):
    """Keep only Devanagari characters and single spaces from *text*.

    Args:
        text: The raw input. Anything that is not a ``str`` (for example the
            ``None``/NaN values pandas yields for empty CSV cells) is treated
            as empty text instead of raising ``TypeError``.

    Returns:
        The text with every character outside U+0900-U+097F (other than
        whitespace) removed, runs of whitespace collapsed to one space, and
        leading/trailing whitespace stripped. May be the empty string.
    """
    if not isinstance(text, str):
        return ''

    devanagari_only = _NON_DEVANAGARI_RE.sub('', text)
    # Removing characters can leave gaps of several spaces; collapse them.
    return _WHITESPACE_RUN_RE.sub(' ', devanagari_only).strip()

# Index route for rendering the form
@app.route('/')
def index():
    """Serve the landing page by rendering the ``index.html`` template."""
    landing_page = render_template('index.html')
    return landing_page

# Route for handling text classification
@app.route('/classify-text', methods=['POST'])
def classify_text():
    """Classify the text submitted in the ``text`` form field.

    The submitted text is cleaned with ``clean_marathi_text``, vectorized
    with ``tfidf_vectorizer`` and passed to both models. The first (only)
    prediction of each model is rendered into ``index.html`` together with
    the original, uncleaned text.
    """
    if request.method != 'POST':
        # The route only registers POST, so this is not expected to run;
        # kept so the function still produces no response in that case.
        return None

    raw_text = request.form['text']

    # The vectorizer takes an iterable of documents, hence the 1-item list.
    features = tfidf_vectorizer.transform([clean_marathi_text(raw_text)])

    label = lr_label_model.predict(features)[0]
    subclass = lr_subclass_model.predict(features)[0]

    return render_template(
        'index.html',
        text=raw_text,
        predicted_label=label,
        predicted_subclass=subclass,
    )

# Route for handling CSV uploads
@app.route('/classify-csv', methods=['POST'])
def classify_csv():
    """Classify every row of an uploaded CSV and return the annotated file.

    The upload is read from the ``file`` form field and saved under
    ``uploads/``. Column names are stripped and lower-cased, so the text
    column is matched case-insensitively as ``text``. Three columns are
    added: ``cleaned_text``, ``Predicted_Label`` and ``Predicted_Subclass``.

    Returns:
        * the annotated CSV (``classified_<name>``) as a download on success;
        * a plain-text message with status 400 when the file cannot be
          parsed, has no rows, or has no ``text`` column;
        * a redirect to the index page when no usable filename was sent.
    """
    uploaded_file = request.files['file']

    # The filename is client-controlled: keep only its last path component
    # so values such as "../../app.py" cannot escape the uploads directory.
    # Backslashes are normalised first so Windows-style paths are handled
    # the same way on every platform.
    # NOTE(review): werkzeug.utils.secure_filename is the approach the Flask
    # docs recommend; it is not used here because this file does not
    # import werkzeug directly.
    client_name = (uploaded_file.filename or '').replace('\\', '/')
    safe_name = os.path.basename(client_name)
    if safe_name in ('', '.', '..'):
        return redirect(url_for('index'))

    # Make sure the target directory exists before writing into it.
    os.makedirs('uploads', exist_ok=True)
    file_path = os.path.join('uploads', safe_name)
    uploaded_file.save(file_path)

    # Only the parse step is guarded; empty files and undecodable bytes are
    # reported as a client error just like malformed CSV.
    try:
        df = pd.read_csv(file_path)
    except (pd.errors.ParserError, pd.errors.EmptyDataError,
            UnicodeDecodeError) as e:
        return f"Error reading the CSV file: {e}", 400

    # Normalize the column names: strip whitespace and convert to lower case.
    df.columns = df.columns.str.strip().str.lower()

    if 'text' not in df.columns:
        return "Error: 'Text' column not found in the uploaded CSV.", 400

    if df.empty:
        # Nothing to classify; avoid handing zero samples to the models.
        return "Error: the uploaded CSV contains no rows.", 400

    # Empty cells arrive as NaN (a float); coerce every cell to str so the
    # regex-based cleaner never receives a non-string value.
    df['cleaned_text'] = (
        df['text'].fillna('').astype(str).apply(clean_marathi_text)
    )
    features = tfidf_vectorizer.transform(df['cleaned_text'])

    # Predict using both models
    df['Predicted_Label'] = lr_label_model.predict(features)
    df['Predicted_Subclass'] = lr_subclass_model.predict(features)

    # Save the result to a new CSV file
    output_file = os.path.join('uploads', 'classified_' + safe_name)
    df.to_csv(output_file, index=False)

    # Pass an absolute path so the file that is sent is the one just written,
    # however send_file resolves relative paths.
    return send_file(os.path.abspath(output_file), as_attachment=True)

# Run the app
if __name__ == "__main__":
    # Start Flask's built-in server only when this file is executed directly.
    # NOTE(review): debug=True is hard-coded — confirm this entry point is
    # never used for a deployed instance.
    app.run(debug=True)

# from flask import Flask, request, render_template, redirect, url_for, send_file
# import pandas as pd
# import pickle
# import os
#
# # Initialize Flask app
# app = Flask(__name__)
#
# # Load models and vectorizer
# with open('models/lr_label_model.pkl', 'rb') as label_model_file:
# lr_label_model = pickle.load(label_model_file)
#
# with open('models/lr_subclass_model.pkl', 'rb') as subclass_model_file:
# lr_subclass_model = pickle.load(subclass_model_file)
#
# with open('models/tfidf_vectorizer.pkl', 'rb') as vectorizer_file:
# tfidf_vectorizer = pickle.load(vectorizer_file)
#
# # Index route for rendering the form
# @app.route('/')
# def index():
# return render_template('index.html')
#
# # Route for handling text classification
# @app.route('/classify-text', methods=['POST'])
# def classify_text():
# if request.method == 'POST':
# # Get the text input from the form
# input_text = request.form['text']
#
# # Preprocess and vectorize input text
# input_text_cleaned = clean_marathi_text(input_text)
# input_vectorized = tfidf_vectorizer.transform([input_text_cleaned])
#
# # Predict using both models
# label_prediction = lr_label_model.predict(input_vectorized)[0]
# subclass_prediction = lr_subclass_model.predict(input_vectorized)[0]
#
# # Display results
# return render_template('index.html', text=input_text,
# predicted_label=label_prediction,
# predicted_subclass=subclass_prediction)
#
# # Route for handling CSV uploads
# @app.route('/classify-csv', methods=['POST'])
# def classify_csv():
# if request.method == 'POST':
# # Check if a file is uploaded
# uploaded_file = request.files['file']
# if uploaded_file.filename != '':
# # Save the uploaded file
# file_path = os.path.join('uploads', uploaded_file.filename)
# uploaded_file.save(file_path)
#
# # Read the uploaded CSV file
# df = pd.read_csv(file_path)
#
# # Clean and vectorize the text data
# df['cleaned_text'] = df['Text'].apply(clean_marathi_text)
# X_vectorized = tfidf_vectorizer.transform(df['cleaned_text'])
#
# # Predict using both models
# df['Predicted_Label'] = lr_label_model.predict(X_vectorized)
# df['Predicted_Subclass'] = lr_subclass_model.predict(X_vectorized)
#
# # Save the result to a new CSV file
# output_file = os.path.join('uploads', 'classified_' + uploaded_file.filename)
# df.to_csv(output_file, index=False)
#
# # Provide the file for download
# return send_file(output_file, as_attachment=True)
#
# return redirect(url_for('index'))
#
# # Function to clean Marathi text
# def clean_marathi_text(text):
# import re
# # Use a regular expression to remove anything that is not a Marathi character
# marathi_only = re.sub(r'[^\u0900-\u097F\s]', '', text) # Unicode range for Marathi characters
# marathi_only = re.sub(r'\s+', ' ', marathi_only).strip() # Remove extra spaces
# return marathi_only
#
# # Run the app
# if __name__ == "__main__":
# app.run(debug=True)

# from flask import Flask, render_template, request, redirect, url_for, send_file
# import pandas as pd
# import pickle
# from sklearn.feature_extraction.text import TfidfVectorizer
# from sklearn.linear_model import LogisticRegression
# import re
# import matplotlib.pyplot as plt
# import os
#
# # Load pre-trained models and vectorizer
# with open('lr_label_model.pkl', 'rb') as label_file:
# lr_label = pickle.load(label_file)
#
# with open('lr_subclass_model.pkl', 'rb') as subclass_file:
# lr_subclass = pickle.load(subclass_file)
#
# with open('tfidf_vectorizer.pkl', 'rb') as vectorizer_file:
# tfidf_vectorizer = pickle.load(vectorizer_file)
#
# # Initialize Flask app
# app = Flask(__name__)
#
# # Function to clean and process text (removing non-Marathi characters)
# def clean_marathi_text(text):
# marathi_only = re.sub(r'[^\u0900-\u097F\s]', '', text)
# marathi_only = re.sub(r'\s+', ' ', marathi_only).strip()
# return marathi_only
#
# # Function to predict label and subclass
# def predict_hate_speech(text):
# cleaned_text = clean_marathi_text(text)
# vectorized_text = tfidf_vectorizer.transform([cleaned_text])
# label_pred = lr_label.predict(vectorized_text)[0]
# subclass_pred = lr_subclass.predict(vectorized_text)[0] if label_pred == 1 else 0
# return label_pred, subclass_pred
#
# # Route for the home page
# @app.route('/')
# def index():
# return render_template('index.html')
#
# # Route to handle text input and CSV file uploads
# @app.route('/predict', methods=['POST'])
# def predict():
# if 'text_input' in request.form and request.form['text_input']:
# # Single text input prediction
# text_input = request.form['text_input']
# label_pred, subclass_pred = predict_hate_speech(text_input)
# return render_template('result.html', text=text_input, label=label_pred, subclass=subclass_pred)
#
# elif 'file' in request.files and request.files['file'].filename.endswith('.csv'):
# # CSV file input prediction
# file = request.files['file']
# df = pd.read_csv(file)
#
# # Clean the text column
# df['cleaned_text'] = df['Text'].apply(clean_marathi_text)
#
# # Vectorize and make predictions
# X_tfidf = tfidf_vectorizer.transform(df['cleaned_text'])
# df['Hate_Speech_Classification'] = lr_label.predict(X_tfidf)
# df['Subclass_Prediction'] = df['Hate_Speech_Classification'].apply(lambda x: lr_subclass.predict([X_tfidf[i]])[0] if x == 1 else 0 for i in range(len(X_tfidf)))
#
# # Save results as a new CSV file
# output_file = 'predictions_output.csv'
# df.to_csv(output_file, index=False)
#
# # Generate a pie chart for subclass distribution
# subclass_counts = df['Subclass_Prediction'].value_counts()
# labels = [f'Subclass {i}' for i in subclass_counts.index]
# plt.figure(figsize=(8, 6))
# plt.pie(subclass_counts, labels=labels, autopct='%1.1f%%', startangle=140, colors=plt.cm.Paired.colors)
# plt.title('Subclass Distribution of Hate Speech Predictions')
# pie_chart_file = 'subclass_distribution.png'
# plt.savefig(pie_chart_file)
#
# # Return the downloadable CSV and show the pie chart
# return render_template('result.html', csv_file=output_file, pie_chart=pie_chart_file)
#
# else:
# return redirect(url_for('index'))
#
# # Route to download the generated CSV
# @app.route('/download/<filename>')
# def download(filename):
# return send_file(filename, as_attachment=True)
#
# # Start the Flask app
# if __name__ == '__main__':
# app.run(debug=True)

Introduction To Geotechnical Grouting
No ratings yet
Introduction To Geotechnical Grouting
39 pages
Masculinity Report, USA 2018: Executive Summary
No ratings yet
Masculinity Report, USA 2018: Executive Summary
10 pages
Mainpy (Customer Segmentation)
No ratings yet
Mainpy (Customer Segmentation)
6 pages
Views - Py Forlder
No ratings yet
Views - Py Forlder
8 pages
Streamlit PDF Application Setup All Commands in One Single File
No ratings yet
Streamlit PDF Application Setup All Commands in One Single File
8 pages
code
No ratings yet
code
13 pages
Medical Text Classifier GabrieldeOlaguibel
No ratings yet
Medical Text Classifier GabrieldeOlaguibel
12 pages
app
No ratings yet
app
7 pages
Python Day 14 (Typed Notes) - Data Extraction Test Cases
No ratings yet
Python Day 14 (Typed Notes) - Data Extraction Test Cases
3 pages
1 - Sentiment - Analysis - NLP - Ipynb - Codes Only
No ratings yet
1 - Sentiment - Analysis - NLP - Ipynb - Codes Only
5 pages
QA_Using_Gemini_Langchain_ChromaDB_PDF
No ratings yet
QA_Using_Gemini_Langchain_ChromaDB_PDF
2 pages
Loading and Saving Data
No ratings yet
Loading and Saving Data
5 pages
Da Programs
No ratings yet
Da Programs
10 pages
Data Gathering
No ratings yet
Data Gathering
7 pages
Deepxplore Implementation
No ratings yet
Deepxplore Implementation
5 pages
Shreya Srivastava-27
No ratings yet
Shreya Srivastava-27
3 pages
Creating Deep Learning Model in vs Code
No ratings yet
Creating Deep Learning Model in vs Code
5 pages
Sourcecode
No ratings yet
Sourcecode
16 pages
Codes
No ratings yet
Codes
37 pages
تجربة كود
No ratings yet
تجربة كود
3 pages
Data Analyzing AI Web App
No ratings yet
Data Analyzing AI Web App
3 pages
10 Realtime Python Automation Scripts
100% (2)
10 Realtime Python Automation Scripts
12 pages
6 - Text Vectorization-CSC688-SP22
No ratings yet
6 - Text Vectorization-CSC688-SP22
5 pages
My_own_cheatsheet
No ratings yet
My_own_cheatsheet
13 pages
Backup Code
No ratings yet
Backup Code
4 pages
Python Lab ALL 10 Prgms
No ratings yet
Python Lab ALL 10 Prgms
16 pages
csv files
No ratings yet
csv files
22 pages
Data Visualization EDA-print
No ratings yet
Data Visualization EDA-print
18 pages
Multi Classification.py(for 1 Class Tp,Tn,Fp,Fn)
No ratings yet
Multi Classification.py(for 1 Class Tp,Tn,Fp,Fn)
25 pages
Sentiment Analysis
No ratings yet
Sentiment Analysis
2 pages
Self Evaluation Exercises (1)
No ratings yet
Self Evaluation Exercises (1)
12 pages
XX
No ratings yet
XX
4 pages
ENEL2CM Assignment 2 (2025)
No ratings yet
ENEL2CM Assignment 2 (2025)
15 pages
Data Migration Steps
No ratings yet
Data Migration Steps
13 pages
complete Django Cheat Sheet
No ratings yet
complete Django Cheat Sheet
17 pages
Source Code Python Jemmy
No ratings yet
Source Code Python Jemmy
7 pages
DL ex4
No ratings yet
DL ex4
5 pages
IR 4 E-Mail Spam Filtering Spam - Dataset
No ratings yet
IR 4 E-Mail Spam Filtering Spam - Dataset
2 pages
IFM GROUP2 CODE
No ratings yet
IFM GROUP2 CODE
7 pages
spark_code
No ratings yet
spark_code
1 page
Code
No ratings yet
Code
4 pages
Computer Science-CLASS-12-RECORD PROGRAMS
No ratings yet
Computer Science-CLASS-12-RECORD PROGRAMS
10 pages
pr10_fam
No ratings yet
pr10_fam
3 pages
Wine - Data2.py: Import As Import As Def
No ratings yet
Wine - Data2.py: Import As Import As Def
2 pages
MACHINE LEARNING manual
No ratings yet
MACHINE LEARNING manual
36 pages
Codigo base stocks prediction LSTM Thushan GAnegedara
No ratings yet
Codigo base stocks prediction LSTM Thushan GAnegedara
3 pages
EDS - Python Cheat Sheet
No ratings yet
EDS - Python Cheat Sheet
3 pages
imp programs[1]
No ratings yet
imp programs[1]
8 pages
Pattern Recognition
No ratings yet
Pattern Recognition
26 pages
TechReport_2014_LANL_LA-UR-14-25267_CraneMartz
No ratings yet
TechReport_2014_LANL_LA-UR-14-25267_CraneMartz
66 pages
Assignment 10
No ratings yet
Assignment 10
2 pages
Sahil Malhotra 16 BCE 0113 Web Mining L51+L52: 1. Universal Crawling 1.1. CODE
No ratings yet
Sahil Malhotra 16 BCE 0113 Web Mining L51+L52: 1. Universal Crawling 1.1. CODE
11 pages
10 Python Automation Scripts
No ratings yet
10 Python Automation Scripts
8 pages
Assignment 10
No ratings yet
Assignment 10
2 pages
Abusive_Language_Detection_Chatbot_Project_Summary_Detailed
No ratings yet
Abusive_Language_Detection_Chatbot_Project_Summary_Detailed
6 pages
bda_hubapi
No ratings yet
bda_hubapi
2 pages
cymbal_ingest_to_vector_database_all_steps
No ratings yet
cymbal_ingest_to_vector_database_all_steps
6 pages
R语言基础入门指令 (tips)
No ratings yet
R语言基础入门指令 (tips)
14 pages
Economist Old Edition
No ratings yet
Economist Old Edition
7 pages
Electricity Price Forecasting Project Code
No ratings yet
Electricity Price Forecasting Project Code
5 pages
Angular Generative AI: Building an intelligent CV enhancer with Google Gemini
From Everand
Angular Generative AI: Building an intelligent CV enhancer with Google Gemini
Abdelfattah Ragab
No ratings yet
Firebase Storage for Angular: A reliable file upload solution for your applications
From Everand
Firebase Storage for Angular: A reliable file upload solution for your applications
Abdelfattah Ragab
No ratings yet
TIP-COURSE - Mam Loren Francisco1
No ratings yet
TIP-COURSE - Mam Loren Francisco1
67 pages
The Dedekind/Peano Axioms
No ratings yet
The Dedekind/Peano Axioms
3 pages
Losh Diagram
No ratings yet
Losh Diagram
2 pages
Pollution Under Control Certificate: Form 59
No ratings yet
Pollution Under Control Certificate: Form 59
1 page
Lispector Smallest Woman
No ratings yet
Lispector Smallest Woman
8 pages
DLP For Topic 1 in English 8 Quarter 3 Module 4 Week 5
No ratings yet
DLP For Topic 1 in English 8 Quarter 3 Module 4 Week 5
11 pages
Cambridge IGCSE & O Level: Complete
No ratings yet
Cambridge IGCSE & O Level: Complete
12 pages
158-Article Text-546-1-10-20180411
No ratings yet
158-Article Text-546-1-10-20180411
10 pages
2022 Parking Solution Brochure Preview
No ratings yet
2022 Parking Solution Brochure Preview
20 pages
G7 Changing Earth 2024-25 Notes
No ratings yet
G7 Changing Earth 2024-25 Notes
5 pages
Products List
No ratings yet
Products List
5 pages
Lab Technician Vacancy Repro Toxys 20241029
No ratings yet
Lab Technician Vacancy Repro Toxys 20241029
1 page
The Effect of Negative Excess Pore-Water Pressure On The Stability
No ratings yet
The Effect of Negative Excess Pore-Water Pressure On The Stability
34 pages
Final Exam Study Guide: Courtney Lockley
No ratings yet
Final Exam Study Guide: Courtney Lockley
2 pages
Brochure
No ratings yet
Brochure
19 pages
Admission Circular For MDS-Professional 2024-25
No ratings yet
Admission Circular For MDS-Professional 2024-25
3 pages
May 2809
100% (1)
May 2809
52 pages
Senior High School Stand Alone: Grade 11-JUPITER-E (Science Technology Engineering Mathematics)
No ratings yet
Senior High School Stand Alone: Grade 11-JUPITER-E (Science Technology Engineering Mathematics)
6 pages
Purposive Communication (Module 4)
No ratings yet
Purposive Communication (Module 4)
3 pages
Astm C14 PDF
0% (1)
Astm C14 PDF
4 pages
Aygo X NAV RHD PZ41C 90330 00 AIM 003 194 3
No ratings yet
Aygo X NAV RHD PZ41C 90330 00 AIM 003 194 3
12 pages
Heidegger The Problem of Reality in Modern Philosophy
100% (1)
Heidegger The Problem of Reality in Modern Philosophy
9 pages
Sap Media List
No ratings yet
Sap Media List
2 pages
ĐỀ KIỂM TRA CHẤT LƯỢNG HỌC KÌ 2 2023- 2024
No ratings yet
ĐỀ KIỂM TRA CHẤT LƯỢNG HỌC KÌ 2 2023- 2024
4 pages
Of Indian Standard Specifications On Dimensional Metrology: 1. Precision Measuring Equipment
No ratings yet
Of Indian Standard Specifications On Dimensional Metrology: 1. Precision Measuring Equipment
2 pages
EIA - PHWR Atomic Power Project
No ratings yet
EIA - PHWR Atomic Power Project
402 pages
EIT Food Impact Funding Framework Single Projects
No ratings yet
EIT Food Impact Funding Framework Single Projects
21 pages
Tutorial 02
No ratings yet
Tutorial 02
6 pages

app.py

Uploaded by

app.py

Uploaded by

from flask import Flask, request, render_template, redirect, url_for, send_file

# Initialize Flask app

# Load models and vectorizer

with open('models/lr_subclass_model.pkl', 'rb') as subclass_model_file:

with open('models/tfidf_vectorizer.pkl', 'rb') as vectorizer_file:

# Function to clean Marathi text

# Index route for rendering the form

# Route for handling text classification

# Preprocess and vectorize input text

# Predict using both models

# Route for handling CSV uploads

# Read the uploaded CSV file

# Normalize the column names

# Predict using both models

# Save the result to a new CSV file

# Provide the file for download

# Run the app

# from flask import Flask, request, render_template, redirect, url_for,

# from flask import Flask, render_template, request, redirect, url_for,

You might also like